本文整理汇总了Python中mrjob.util.bash_wrap函数的典型用法代码示例。如果您正苦于以下问题:Python bash_wrap函数的具体用法?Python bash_wrap怎么用?Python bash_wrap使用的例子?那么恭喜您,这里精选的函数代码示例或许可以为您提供帮助。
在下文中一共展示了bash_wrap函数的12个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于我们的系统推荐出更棒的Python代码示例。
示例1: _hadoop_streaming_commands
def _hadoop_streaming_commands(self, step_num):
    """Build the mapper, combiner and reducer commands for one step.

    Each substep is rendered with ``self._render_substep()``, which yields
    the command together with a flag saying whether the command has to be
    passed through ``bash_wrap()``.  When a combiner is present but
    ``supports_combiners_in_hadoop_streaming()`` rejects the version
    reported by ``self.get_hadoop_version()``, the combiner is folded into
    the mapper as a shell pipeline and no separate combiner is returned.

    :param step_num: number of the step, forwarded to ``_render_substep()``.
    :return: a ``(mapper, combiner, reducer)`` tuple of commands.
    """
    hadoop_version = self.get_hadoop_version()

    # Hadoop streaming stuff: (command, needs-bash-wrap) for every substep.
    map_cmd, wrap_map = self._render_substep(step_num, 'mapper')
    comb_cmd, wrap_comb = self._render_substep(step_num, 'combiner')
    red_cmd, wrap_red = self._render_substep(step_num, 'reducer')

    combiner_unsupported = (
        comb_cmd is not None and
        not supports_combiners_in_hadoop_streaming(hadoop_version))

    if combiner_unsupported:
        # Hack to support combiners on Hadoop < 0.20: pipe the mapper's
        # output through sort and then the combiner.  The pipeline needs a
        # shell to run it, hence the forced wrap.
        map_cmd = "%s | sort | %s" % (map_cmd, comb_cmd)
        wrap_map = True

        # Take the combiner away; Hadoop would only be confused by it.
        comb_cmd, wrap_comb = None, False

    return (
        bash_wrap(map_cmd) if wrap_map else map_cmd,
        bash_wrap(comb_cmd) if wrap_comb else comb_cmd,
        bash_wrap(red_cmd) if wrap_red else red_cmd,
    )
开发者ID:parastoo-62,项目名称:mrjob,代码行数:34,代码来源:runner.py
示例2: steps
def steps(self):
    """Build one step per entry of ``self.options.steps``.

    Every ``"mapper"``, ``"combiner"`` or ``"reducer"`` entry found in a
    step description is run through ``bash_wrap()`` and handed to
    ``MRStep`` as the matching ``*_cmd`` keyword argument; entries that are
    absent are simply left out.

    :return: list of the steps built by ``MRStep``, in option order.
    """
    # (key in the step description, keyword argument for MRStep)
    cmd_kwarg_names = (
        ("mapper", "mapper_cmd"),
        ("combiner", "combiner_cmd"),
        ("reducer", "reducer_cmd"),
    )

    def build_step(spec):
        wrapped = {}
        for substep, kwarg in cmd_kwarg_names:
            if substep in spec:
                wrapped[kwarg] = bash_wrap(spec[substep])
        return MRStep(**wrapped)

    return [build_step(spec) for spec in self.options.steps]
开发者ID:hophacker,项目名称:mrjob,代码行数:12,代码来源:mr_cmd.py
示例3: steps
def steps(self):
    """Turn each entry of ``self.options.steps`` into a step via ``self.mr``.

    For every step description, the ``'mapper'``, ``'combiner'`` and
    ``'reducer'`` entries that are present are passed through
    ``bash_wrap()`` and forwarded to ``self.mr()`` as ``mapper_cmd``,
    ``combiner_cmd`` and ``reducer_cmd`` respectively.

    :return: list of whatever ``self.mr()`` returned, in option order.
    """
    # (key in the step description, keyword argument for self.mr)
    substep_kwargs = (
        ('mapper', 'mapper_cmd'),
        ('combiner', 'combiner_cmd'),
        ('reducer', 'reducer_cmd'),
    )

    built = []
    for spec in self.options.steps:
        cmd_kwargs = {}
        for substep, kwarg in substep_kwargs:
            if substep in spec:
                cmd_kwargs[kwarg] = bash_wrap(spec[substep])
        built.append(self.mr(**cmd_kwargs))
    return built
开发者ID:Anihc,项目名称:mrjob,代码行数:12,代码来源:mr_cmd.py
示例4: _hadoop_streaming_commands
def _hadoop_streaming_commands(self, step_num):
    """Return the ``(mapper, combiner, reducer)`` commands for one step.

    ``self._render_substep()`` is asked for each substep in turn and yields
    a command plus a flag; commands whose flag is true are passed through
    ``bash_wrap()`` before being returned.

    :param step_num: number of the step, forwarded to ``_render_substep()``.
    :return: a 3-tuple ``(mapper, combiner, reducer)``.
    """
    # Hadoop streaming stuff: render all three substeps first ...
    rendered = []
    for substep in ("mapper", "combiner", "reducer"):
        command, needs_wrap = self._render_substep(step_num, substep)
        rendered.append((command, needs_wrap))

    # ... then wrap the ones that asked for it, in the same order.
    mapper, combiner, reducer = [
        bash_wrap(command) if needs_wrap else command
        for command, needs_wrap in rendered
    ]
    return mapper, combiner, reducer
开发者ID:irskep,项目名称:mrjob,代码行数:18,代码来源:runner.py
示例5: test_pre_filter_escaping
def test_pre_filter_escaping(self):
    """Check how a bash-wrapped ``pre_filter`` is quoted in ``-mapper``.

    The step description and the expected streaming arguments are handed
    to ``self._assert_streaming_step()``, which performs the comparison.
    """
    # ESCAPE ALL THE THINGS!!!
    pre_filter = bash_wrap("grep 'anything'")
    step = {
        "type": "streaming",
        "mapper": {"type": "script", "pre_filter": pre_filter},
    }

    # The pre-filter ends up nested inside two levels of bash -c quoting.
    mapper_cmd = (
        "bash -c 'bash -c '\\''grep"
        " '\\''\\'\\'''\\''anything'\\''\\'\\'''\\'''\\'' |"
        " python my_job.py --step-num=0 --mapper'"
    )
    expected_args = [
        "-mapper",
        mapper_cmd,
        "-jobconf",
        "mapred.reduce.tasks=0",
    ]

    self._assert_streaming_step(step, expected_args)
开发者ID:swiftserve,项目名称:mrjob,代码行数:13,代码来源:test_hadoop.py
示例6: _hadoop_streaming_commands
def _hadoop_streaming_commands(self, step_num):
    """Return the ``(mapper, combiner, reducer)`` commands for one step.

    Each substep is rendered with ``self._render_substep()``, which yields
    the command and a flag; a command whose flag is true is passed through
    ``bash_wrap()`` before being returned.

    :param step_num: number of the step, forwarded to ``_render_substep()``.
    :return: a 3-tuple ``(mapper, combiner, reducer)``.
    """
    # The version itself is not needed here, so it is no longer bound to a
    # local.  The call is kept only in case it has side effects (e.g.
    # detecting/caching the version) -- TODO confirm and remove if it is pure.
    self.get_hadoop_version()

    # Hadoop streaming stuff
    mapper, bash_wrap_mapper = self._render_substep(step_num, 'mapper')
    combiner, bash_wrap_combiner = self._render_substep(step_num, 'combiner')
    reducer, bash_wrap_reducer = self._render_substep(step_num, 'reducer')

    if bash_wrap_mapper:
        mapper = bash_wrap(mapper)

    if bash_wrap_combiner:
        combiner = bash_wrap(combiner)

    if bash_wrap_reducer:
        reducer = bash_wrap(reducer)

    return mapper, combiner, reducer
开发者ID:Milkigit,项目名称:mrjob,代码行数:23,代码来源:runner.py
示例7: test_pre_filter_escaping
def test_pre_filter_escaping(self):
    """Check how a bash-wrapped ``pre_filter`` is quoted in ``-mapper``.

    Delegates the actual comparison to ``self._assert_streaming_step()``,
    giving it the step description and the expected streaming arguments.
    """
    # ESCAPE ALL THE THINGS!!!
    mapper = {
        'type': 'script',
        'pre_filter': bash_wrap("grep 'anything'"),
    }
    step = {'type': 'streaming', 'mapper': mapper}

    expected_args = [
        '-mapper',
        # the already-wrapped pre-filter gets quoted a second time
        "bash -c 'bash -c '\\''grep"
        " '\\''\\'\\'''\\''anything'\\''\\'\\'''\\'''\\'' |"
        " python my_job.py --step-num=0 --mapper'",
        '-jobconf',
        'mapred.reduce.tasks=0',
    ]

    self._assert_streaming_step(step, expected_args)
开发者ID:DepengLuan,项目名称:mrjob,代码行数:15,代码来源:test_hadoop.py
示例8: test_pre_filter_escaping
def test_pre_filter_escaping(self):
    """Check the ``-mapper`` argument built for a bash-wrapped pre_filter.

    Installs a single streaming step on ``self.runner`` and compares
    ``self.runner._args_for_streaming_step(0)`` with the expected argument
    list.
    """
    # ESCAPE ALL THE THINGS!!!
    mapper = {
        'type': 'script',
        'pre_filter': bash_wrap("grep 'anything'"),
    }
    self.runner._steps = [{'type': 'streaming', 'mapper': mapper}]

    actual_args = self.runner._args_for_streaming_step(0)

    # The pre-filter ends up nested inside two levels of bash -c quoting.
    mapper_cmd = (
        "bash -c 'bash -c '\\''grep"
        " '\\''\\'\\'''\\''anything'\\''\\'\\'''\\'''\\'' | " +
        PYTHON_BIN +
        " my_job.py --step-num=0 --mapper'")
    expected_args = (
        self.BASIC_HADOOP_ARGS + ['-D', 'mapreduce.job.reduces=0'] +
        self.BASIC_JOB_ARGS + ['-mapper', mapper_cmd])

    self.assertEqual(actual_args, expected_args)
开发者ID:Milkigit,项目名称:mrjob,代码行数:21,代码来源:test_hadoop.py
示例9: test_multiple
def test_multiple(self):
    """Run a ``CmdJob`` with mapper, combiner and reducer commands.

    Verifies the step description reported by the runner and then the
    output produced by actually running the job on the local runner.
    """
    stdin_data = 'x\nx\nx\nx\nx\nx\n'
    mapper_cmd = 'cat -e'
    reducer_cmd = bash_wrap('wc -l | tr -Cd "[:digit:]"')

    argv = ['--runner', 'local']
    argv += ['--mapper-cmd', mapper_cmd]
    argv += ['--combiner-cmd', 'uniq']
    argv += ['--reducer-cmd', reducer_cmd]

    job = CmdJob(argv)
    job.sandbox(stdin=StringIO(stdin_data))

    # All three commands should be reported as plain 'command' substeps.
    expected_step = {
        'type': 'streaming',
        'mapper': {'type': 'command', 'command': mapper_cmd},
        'combiner': {'type': 'command', 'command': 'uniq'},
        'reducer': {'type': 'command', 'command': reducer_cmd},
    }

    with job.make_runner() as runner:
        self.assertEqual(runner._get_steps(), [expected_step])

        runner.run()

        self.assertEqual(list(runner.stream_output()), ['2'])
开发者ID:eklitzke,项目名称:mrjob,代码行数:23,代码来源:test_local.py
示例10: test_multiple
def test_multiple(self):
    """Run a ``CmdJob`` with mapper, combiner and reducer commands.

    Bytes flavour of the test: stdin is a ``BytesIO`` and the expected
    output is a bytes string.  Checks the runner's step description first,
    then the output of the job on the local runner.
    """
    mapper_cmd = "cat -e"
    reducer_cmd = bash_wrap('wc -l | tr -Cd "[:digit:]"')

    cli_args = [
        "--runner", "local",
        "--mapper-cmd", mapper_cmd,
        "--combiner-cmd", "uniq",
        "--reducer-cmd", reducer_cmd,
    ]
    job = CmdJob(cli_args)
    job.sandbox(stdin=BytesIO(b"x\nx\nx\nx\nx\nx\n"))

    with job.make_runner() as runner:
        described_steps = runner._get_steps()
        # All three commands should be reported as plain "command" substeps.
        self.assertEqual(
            described_steps,
            [
                {
                    "type": "streaming",
                    "mapper": {"type": "command", "command": mapper_cmd},
                    "combiner": {"type": "command", "command": "uniq"},
                    "reducer": {"type": "command", "command": reducer_cmd},
                }
            ],
        )

        runner.run()

        output = list(runner.stream_output())
        self.assertEqual(output, [b"2"])
开发者ID:alanhdu,项目名称:mrjob,代码行数:24,代码来源:test_local.py
示例11: reducer_cmd
def reducer_cmd(self):
    """Return the reducer command, ``./wordcount.sh reducer``, bash-wrapped."""
    command = './wordcount.sh reducer'
    return bash_wrap(command)
开发者ID:Anihc,项目名称:mrjob,代码行数:2,代码来源:BashWordcount.py
示例12: mapper_cmd
def mapper_cmd(self):
    """Return the mapper command, ``./wordcount.sh mapper``, bash-wrapped."""
    command = './wordcount.sh mapper'
    return bash_wrap(command)
开发者ID:Anihc,项目名称:mrjob,代码行数:2,代码来源:BashWordcount.py
注:本文中的mrjob.util.bash_wrap函数示例由纯净天空整理自GitHub/MSDocs等源码及文档管理平台,相关代码片段筛选自各路编程大神贡献的开源项目,源码版权归原作者所有,传播和使用请参考对应项目的License;未经允许,请勿转载。
请发表评论