当前位置: 首页>>代码示例>>Python>>正文


Python util.bash_wrap函数代码示例

本文整理汇总了 Python 中 mrjob.util.bash_wrap 函数的典型用法代码示例。如果您正苦于以下问题:Python bash_wrap 函数的具体用法是什么?Python bash_wrap 怎么用?有哪些 Python bash_wrap 的使用示例?那么恭喜您,这里精选的函数代码示例或许可以为您提供帮助。


在下文中一共展示了 bash_wrap 函数的 12 个代码示例,这些示例默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的 Python 代码示例。

示例1: _hadoop_streaming_commands

    def _hadoop_streaming_commands(self, step_num):
        """Return the ``(mapper, combiner, reducer)`` commands for a step.

        Each command comes from ``self._render_substep``, which yields the
        command together with a flag saying whether it has to be passed
        through ``bash_wrap``.

        When a combiner exists but
        ``supports_combiners_in_hadoop_streaming`` rejects the detected
        Hadoop version, the combiner is folded into the mapper as a
        ``mapper | sort | combiner`` pipeline and ``None`` is returned in
        the combiner slot.
        """
        version = self.get_hadoop_version()

        mapper, wrap_mapper = self._render_substep(step_num, 'mapper')
        combiner, wrap_combiner = self._render_substep(step_num, 'combiner')
        reducer, wrap_reducer = self._render_substep(step_num, 'reducer')

        # Only consult the version check when there is a combiner at all.
        fold_combiner_into_mapper = (
            combiner is not None and
            not supports_combiners_in_hadoop_streaming(version))

        if fold_combiner_into_mapper:
            # Workaround for Hadoop <0.20: emulate the combiner inside the
            # mapper. A pipeline needs a shell, so force bash wrapping.
            mapper = "%s | sort | %s" % (mapper, combiner)
            wrap_mapper = True

            # Hide the combiner from Hadoop, which would not know what to
            # do with it.
            combiner, wrap_combiner = None, False

        mapper = bash_wrap(mapper) if wrap_mapper else mapper
        combiner = bash_wrap(combiner) if wrap_combiner else combiner
        reducer = bash_wrap(reducer) if wrap_reducer else reducer

        return mapper, combiner, reducer
开发者ID:parastoo-62,项目名称:mrjob,代码行数:34,代码来源:runner.py

示例2: steps

 def steps(self):
     """Build one ``MRStep`` per entry of ``self.options.steps``.

     For each of "mapper", "combiner" and "reducer" present in an entry,
     the value is passed through ``bash_wrap`` and handed to ``MRStep``
     as the matching ``*_cmd`` keyword argument.
     """
     built = []
     for spec in self.options.steps:
         cmd_kwargs = {}
         for substep in ("mapper", "combiner", "reducer"):
             if substep in spec:
                 cmd_kwargs[substep + "_cmd"] = bash_wrap(spec[substep])
         built.append(MRStep(**cmd_kwargs))
     return built
开发者ID:hophacker,项目名称:mrjob,代码行数:12,代码来源:mr_cmd.py

示例3: steps

 def steps(self):
     """Turn every entry of ``self.options.steps`` into a step via ``self.mr``.

     Each 'mapper', 'combiner' or 'reducer' value found in an entry is
     passed through ``bash_wrap`` and supplied to ``self.mr`` under the
     corresponding ``*_cmd`` keyword.
     """
     # (key looked up in the step description, keyword given to self.mr)
     substep_to_kwarg = (
         ('mapper', 'mapper_cmd'),
         ('combiner', 'combiner_cmd'),
         ('reducer', 'reducer_cmd'),
     )

     result = []
     for description in self.options.steps:
         kwargs = {}
         for key, kwarg_name in substep_to_kwarg:
             if key in description:
                 kwargs[kwarg_name] = bash_wrap(description[key])
         result.append(self.mr(**kwargs))
     return result
开发者ID:Anihc,项目名称:mrjob,代码行数:12,代码来源:mr_cmd.py

示例4: _hadoop_streaming_commands

    def _hadoop_streaming_commands(self, step_num):
        """Return the ``(mapper, combiner, reducer)`` commands for a step.

        ``self._render_substep`` supplies each command along with a flag;
        commands whose flag is truthy are passed through ``bash_wrap``
        before being returned.
        """
        # Phase 1: render all three substeps before wrapping anything.
        rendered = []
        for substep in ("mapper", "combiner", "reducer"):
            command, needs_wrap = self._render_substep(step_num, substep)
            rendered.append((command, needs_wrap))

        # Phase 2: wrap the flagged commands, in the same order.
        mapper, combiner, reducer = [
            bash_wrap(command) if needs_wrap else command
            for command, needs_wrap in rendered
        ]

        return mapper, combiner, reducer
开发者ID:irskep,项目名称:mrjob,代码行数:18,代码来源:runner.py

示例5: test_pre_filter_escaping

 def test_pre_filter_escaping(self):
     """Check the streaming args for a bash-wrapped ``pre_filter``.

     The expected ``-mapper`` value nests one ``bash -c '...'`` inside
     another, so every single quote of the inner command shows up
     escaped.
     """
     step = {
         "type": "streaming",
         "mapper": {
             "type": "script",
             "pre_filter": bash_wrap("grep 'anything'"),
         },
     }

     # ESCAPE ALL THE THINGS!!!
     escaped_mapper = (
         "bash -c 'bash -c '\\''grep"
         " '\\''\\'\\'''\\''anything'\\''\\'\\'''\\'''\\'' |"
         " python my_job.py --step-num=0 --mapper'"
     )
     expected_args = [
         "-mapper",
         escaped_mapper,
         "-jobconf",
         "mapred.reduce.tasks=0",
     ]

     self._assert_streaming_step(step, expected_args)
开发者ID:swiftserve,项目名称:mrjob,代码行数:13,代码来源:test_hadoop.py

示例6: _hadoop_streaming_commands

    def _hadoop_streaming_commands(self, step_num):
        """Return the ``(mapper, combiner, reducer)`` commands for a step.

        Every command is obtained from ``self._render_substep`` together
        with a flag; a truthy flag means the command is passed through
        ``bash_wrap`` before it is returned.
        """
        # The result is not used in this method; the call is kept so that
        # whatever get_hadoop_version() does still happens first.
        self.get_hadoop_version()

        mapper, wrap_mapper = self._render_substep(step_num, 'mapper')
        combiner, wrap_combiner = self._render_substep(step_num, 'combiner')
        reducer, wrap_reducer = self._render_substep(step_num, 'reducer')

        mapper = bash_wrap(mapper) if wrap_mapper else mapper
        combiner = bash_wrap(combiner) if wrap_combiner else combiner
        reducer = bash_wrap(reducer) if wrap_reducer else reducer

        return mapper, combiner, reducer
开发者ID:Milkigit,项目名称:mrjob,代码行数:23,代码来源:runner.py

示例7: test_pre_filter_escaping

 def test_pre_filter_escaping(self):
     """Check the streaming args for a bash-wrapped ``pre_filter``.

     The ``pre_filter`` is itself the output of ``bash_wrap``; the
     expected ``-mapper`` value therefore contains a ``bash -c`` nested
     in another ``bash -c``, with the inner quotes escaped.
     """
     pre_filter = bash_wrap("grep 'anything'")
     mapper = {'type': 'script', 'pre_filter': pre_filter}
     step = {'type': 'streaming', 'mapper': mapper}

     # ESCAPE ALL THE THINGS!!!
     mapper_arg = (
         "bash -c 'bash -c '\\''grep"
         " '\\''\\'\\'''\\''anything'\\''\\'\\'''\\'''\\'' |"
         " python my_job.py --step-num=0 --mapper'")

     expected = ['-mapper', mapper_arg]
     expected.extend(['-jobconf', 'mapred.reduce.tasks=0'])

     self._assert_streaming_step(step, expected)
开发者ID:DepengLuan,项目名称:mrjob,代码行数:15,代码来源:test_hadoop.py

示例8: test_pre_filter_escaping

    def test_pre_filter_escaping(self):
        """Check ``_args_for_streaming_step`` with a bash-wrapped pre_filter.

        The runner gets a single streaming step whose script mapper has a
        ``pre_filter`` produced by ``bash_wrap``. The expected ``-mapper``
        argument nests one ``bash -c`` in another, so the inner quotes
        appear escaped.
        """
        mapper_spec = {
            'type': 'script',
            'pre_filter': bash_wrap("grep 'anything'"),
        }
        self.runner._steps = [{'type': 'streaming', 'mapper': mapper_spec}]

        # Compute the actual args before building the expected list, as
        # the original assertion did.
        actual_args = self.runner._args_for_streaming_step(0)

        # ESCAPE ALL THE THINGS!!!
        escaped_mapper = (
            "bash -c 'bash -c '\\''grep"
            " '\\''\\'\\'''\\''anything'\\''\\'\\'''\\'''\\'' | " +
            PYTHON_BIN +
            " my_job.py --step-num=0 --mapper'")

        expected_args = (
            self.BASIC_HADOOP_ARGS + ['-D', 'mapreduce.job.reduces=0'] +
            self.BASIC_JOB_ARGS + ['-mapper', escaped_mapper])

        self.assertEqual(actual_args, expected_args)
开发者ID:Milkigit,项目名称:mrjob,代码行数:21,代码来源:test_hadoop.py

示例9: test_multiple

    def test_multiple(self):
        """Run a local ``CmdJob`` with command mapper, combiner and reducer.

        Checks the step description reported by the runner, then runs the
        job and checks the streamed output.
        """
        mapper_cmd = 'cat -e'
        combiner_cmd = 'uniq'
        reducer_cmd = bash_wrap('wc -l | tr -Cd "[:digit:]"')

        cli_args = ['--runner', 'local']
        cli_args += ['--mapper-cmd', mapper_cmd]
        cli_args += ['--combiner-cmd', combiner_cmd]
        cli_args += ['--reducer-cmd', reducer_cmd]

        job = CmdJob(cli_args)
        job.sandbox(stdin=StringIO('x\nx\nx\nx\nx\nx\n'))

        expected_steps = [{
            'type': 'streaming',
            'mapper': {'type': 'command', 'command': mapper_cmd},
            'combiner': {'type': 'command', 'command': combiner_cmd},
            'reducer': {'type': 'command', 'command': reducer_cmd},
        }]

        with job.make_runner() as runner:
            self.assertEqual(runner._get_steps(), expected_steps)

            runner.run()

            output = list(runner.stream_output())
            self.assertEqual(output, ['2'])
开发者ID:eklitzke,项目名称:mrjob,代码行数:23,代码来源:test_local.py

示例10: test_multiple

    def test_multiple(self):
        """Run a local ``CmdJob`` whose three substeps are shell commands.

        Verifies the steps reported by the runner, then runs the job on
        bytes input and verifies the streamed output.
        """
        commands = {
            "mapper": "cat -e",
            "combiner": "uniq",
            "reducer": bash_wrap('wc -l | tr -Cd "[:digit:]"'),
        }

        job = CmdJob(
            [
                "--runner", "local",
                "--mapper-cmd", commands["mapper"],
                "--combiner-cmd", commands["combiner"],
                "--reducer-cmd", commands["reducer"],
            ]
        )
        job.sandbox(stdin=BytesIO(b"x\nx\nx\nx\nx\nx\n"))

        expected_step = {"type": "streaming"}
        for substep in ("mapper", "combiner", "reducer"):
            expected_step[substep] = {
                "type": "command",
                "command": commands[substep],
            }

        with job.make_runner() as runner:
            self.assertEqual(runner._get_steps(), [expected_step])

            runner.run()

            streamed = list(runner.stream_output())
            self.assertEqual(streamed, [b"2"])
开发者ID:alanhdu,项目名称:mrjob,代码行数:24,代码来源:test_local.py

示例11: reducer_cmd

 def reducer_cmd(self):
     """Return ``./wordcount.sh reducer`` passed through ``bash_wrap``."""
     command = './wordcount.sh reducer'
     return bash_wrap(command)
开发者ID:Anihc,项目名称:mrjob,代码行数:2,代码来源:BashWordcount.py

示例12: mapper_cmd

 def mapper_cmd(self):
     """Return ``./wordcount.sh mapper`` passed through ``bash_wrap``."""
     command = './wordcount.sh mapper'
     return bash_wrap(command)
开发者ID:Anihc,项目名称:mrjob,代码行数:2,代码来源:BashWordcount.py


注:本文中的 mrjob.util.bash_wrap 函数示例由纯净天空整理自 GitHub/MSDocs 等开源代码及文档管理平台,相关代码片段筛选自各路编程大神贡献的开源项目,源码版权归原作者所有,传播和使用请参考对应项目的 License;未经允许,请勿转载。