Example #1
0
    def test_sort_values_sets_jobconf(self):
        mr_job = MRSortValues()

        self.assertEqual(
            mr_job.jobconf(),
            {'stream.num.map.output.key.fields': 2,
             'mapred.text.key.partitioner.options': '-k1,1',
             'mapred.output.key.comparator.class': None,
             'mapred.text.key.comparator.options': None})
Example #2
0
    def test_sort_values_sets_jobconf(self):
        mr_job = MRSortValues()

        self.assertEqual(
            mr_job.jobconf(), {
                'stream.num.map.output.key.fields': 2,
                'mapred.text.key.partitioner.options': '-k1,1',
                'mapred.output.key.comparator.class': None,
                'mapred.text.key.comparator.options': None
            })
Example #3
0
    def test_cant_override_sort_values_from_mrjob_conf(self):
        runner = MRSortValues().make_runner()

        self.assertEqual(
            runner._hadoop_args_for_step(0),
            # foo=bar is included, but the other options from mrjob.conf are
            # blanked out so as not to mess up SORT_VALUES
            ['-D', 'foo=bar',
             '-D', 'mapred.text.key.partitioner.options=-k1,1',
             '-D', 'stream.num.map.output.key.fields=2',
             '-partitioner',
                'org.apache.hadoop.mapred.lib.KeyFieldBasedPartitioner'])
Example #4
0
    def test_sort_values_sets_jobconf(self):
        mr_job = MRSortValues()

        self.assertEqual(
            mr_job.jobconf(),
            {
                "stream.num.map.output.key.fields": 2,
                "mapred.text.key.partitioner.options": "-k1,1",
                "mapred.output.key.comparator.class": None,
                "mapred.text.key.comparator.options": None,
            },
        )
Example #5
0
    def test_cant_override_sort_values_from_mrjob_conf(self):
        runner = MRSortValues().make_runner()

        self.assertEqual(
            runner._hadoop_args_for_step(0),
            # foo=bar is included, but the other options from mrjob.conf are
            # blanked out so as not to mess up SORT_VALUES
            [
                '-D', 'foo=bar', '-D',
                'mapred.text.key.partitioner.options=-k1,1', '-D',
                'stream.num.map.output.key.fields=2', '-partitioner',
                'org.apache.hadoop.mapred.lib.KeyFieldBasedPartitioner'
            ])
Example #6
0
    def test_can_override_sort_values_from_cmd_line(self):
        mr_job = MRSortValues(
            ['--partitioner', 'org.pants.FancyPantsPartitioner',
             '--jobconf', 'stream.num.map.output.key.fields=lots'])

        self.assertEqual(
            mr_job.partitioner(),
            'org.pants.FancyPantsPartitioner')

        self.assertEqual(
            mr_job.jobconf(),
            combine_dicts(_SORT_VALUES_JOBCONF,
                          {'stream.num.map.output.key.fields': 'lots'}))
Example #7
0
    def test_can_override_sort_values_from_cmd_line(self):
        mr_job = MRSortValues([
            '--partitioner', 'org.pants.FancyPantsPartitioner', '--jobconf',
            'stream.num.map.output.key.fields=lots'
        ])

        self.assertEqual(mr_job.partitioner(),
                         'org.pants.FancyPantsPartitioner')

        self.assertEqual(
            mr_job.jobconf(),
            combine_dicts(_SORT_VALUES_JOBCONF,
                          {'stream.num.map.output.key.fields': 'lots'}))
Example #8
0
    def test_can_override_sort_values_from_cmd_line(self):
        mr_job = MRSortValues(
            ['--partitioner', 'org.pants.FancyPantsPartitioner',
             '--jobconf', 'stream.num.map.output.key.fields=lots'])

        self.assertEqual(
            mr_job.partitioner(),
            'org.pants.FancyPantsPartitioner')

        self.assertEqual(
            mr_job.jobconf(),
            {'stream.num.map.output.key.fields': 'lots',
             'mapred.text.key.partitioner.options': '-k1,1',
             'mapred.output.key.comparator.class': None,
             'mapred.text.key.comparator.options': None})
Example #9
0
    def test_can_override_sort_values_from_cmd_line(self):
        mr_job = MRSortValues([
            '--partitioner', 'org.pants.FancyPantsPartitioner', '--jobconf',
            'stream.num.map.output.key.fields=lots'
        ])

        self.assertEqual(mr_job.partitioner(),
                         'org.pants.FancyPantsPartitioner')

        self.assertEqual(
            mr_job.jobconf(), {
                'stream.num.map.output.key.fields': 'lots',
                'mapred.text.key.partitioner.options': '-k1,1',
                'mapred.output.key.comparator.class': None,
                'mapred.text.key.comparator.options': None
            })
Example #10
0
    def test_can_override_sort_values_from_cmd_line(self):
        mr_job = MRSortValues(
            ["--partitioner", "org.pants.FancyPantsPartitioner", "--jobconf", "stream.num.map.output.key.fields=lots"]
        )

        self.assertEqual(mr_job.partitioner(), "org.pants.FancyPantsPartitioner")

        self.assertEqual(
            mr_job.jobconf(),
            {
                "stream.num.map.output.key.fields": "lots",
                "mapred.text.key.partitioner.options": "-k1,1",
                "mapred.output.key.comparator.class": None,
                "mapred.text.key.comparator.options": None,
            },
        )
Example #11
0
    def test_sort_values_sets_partitioner(self):
        mr_job = MRSortValues()

        self.assertEqual(
            mr_job.partitioner(),
            'org.apache.hadoop.mapred.lib.KeyFieldBasedPartitioner')
Example #12
0
    def test_sort_values_sets_jobconf(self):
        mr_job = MRSortValues()

        self.assertEqual(mr_job.jobconf(), _SORT_VALUES_JOBCONF)
Example #13
0
    def test_sort_values_sets_partitioner(self):
        mr_job = MRSortValues()

        self.assertEqual(
            mr_job.partitioner(),
            'org.apache.hadoop.mapred.lib.KeyFieldBasedPartitioner')
Example #14
0
    def test_sort_values_sets_jobconf(self):
        mr_job = MRSortValues()

        self.assertEqual(mr_job.jobconf(), _SORT_VALUES_JOBCONF)