示例#1
0
    def test_get_item(self):
        # HeronComponentSpec name set
        spec = HeronComponentSpec("spout", "class", True, 1)
        spec.outputs = [
            "string", "hello",
            Stream(fields=["abc", "def"], name="another_stream"),
            Stream(fields=["another", "default"], name="default")
        ]
        ret = spec['another_stream']
        self.assertEqual(ret, GlobalStreamId("spout", "another_stream"))

        # HeronComponentSpec name not set
        spec = HeronComponentSpec(None, "class", True, 1)
        spec.outputs = [
            "string", "hello",
            Stream(fields=["abc", "def"], name="another_stream"),
            Stream(fields=["another", "default"], name="default")
        ]
        ret = spec['default']
        self.assertEqual(ret, GlobalStreamId(spec, "default"))

        # stream id not registered
        spec = HeronComponentSpec(None, "class", True, 1)
        spec.outputs = [
            "string", "hello",
            Stream(fields=["abc", "def"], name="another_stream"),
            Stream(fields=["another", "default"], name="default")
        ]
        with self.assertRaises(ValueError):
            spec['non_existent_stream']
示例#2
0
class TestSane(Topology):
  config = {"topology.wide.config.1": "value",
            "spout.overriden.config": True}
  spout = HeronComponentSpec(None, "sp_class", True, 3, inputs=None,
                             outputs=["word", "count",
                                      Stream(fields=['error_msg'], name='error_stream')],
                             config={"spout.specific.config.1": "value",
                                     "spout.specific.config.2": True,
                                     "spout.specific.config.3": -12.4,
                                     "spout.specific.config.4": [1, 2, 3],
                                     "spout.overriden.config": False})
  bolt = HeronComponentSpec(None, "bl_class", False, 4,
                            inputs={spout: Grouping.SHUFFLE, spout['error_stream']: Grouping.ALL})
示例#3
0
    def test_component_id_property(self):
        # component id is string
        gsi = GlobalStreamId(componentId="component", streamId="stream")
        self.assertEqual(gsi.component_id, "component")

        # component id is HeronComponentSpec with name
        spec = HeronComponentSpec("spout", "class", True, 1)
        gsi = GlobalStreamId(spec, "stream")
        self.assertEqual(gsi.component_id, "spout")

        # component id is HeronComponentSpec without name
        spec = HeronComponentSpec(None, "class", True, 1)
        gsi = GlobalStreamId(spec, "stream")
        # expecting "<No name available for HeronComponentSpec yet, uuid: %s>"
        self.assertIn(spec.uuid, gsi.component_id)
示例#4
0
  def test_add_spec(self):
    builder = TopologyBuilder("Test")

    with self.assertRaises(ValueError):
      builder.add_spec(HeronComponentSpec(None, "path", True, 1))

    with self.assertRaises(TypeError):
      builder.add_spec(None)

    self.assertEqual(len(builder._specs), 0)

    # add 10 specs
    specs = []
    for i in range(10):
      specs.append(HeronComponentSpec(str(i), "path", True, 1))
    builder.add_spec(*specs)
    self.assertEqual(len(builder._specs), 10)
示例#5
0
 def spec(cls, name, par, inputs, config, user_bolt_classpath, user_output_fields=None):
   python_class_path = "%s.%s" % (cls.__module__, cls.__name__)
   config[integ_const.USER_BOLT_CLASSPATH] = user_bolt_classpath
   # avoid modification to cls.outputs
   _outputs = copy.copy(cls.outputs)
   if user_output_fields is not None:
     _outputs.extend(user_output_fields)
   return HeronComponentSpec(name, python_class_path, is_spout=False, par=par,
                             inputs=inputs, outputs=_outputs, config=config)
示例#6
0
    def test_get_out_streamids(self):
        # outputs is none
        spec = HeronComponentSpec("spout", "class", True, 1)
        ret = spec.get_out_streamids()
        self.assertEqual(ret, set())

        # outputs neither list nor tuple
        spec = HeronComponentSpec("spout", "class", True, 1)
        spec.outputs = "string"
        with self.assertRaises(TypeError):
            spec.get_out_streamids()

        # outputs sane
        spec = HeronComponentSpec("spout", "class", True, 1)
        spec.outputs = [
            "string", "hello",
            Stream(fields=["abc", "def"], name="another_stream"),
            Stream(fields=["another", "default"], name="default")
        ]
        ret = spec.get_out_streamids()
        self.assertEqual(ret, {"default", "another_stream"})
示例#7
0
    def test_sanitize_outputs(self):
        # outputs is None (no argument to outputs)
        spec = HeronComponentSpec("spout", "class", True, 1)
        ret = spec._sanitize_outputs()
        self.assertIsNone(ret)

        # outputs neither list nor tuple
        spec = HeronComponentSpec("spout", "class", True, 1)
        spec.outputs = "string"
        with self.assertRaises(TypeError):
            spec._sanitize_outputs()

        # output list contains a non-string and non-Stream object
        spec = HeronComponentSpec("spout", "class", True, 1)
        spec.outputs = ["string", False, 123]
        with self.assertRaises(TypeError):
            spec._sanitize_outputs()

        # output list is all string
        spec = HeronComponentSpec("spout", "class", True, 1)
        spec.outputs = ["string", "hello", "heron"]
        ret = spec._sanitize_outputs()
        self.assertEqual(ret, {"default": ["string", "hello", "heron"]})

        # output list has mixed stream
        spec = HeronComponentSpec("spout", "class", True, 1)
        spec.outputs = [
            "string", "hello",
            Stream(fields=["abc", "def"], name="another_stream"),
            Stream(fields=["another", "default"], name="default")
        ]
        ret = spec._sanitize_outputs()
        self.assertEqual(
            ret, {
                "default": ["string", "hello", "another", "default"],
                "another_stream": ["abc", "def"]
            })
示例#8
0
    def test_sanitize_args(self):
        # good args
        spec = HeronComponentSpec(name="string",
                                  python_class_path="string.path",
                                  is_spout=True,
                                  par=1)
        self.assertIsNotNone(spec)
        name_none_spec = HeronComponentSpec(name=None,
                                            python_class_path="string.path",
                                            is_spout=True,
                                            par=1)
        self.assertIsNotNone(name_none_spec)

        # bad name
        with self.assertRaises(AssertionError):
            HeronComponentSpec(123, "classpath", True, 1)
        with self.assertRaises(AssertionError):
            HeronComponentSpec(False, "classpath", True, 1)

        # bad classpath
        with self.assertRaises(AssertionError):
            HeronComponentSpec("name", {}, True, 1)
        with self.assertRaises(AssertionError):
            HeronComponentSpec("name", None, True, 1)

        # bad is_spout
        with self.assertRaises(AssertionError):
            HeronComponentSpec("name", "classpath", 1, 1)
        with self.assertRaises(AssertionError):
            HeronComponentSpec("name", "classpath", None, 1)

        # bad par
        with self.assertRaises(AssertionError):
            HeronComponentSpec("name", "classpath", True, "1")
        with self.assertRaises(AssertionError):
            HeronComponentSpec("name", "classpath", True, 1.35)
        with self.assertRaises(AssertionError):
            HeronComponentSpec("name", "classpath", True, -21)
        with self.assertRaises(AssertionError):
            HeronComponentSpec("name", "classpath", True, None)
示例#9
0
    def test_sanitize_inputs(self):
        # Note that _sanitize_inputs() should only be called after HeronComponentSpec's
        # name attribute is set

        # invalid inputs given as argument (valid ones are either dict, list, tuple or None)
        invalid_spec = HeronComponentSpec("name",
                                          "classpath",
                                          True,
                                          1,
                                          inputs="string")
        with self.assertRaises(TypeError):
            invalid_spec._sanitize_inputs()

        invalid_spec = HeronComponentSpec("name",
                                          "classpath",
                                          True,
                                          1,
                                          inputs=100)
        with self.assertRaises(TypeError):
            invalid_spec._sanitize_inputs()

        # dict <HeronComponentSpec -> Grouping>
        from_spec = HeronComponentSpec("spout", "sp_clspath", True, 1)
        to_spec = HeronComponentSpec("bolt",
                                     "bl_clspath",
                                     False,
                                     1,
                                     inputs={from_spec: Grouping.SHUFFLE})
        ret = to_spec._sanitize_inputs()
        self.assertEqual(
            ret, {GlobalStreamId("spout", "default"): Grouping.SHUFFLE})

        from_spec = HeronComponentSpec("spout", "sp_clspath", True, 1)
        from_spec.outputs = [Stream(name='another_stream')]
        to_spec = HeronComponentSpec(
            "bolt",
            "bl_clspath",
            False,
            1,
            inputs={from_spec['another_stream']: Grouping.ALL})
        ret = to_spec._sanitize_inputs()
        self.assertEqual(
            ret, {GlobalStreamId("spout", "another_stream"): Grouping.ALL})

        # HeronComponentSpec's name attribute not set
        from_spec = HeronComponentSpec(None, "sp_clspath", True, 1)
        to_spec = HeronComponentSpec("bolt",
                                     "bl_clspath",
                                     False,
                                     1,
                                     inputs={from_spec: Grouping.ALL})
        with self.assertRaises(RuntimeError):
            to_spec._sanitize_inputs()

        # dict <GlobalStreamId -> Grouping>
        inputs_dict = {
            GlobalStreamId("some_spout", "some_stream"):
            Grouping.NONE,
            GlobalStreamId("another_spout", "default"):
            Grouping.fields(['word', 'count'])
        }
        spec = HeronComponentSpec("bolt",
                                  "classpath",
                                  False,
                                  1,
                                  inputs=inputs_dict)
        ret = spec._sanitize_inputs()
        self.assertEqual(ret, inputs_dict)

        # list of HeronComponentSpec
        from_spec1 = HeronComponentSpec("spout1", "sp1_cls", True, 1)
        from_spec2 = HeronComponentSpec("spout2", "sp2_cls", True, 1)
        to_spec = HeronComponentSpec("bolt",
                                     "bl_cls",
                                     False,
                                     1,
                                     inputs=[from_spec1, from_spec2])
        ret = to_spec._sanitize_inputs()
        self.assertEqual(
            ret, {
                GlobalStreamId("spout1", "default"): Grouping.SHUFFLE,
                GlobalStreamId("spout2", "default"): Grouping.SHUFFLE
            })

        # HeronComponentSpec's name attribute not set
        from_spec = HeronComponentSpec(None, "sp_clspath", True, 1)
        to_spec = HeronComponentSpec("bolt",
                                     "bl_clspath",
                                     False,
                                     1,
                                     inputs=[from_spec])
        with self.assertRaises(RuntimeError):
            to_spec._sanitize_inputs()

        # list of GlobalStreamId
        inputs_list = [
            GlobalStreamId("spout1", "default"),
            GlobalStreamId("spout2", "some_stream")
        ]
        spec = HeronComponentSpec("bolt",
                                  "bl_cls",
                                  False,
                                  1,
                                  inputs=inputs_list)
        ret = spec._sanitize_inputs()
        self.assertEqual(ret, dict(zip(inputs_list, [Grouping.SHUFFLE] * 2)))

        # list of neither GlobalStreamId nor HeronComponentSpec
        inputs_list = [None, 123, "string", [GlobalStreamId("sp", "default")]]
        spec = HeronComponentSpec("bolt",
                                  "bl_cls",
                                  False,
                                  1,
                                  inputs=inputs_list)
        with self.assertRaises(ValueError):
            spec._sanitize_inputs()
示例#10
0
 def test_add_bolt_specs(self):
   spec = HeronComponentSpec("bolt", "bl_cls", False, 1)
   with self.assertRaises(ValueError):
     TopologyType.add_bolt_specs(spec, {})
示例#11
0
 def test_add_spout_specs(self):
   # spout with no output
   spec = HeronComponentSpec("spout", "sp_cls", True, 1)
   with self.assertRaises(ValueError):
     TopologyType.add_spout_specs(spec, {})
示例#12
0
 def test_class_dict_to_specs(self):
   # duplicate component name
   class_dict = {"spout": HeronComponentSpec("same_name", "sp_cls", True, 1),
                 "bolt": HeronComponentSpec("same_name", "bl_cls", False, 2)}
   with self.assertRaises(ValueError):
     TopologyType.class_dict_to_specs(class_dict)
示例#13
0
 class JustBolt(Topology):
   bolt = HeronComponentSpec(None, "bl_class", False, 4)