Exemplo n.º 1
0
def test_merge_floattrackers_should_addup():
    first = IntTracker()
    vals1 = [1, 2, 3]
    for val in vals1:
        first.update(val)

    assert first.count == len(vals1)
    assert first.max == max(vals1)
    assert first.min == min(vals1)
    assert first.sum == sum(vals1)

    second = IntTracker()
    vals2 = [4, 5, 6]
    for val in vals2:
        second.update(val)

    assert second.count == len(vals2)
    assert second.max == max(vals2)
    assert second.min == min(vals2)
    assert second.sum == sum(vals2)

    all_vals = vals1 + vals2
    merge_first = first.merge(second)
    assert merge_first.count == len(all_vals)
    assert merge_first.max == max(all_vals)
    assert merge_first.min == min(all_vals)
    assert merge_first.sum == sum(all_vals)

    merge_second = second.merge(first)
    assert merge_second.__dict__ == merge_first.__dict__
Exemplo n.º 2
0
def test_values_are_min_max():
    first = IntTracker()
    vals1 = [1, 2, 3]
    for val in vals1:
        first.update(val)

    assert first.count == len(vals1)
    assert first.max == max(vals1)
    assert first.min == min(vals1)
    assert first.sum == sum(vals1)
Exemplo n.º 3
0
    def from_protobuf(message: NumbersMessage):
        """
        Load from a protobuf message

        Returns
        -------
        number_tracker : NumberTracker
        """
        theta = None
        if message.theta is not None and len(message.theta) > 0:
            theta = ThetaSketch.deserialize(message.theta)
        elif message.compact_theta is not None and len(message.compact_theta) > 0:
            theta = ThetaSketch.deserialize(message.compact_theta)

        opts = dict(
            theta_sketch=theta,
            variance=VarianceTracker.from_protobuf(message.variance),
            histogram=dsketch.deserialize_kll_floats_sketch(message.histogram),
            frequent_numbers=dsketch.FrequentNumbersSketch.from_protobuf(
                message.frequent_numbers
            ),
        )
        if message.HasField("doubles"):
            opts["floats"] = FloatTracker.from_protobuf(message.doubles)
        if message.HasField("longs"):
            opts["ints"] = IntTracker.from_protobuf(message.longs)
        return NumberTracker(**opts)
Exemplo n.º 4
0
 def __init__(
     self,
     variance: VarianceTracker = None,
     floats: FloatTracker = None,
     ints: IntTracker = None,
     theta_sketch: ThetaSketch = None,
     histogram: datasketches.kll_floats_sketch = None,
     frequent_numbers: dsketch.FrequentNumbersSketch = None,
 ):
     # Our own trackers
     if variance is None:
         variance = VarianceTracker()
     if floats is None:
         floats = FloatTracker()
     if ints is None:
         ints = IntTracker()
     if theta_sketch is None:
         theta_sketch = ThetaSketch()
     if histogram is None:
         histogram = datasketches.kll_floats_sketch(DEFAULT_HIST_K)
     if frequent_numbers is None:
         frequent_numbers = dsketch.FrequentNumbersSketch()
     self.variance = variance
     self.floats = floats
     self.ints = ints
     self.theta_sketch = theta_sketch
     self.histogram = histogram
     self.frequent_numbers = frequent_numbers
Exemplo n.º 5
0
    def from_protobuf(message: NumbersMessage):
        """
        Load from a protobuf message

        Returns
        -------
        number_tracker : NumberTracker
        """
        theta = None
        if message.compact_theta is not None and len(
                message.compact_theta) > 0:
            theta = ThetaSketch.deserialize(message.compact_theta)
        elif message.theta is not None and len(message.theta) > 0:
            logger.warning(
                "Possible missing data. Non-compact theta sketches are no longer supported"
            )

        opts = dict(
            theta_sketch=theta,
            variance=VarianceTracker.from_protobuf(message.variance),
            histogram=dsketch.deserialize_kll_floats_sketch(message.histogram),
        )
        if message.HasField("doubles"):
            opts["floats"] = FloatTracker.from_protobuf(message.doubles)
        if message.HasField("longs"):
            opts["ints"] = IntTracker.from_protobuf(message.longs)
        return NumberTracker(**opts)