def test_merge_histogram(self):
    """Check the histogram produced by merging new values into a stored one.

    The profiler's stored histogram is seeded by hand, raw values are
    merged in through ``_merge_histogram``, and the histogram reported by
    ``_histogram_for_profile('sqrt')`` is compared with the expected bin
    counts and bin edges.
    """
    data = pd.Series([], dtype=object)
    profiler = FloatColumn(data.name)
    profiler.update(data)

    # Seed a known starting state: two bins, [1, 3] holding 3 values and
    # [3, 5] holding 2 values.
    profiler._stored_histogram['histogram']['bin_counts'] = np.array(
        [3, 2])
    profiler._stored_histogram['histogram']['bin_edges'] = \
        np.array([1.0, 3.0, 5.0])
    input_array = [0.5, 1.0, 2.0, 5.0]

    profiler._merge_histogram(input_array)
    merged_hist = profiler._histogram_for_profile('sqrt')[0]

    expected_bin_counts, expected_bin_edges = \
        [5, 2, 2], [0.5, 2.0, 3.5, 5.0]
    self.assertEqual(expected_bin_counts,
                     merged_hist['bin_counts'].tolist())
    # Bin edges are an ordered sequence, so compare them position by
    # position; assertCountEqual would also accept a shuffled result.
    self.assertEqual(expected_bin_edges, list(merged_hist['bin_edges']))
def test_merge_histogram(self):
    """Check the 'sqrt' histogram after merging new values into it.

    The profiler's ``histogram_methods['sqrt']`` histogram is seeded by
    hand, raw values are merged in through
    ``_merge_histogram(values, 'sqrt')``, and the resulting bin counts and
    bin edges are compared with the expected ones.
    """
    data = pd.Series([], dtype=object)
    profiler = FloatColumn(data.name)
    profiler.update(data)

    # Seed a known starting state: two bins, [1, 3] holding 3 values and
    # [3, 5] holding 2 values.
    profiler.histogram_methods['sqrt']['histogram']['bin_counts'] = \
        np.array([3, 2])
    profiler.histogram_methods['sqrt']['histogram']['bin_edges'] = \
        np.array([1.0, 3.0, 5.0])
    input_array = [0.5, 1.0, 2.0, 5.0]

    profiler._merge_histogram(input_array, 'sqrt')

    # Re-read the histogram after the merge rather than reusing an earlier
    # reference, in case the merge replaces the stored objects.
    merged_bin_counts = \
        profiler.histogram_methods['sqrt']['histogram']['bin_counts']
    merged_bin_edges = \
        profiler.histogram_methods['sqrt']['histogram']['bin_edges']

    expected_bin_counts, expected_bin_edges = \
        [5, 2, 2], [0.5, 2.0, 3.5, 5.0]
    # Counts and edges are positional (count i belongs to the bin between
    # edges i and i + 1), so compare them in order; assertCountEqual would
    # also accept any permutation.
    self.assertEqual(expected_bin_counts, list(merged_bin_counts))
    self.assertEqual(expected_bin_edges, list(merged_bin_edges))