def test_drop_empty_samples(self):
    """Check that drop_empty_samples() removes the all-NaN row and its label.

    The input has three rows; the middle one contains only NaN. The
    filtered result is expected to keep all three feature columns, the
    two remaining rows (including the partially-NaN first row), and the
    labels of those two rows.
    """
    # np.nan is the canonical spelling; the upper-case np.NAN alias is
    # not available in NumPy 2.x.
    df = pd.DataFrame(
        [
            [1, 2, np.nan],
            [np.nan, np.nan, np.nan],
            [7, 8, 9],
        ]
    )
    original = DataSet(df, labels=["a", "b", "c"])

    filtered = original.drop_empty_samples()

    assert_that(filtered.feature_list(), has_length(3))
    assert_that(filtered.num_samples(), equal_to(2))
    assert_that(filtered, equals_dataset([[1, 2, np.nan], [7, 8, 9]]))
    assert_that(filtered.get_labels(), contains("a", "c"))
def test_drop_empty_samples_original_unchanged(self):
    """Check that changing the filtered result leaves the source DataSet intact.

    After calling drop_empty_samples(), the returned object's first column
    and first label are overwritten; the original DataSet must still match
    the data and labels it was built from.
    """
    # np.nan is the canonical spelling; the upper-case np.NAN alias is
    # not available in NumPy 2.x.
    data_list = [
        [1, 2, np.nan],
        [np.nan, np.nan, np.nan],
        [7, 8, 9],
    ]
    label_list = ["a", "b", "c"]
    original = DataSet(pd.DataFrame(data_list), labels=label_list)

    filtered = original.drop_empty_samples()

    # Mutate the filtered result; the assertions below verify that none
    # of these changes are visible through the original.
    filtered.set_column(0, [-1, -1])
    filtered.labels[0] = "z"

    assert_that(original, equals_dataset(data_list))
    assert_that(original.get_labels(), contains(*label_list))