예제 #1
0
    def test_ignores_columns_with_different_names_and_same_values(self):
        """Differently named columns with equal values must both be kept.

        The frame is handed to ``delete_duplicate_columns`` and the return
        value is ignored; the assertions inspect the same frame object
        afterwards, so the test relies on the call acting on it in place.
        """
        raw_csv = "a,b\n1,1\n2,2\n"
        # Parse the same text twice so the reference frame is independent
        # of the one passed to the function under test.
        untouched = pd.read_csv(StringIO(raw_csv))
        frame = pd.read_csv(StringIO(raw_csv))

        delete_duplicate_columns(frame)

        assert frame.columns.tolist() == ["a", "b"]
        assert_frame_equal(frame, untouched)
예제 #2
0
    def test_deletes_columns_with_surrounding_spaces_and_same_names_and_values(
        self, csv_data
    ):
        """Duplicate columns in ``csv_data`` collapse to plain ``a`` and ``b``.

        ``csv_data`` is CSV text supplied from outside this method
        (presumably a pytest fixture or parametrization -- not visible here).
        After ``delete_duplicate_columns`` runs on the parsed frame, the frame
        must equal the one parsed from the two-column reference CSV below.
        """
        frame = pd.read_csv(StringIO(csv_data))
        reference_csv = "a,b\n1,1\n2,2\n"
        reference = pd.read_csv(StringIO(reference_csv))

        # Return value is ignored; the assertions check the frame itself.
        delete_duplicate_columns(frame)

        assert frame.columns.tolist() == ["a", "b"]
        assert_frame_equal(frame, reference)
예제 #3
0
    def test_deletes_columns_with_same_names_and_same_values_with_nan(self):
        """Repeated ``a`` columns with a NaN row reduce to one ``a`` column.

        The input CSV has three ``a`` columns and one ``b`` column; the second
        data row holds the text form of ``np.nan`` in every ``a`` cell. After
        ``delete_duplicate_columns`` runs on the parsed frame, the frame must
        equal the one parsed from the two-column reference CSV.
        """
        # Text rendering of NaN, interpolated into both CSV documents.
        missing = f"{np.nan}"
        duplicated_csv = f"a,a,a,b\n1,1,1,1\n{missing},{missing},{missing},2\n"
        reference_csv = f"a,b\n1,1\n{missing},2\n"

        frame = pd.read_csv(StringIO(duplicated_csv))
        reference = pd.read_csv(StringIO(reference_csv))

        # Return value is ignored; the assertions check the frame itself.
        delete_duplicate_columns(frame)

        assert frame.columns.tolist() == ["a", "b"]
        assert_frame_equal(frame, reference)
예제 #4
0
    def test_deletes_multiple_columns_with_same_names_and_same_values(self):
        """Two repeated column pairs (``a,b,a,b``) reduce to ``a`` and ``b``.

        After ``delete_duplicate_columns`` runs on the frame parsed from the
        four-column CSV, the frame must equal the one parsed from the
        two-column reference CSV.
        """
        duplicated_csv = "a,b,a,b\n1,3,1,3\n2,4,2,4\n"
        reference_csv = "a,b\n1,3\n2,4\n"

        frame = pd.read_csv(StringIO(duplicated_csv))
        reference = pd.read_csv(StringIO(reference_csv))

        # Return value is ignored; the assertions check the frame itself.
        delete_duplicate_columns(frame)

        assert frame.columns.tolist() == ["a", "b"]
        assert_frame_equal(frame, reference)