Exemple #1
0
    def test_get_all_columns_except(self):
        """Excluding one column keeps the other column names, in order."""
        all_names = 'ABCD'
        excluded = 'D'
        frame = create_random_dataframe(rows=4, cols=4, columns=all_names)

        remaining = get_all_columns_except(frame, excluded)

        # Iterating the result is expected to yield its column labels, which
        # are joined back into a string for a single comparison.
        expected_names = all_names.replace(excluded, '')
        actual_names = ''.join(list(remaining))
        self.assertEqual(actual_names, expected_names)
Exemple #2
0
    def test_create_random_dataframe(self):
        """Create a 5x5 frame and validate it with the class's checker."""
        n_rows, n_cols = 5, 5
        names = 'ABCDE'

        frame = create_random_dataframe(n_rows, n_cols, names)

        # The private checker receives the same dimensions and column names
        # that were used to build the frame.
        self.__check_dataframe_data(frame, n_rows, n_cols, names)
    def test_series_to_list(self):
        """series_to_list output must carry the same values as each row."""
        frame = dataframe_utils.create_random_dataframe(rows=5,
                                                        cols=5,
                                                        columns='ABCDE')

        # NOTE(review): iterrows() yields (index, Series) pairs and the whole
        # pair is handed to series_to_list, not just the Series -- confirm
        # this is the intended input.
        for indexed_row in frame.iterrows():
            converted = series_to_list(indexed_row)

            expected_values = indexed_row[1].values.tolist()
            actual_values = converted[1].values.tolist()
            self.assertListEqual(expected_values, actual_values)
    def test_get_X_y(self):
        """Check that get_X_y splits a frame into feature rows and targets.

        Every returned target value is compared with column ``E`` of the
        source frame, and every returned feature value is compared with the
        matching cell of the remaining columns.
        """
        df = dataframe_utils.create_random_dataframe(rows=5,
                                                     cols=5,
                                                     columns='ABCDE')
        target = 'E'

        X_list, y_list = get_X_y(df, target)

        # Build the expected values once instead of re-slicing the frame on
        # every loop iteration.
        expected_y = df.loc[:, df.columns == target].values.tolist()
        expected_X = df.loc[:, df.columns != target].values.tolist()

        # check y values
        for row_index, y_final in enumerate(y_list):
            self.assertEqual(expected_y[row_index][0], y_final)

        # check X values; the loop variable has its own name so that X_list
        # is not rebound while it is being iterated
        for row_index, X_row in enumerate(X_list):
            for col_index, item_x in enumerate(X_row):
                self.assertEqual(expected_X[row_index][col_index], item_x)
    def test_make_visualizations_generate_artifacts(self):
        """make_visualizations must create the requested output path."""
        labels = [[0], [1]]

        # Only the second value returned by label_encode is used here.
        _, labels = label_encode(labels)

        embeddings_list = [np.array([[1, 0], [0, 1]])]

        df = dataframe_utils.create_random_dataframe(2, 2, 'AB')

        path = 'test_visualization'
        # Register the cleanup before the call so the output is removed even
        # when make_visualizations or the assertion below fails;
        # ignore_errors covers the case where nothing was created.
        self.addCleanup(shutil.rmtree, path, ignore_errors=True)

        make_visualizations(list(labels),
                            embeddings_list,
                            df,
                            output_path=path)

        self.assertTrue(os.path.exists(path))
Exemple #6
0
 def test_check_target_existent_in_df(self) -> None:
     """A target absent from the frame's columns must raise ValueError."""
     frame = dataframe_utils.create_random_dataframe(columns='ABCD')
     missing_target = 'E'

     with self.assertRaises(ValueError):
         check_target_existent_in_df(missing_target, frame)