def test_build(self, target_df, spark_client, spark_session): # arrange file_reader = FileReader("test", "path/to/file", "format") spark_client.read.return_value = target_df # act file_reader.build(spark_client) result_df = spark_session.sql("select * from test") # assert assert target_df.collect() == result_df.collect()
def test_build_with_columns(self, target_df, column_target_df, spark_client, spark_session): # arrange file_reader = FileReader("test", "path/to/file", "format") spark_client.read.return_value = target_df # act file_reader.build( client=spark_client, columns=[("col1", "new_col1"), ("col2", "new_col2")], ) result_df = spark_session.sql("select * from test") # assert assert column_target_df.collect() == result_df.collect()