def run_general_rules(self):
    """Run the general rules on the source items and save each result.

    Two results are saved through ``self.save_result``, in this order:

    1. ``garbage_symbols`` applied to ``self.source_items``.
    2. ``coverage_rules.check_fields_coverage`` applied to the source
       items dataframe with the ``_type`` and ``_key`` columns dropped.
    """
    garbage_result = garbage_symbols(self.source_items)
    self.save_result(garbage_result)

    # Coverage is computed without the "_type" and "_key" columns.
    fields_df = self.source_items.df.drop(columns=["_type", "_key"])
    coverage_result = coverage_rules.check_fields_coverage(fields_df)
    self.save_result(coverage_result)
def run_general_rules(self):
    """Run the general rules on the source items dataframe.

    Three results are saved through ``self.save_result``, in this order:

    1. ``garbage_symbols`` applied to the source items dataframe.
    2. ``coverage_rules.check_fields_coverage`` applied to the dataframe
       with every column whose name starts with ``_`` dropped.
    3. ``category_rules.get_categories`` applied to the full dataframe.
    """
    garbage_result = garbage_symbols(self.source_items.df)
    self.save_result(garbage_result)

    items_df = self.source_items.df
    all_columns = items_df.columns
    # Boolean mask selecting the columns whose name starts with "_".
    underscore_mask = items_df.columns.str.startswith("_")
    fields_df = items_df.drop(columns=all_columns[underscore_mask])
    self.save_result(coverage_rules.check_fields_coverage(fields_df))

    categories_result = category_rules.get_categories(items_df)
    self.save_result(categories_result)
def run_general_rules(self):
    """Run the general rules on the source items dataframe.

    Results are saved through ``self.save_result``, in this order:

    1. ``garbage_symbols`` applied to the source items dataframe.
    2. ``coverage_rules.check_fields_coverage`` applied to the dataframe
       with every column whose name starts with ``_`` dropped.
    3. ``category_rules.get_categories`` applied to the full dataframe.
    4. ``duplicate_rules.find_by`` applied to the dataframe and
       ``self.uniques``, only when ``self`` has a truthy ``uniques``
       attribute.
    """
    garbage_result = garbage_symbols(self.source_items.df)
    self.save_result(garbage_result)

    items_df = self.source_items.df
    all_columns = items_df.columns
    # Boolean mask selecting the columns whose name starts with "_".
    underscore_mask = items_df.columns.str.startswith("_")
    fields_df = items_df.drop(columns=all_columns[underscore_mask])
    self.save_result(coverage_rules.check_fields_coverage(fields_df))

    categories_result = category_rules.get_categories(items_df)
    self.save_result(categories_result)

    # The duplicates check is skipped when `uniques` is missing or falsy.
    if not getattr(self, "uniques", None):
        return
    duplicates_result = duplicate_rules.find_by(
        self.source_items.df, self.uniques
    )
    self.save_result(duplicates_result)
def scraped_fields_coverage(self, df: pd.DataFrame) -> None:
    """Append the "Fields Coverage" figures to ``self.figures``.

    The result stored in ``self.report.results`` under the
    ``"Fields Coverage"`` key is reused when present. Otherwise the
    coverage is computed from ``df`` with
    ``coverage_rules.check_fields_coverage``.

    Args:
        df: dataframe passed to ``coverage_rules.check_fields_coverage``
            when no stored result exists.
    """
    stored_results = self.report.results
    # `dict.get(key, default)` evaluates `default` before the lookup, so the
    # coverage rule used to run even when a stored result existed. Compute it
    # only on a miss.
    if "Fields Coverage" in stored_results:
        coverage_res = stored_results["Fields Coverage"]
    else:
        coverage_res = coverage_rules.check_fields_coverage(df)
    self.figures.extend(coverage_res.figures)
def test_check_fields_coverage(df, expected_messages, expected_stats):
    """Check that the coverage result for ``df`` equals the expected result.

    The expected result is built with ``create_result`` under the name
    "Fields Coverage" from ``expected_messages`` and ``expected_stats``.
    """
    actual = cov.check_fields_coverage(df)
    expected = create_result(
        "Fields Coverage", expected_messages, expected_stats
    )
    assert actual == expected
def test_check_fields_coverage(df, expected_messages, expected_stats):
    """Compare the coverage result for ``df`` against the expected result.

    The expected result is built with ``create_result`` under the name
    "Fields Coverage"; the comparison is delegated to
    ``assert_results_equal``.
    """
    actual = cov.check_fields_coverage(df)
    expected = create_result(
        "Fields Coverage", expected_messages, expected_stats
    )
    assert_results_equal(actual, expected)
def run_general_rules(self):
    """Run the general rules on the source items and save each result.

    Two results are saved through ``self.save_result``, in this order:

    1. ``garbage_symbols`` applied to ``self.source_items``.
    2. ``coverage_rules.check_fields_coverage`` applied to the source
       items dataframe.
    """
    garbage_result = garbage_symbols(self.source_items)
    self.save_result(garbage_result)

    coverage_result = coverage_rules.check_fields_coverage(
        self.source_items.df
    )
    self.save_result(coverage_result)