def test_translated_statistic_overview_table(): untranslated_statistics = get_statistics( stat_meta_data_provider=StatisticsSchemaJsonMetaDataProvider() ) translated_statistics = get_statistics( stat_meta_data_provider=StatisticsSchemaJsonMetaDataProvider(), target_language="en", translation_provider=SchemaTranslationProvider(), ) assert untranslated_statistics.shape == translated_statistics.shape assert not untranslated_statistics.equals(translated_statistics)
def translate_schema_to_target_language( target_language: str, translation_provider: TranslationProvider): metadata_provider = StatisticsSchemaJsonMetaDataProvider() statistic_descriptions = metadata_provider.get_stat_descriptions() translation_dictionary: Dict = dict() for source_texts in statistic_descriptions.values(): for source_text in source_texts: if source_text not in translation_dictionary: translated_text = translation_provider.translate_from_german( source_text, target_language) translation_dictionary[source_text] = translated_text time.sleep(sleep_duration_between_requests_in_seconds) return {target_language: translation_dictionary}
def test_get_query_specific_enum_meta(): field_type_list = [ ("id", "String"), ("name", "String"), ("WAHL09", "WAHL09"), ("PART04", "PART04"), ("year", "Int"), ("value", "Float"), ] query_stat_meta = StatisticsSchemaJsonMetaDataProvider( ).get_query_enum_meta(field_type_list) expected_stat_meta = { "PART04": dict([ ("AFD", "AfD"), ("B90_GRUENE", "GRÜNE"), ("CDU", "CDU/CSU"), ("DIELINKE", "DIE LINKE"), ("FDP", "FDP"), ("SONSTIGE", "Sonstige Parteien"), ("SPD", "SPD"), ("GESAMT", "Gesamt"), ]) } print(query_stat_meta, expected_stat_meta) assert query_stat_meta == expected_stat_meta
def test_statistic_overview_table(): stats = get_statistics( stat_meta_data_provider=StatisticsSchemaJsonMetaDataProvider() ) assert isinstance(stats, pd.DataFrame) assert stats.index.name == "statistic" assert list(stats.columns) == ["short_description", "long_description"] assert stats.shape[0] > 400
def test_get_query_specific_stat_meta(): field_type_list = [ ("id", "String"), ("name", "String"), ("WAHL09", "WAHL09"), ("PART04", "PART04"), ("year", "Int"), ("value", "Float"), ] query_stat_meta = StatisticsSchemaJsonMetaDataProvider( ).get_query_stat_meta(field_type_list) expected_stat_meta = {"WAHL09": "Gültige Zweitstimmen"} assert query_stat_meta == expected_stat_meta