def write_local_files_debug(self):
        """Fetch the ACS tables and dump each one next to the current
           working directory as `table_<name>.csv` and `table_<name>.json`.

           Debugging/convenience helper only; do not call this from
           production code paths."""
        acs_url = self.base_acs_url
        by_county = self.county_level

        var_map = parse_acs_metadata(
            fetch_acs_metadata(acs_url), list(GROUPS.keys()))

        # Raw JSON for the Hispanic-by-race group is fetched up front and
        # converted to a frame only after the sex-by-age groups are loaded.
        hisp_race_json = fetch_acs_group(
            acs_url, HISPANIC_BY_RACE_CONCEPT, var_map, 2, by_county)

        # One typed frame per sex-by-age concept, keyed by the concept.
        sex_by_age_frames = {
            concept: update_col_types(
                gcs_to_bq_util.values_json_to_dataframe(
                    fetch_acs_group(acs_url, concept, var_map, 2, by_county)))
            for concept in SEX_BY_AGE_CONCEPTS_TO_RACE
        }

        hisp_race_frame = update_col_types(
            gcs_to_bq_util.values_json_to_dataframe(hisp_race_json))
        hisp_race_vars = get_vars_for_group(
            HISPANIC_BY_RACE_CONCEPT, var_map, 2)
        hisp_race_frame = standardize_frame(
            hisp_race_frame, hisp_race_vars, [HISPANIC_COL, RACE_COL],
            self.county_level, POPULATION_COL)

        # Table name -> frame for every table this helper writes out.
        race_table = self.get_table_name_by_race()
        race_frame = self.get_all_races_frame(hisp_race_frame)
        sex_age_race_table = self.get_table_name_by_sex_age_race()
        sex_age_race_frame = self.get_sex_by_age_and_race(
            var_map, sex_by_age_frames)
        tables = {
            race_table: race_frame,
            sex_age_race_table: sex_age_race_frame,
        }

        for table_name, table_frame in tables.items():
            file_stem = "table_" + table_name
            table_frame.to_csv(file_stem + ".csv", index=False)
            table_frame.to_json(file_stem + ".json", orient="records")
예제 #2
0
    def testStandarizeFrameTwoDims(self):
        """Checks that standardize_frame, applied to the fake sex-by-age
        data with the "sex" and "age" columns, yields the expected frame."""
        requested_groups = ["B02001", "B01001"]
        var_map = census.parse_acs_metadata(
            self._fake_metadata, requested_groups)
        sex_by_age_vars = census.get_vars_for_group("SEX BY AGE", var_map, 2)

        # Build the input frame from the fixture and run it through the
        # function under test.
        raw_json = json.dumps(self._fake_sex_by_age_data)
        actual = census.standardize_frame(
            gcs_to_bq_util.values_json_to_dataframe(raw_json),
            sex_by_age_vars, ["sex", "age"], False, "population")

        # The expected frame goes through the same JSON loader, then gets a
        # fresh index before the comparison.
        expected_json = json.dumps(self._expected_sex_by_age_data)
        expected = gcs_to_bq_util.values_json_to_dataframe(expected_json)
        expected = expected.reset_index(drop=True)

        assert_frame_equal(expected, actual)