Exemple #1
0
def get_report_ru():
    """
    Build the per-region COVID-19 report for Russia from Wikipedia.

    The table is fetched with ``utils.get_wiki_table_df``, positional
    columns 1 through 4 (zero-based) of its raw values are kept and
    labelled, region names and numeric columns are cleaned with the
    ``utils`` helpers, and a constant ``country`` column is added.
    The frame is handed to ``check_report`` before being returned.

    :return: Pandas DataFrame
    """
    page_url = 'https://en.wikipedia.org/wiki/COVID-19_pandemic_in_Russia'
    # NOTE(review): the order here is confirmed / recovered / deaths;
    # presumably this mirrors the layout of the Russian table - verify
    # against the page.
    column_names = ['state', 'confirmed', 'recovered', 'deaths']
    numeric_columns = ['confirmed', 'deaths', 'recovered']

    wiki_table = utils.get_wiki_table_df(page_url, 'Per 1 million')
    report = pd.DataFrame(wiki_table.values[:, 1:5], columns=column_names)

    # Discard rows whose name is longer than 40 characters (presumably
    # notes/footer rows rather than real regions - TODO confirm).
    name_too_long = report['state'].str.len() > 40
    report.drop(report.loc[name_too_long].index, inplace=True)

    report['state'] = report['state'].apply(utils.clean_territory_name)
    report = utils.wiki_table_df_numeric_column_clean(report, numeric_columns)
    report['country'] = 'Russia'

    check_report(report)
    return report
Exemple #2
0
def get_report_us():
    """
    Build the per-state COVID-19 report for the United States from
    Wikipedia.

    The table is fetched with ``utils.get_wiki_table_df``, positional
    columns 1 through 4 (zero-based) of its raw values are kept and
    labelled state / confirmed / deaths / recovered, state names and
    numeric columns are cleaned with the ``utils`` helpers, and a
    constant ``country`` column is added. The frame is handed to
    ``check_report`` before being returned.

    :return: Pandas DataFrame
    """
    page_url = 'https://en.wikipedia.org/wiki/Timeline_of_the_COVID-19_pandemic_in_the_United_States'
    table_marker = 'COVID-19 pandemic in the United States by state and territory'
    column_names = ['state', 'confirmed', 'deaths', 'recovered']
    numeric_columns = ['confirmed', 'deaths', 'recovered']

    wiki_table = utils.get_wiki_table_df(page_url, table_marker)
    report = pd.DataFrame(wiki_table.values[:, 1:5], columns=column_names)

    # Discard rows whose name is longer than 40 characters (presumably
    # notes/footer rows rather than real states - TODO confirm).
    name_too_long = report['state'].str.len() > 40
    report.drop(report.loc[name_too_long].index, inplace=True)

    report['state'] = report['state'].apply(utils.clean_territory_name)
    report = utils.wiki_table_df_numeric_column_clean(report, numeric_columns)
    report['country'] = 'United States'

    check_report(report)
    return report
Exemple #3
0
def get_report_countries():
    """
    Build the per-country COVID-19 report from Wikipedia.

    The table is fetched with ``utils.get_wiki_table_df``, positional
    columns 1 through 4 (zero-based) of its raw values are kept and
    labelled country / confirmed / deaths / recovered. Rows with a
    missing country are removed before the names are cleaned, then rows
    whose cleaned name exceeds 40 characters are dropped. Numeric columns
    are cleaned with the ``utils`` helper and ``state`` is set to None
    for every row. The frame is handed to ``check_report`` before being
    returned.

    :return: Pandas DataFrame
    """
    page_url = 'https://en.wikipedia.org/wiki/COVID-19_pandemic_by_country_and_territory'
    column_names = ['country', 'confirmed', 'deaths', 'recovered']
    numeric_columns = ['confirmed', 'deaths', 'recovered']

    wiki_table = utils.get_wiki_table_df(page_url, 'Location[b]')
    report = pd.DataFrame(wiki_table.values[:, 1:5], columns=column_names)

    # Missing names are filtered out first so the cleaner only ever
    # receives actual values.
    has_country = report['country'].notna()
    report = report[has_country]
    report['country'] = report['country'].apply(utils.clean_territory_name)

    # Length is checked on the cleaned name; over-long entries are
    # presumably notes/footer rows rather than countries - TODO confirm.
    name_too_long = report['country'].str.len() > 40
    report.drop(report.loc[name_too_long].index, inplace=True)

    report = utils.wiki_table_df_numeric_column_clean(report, numeric_columns)
    report['state'] = None

    check_report(report)
    return report