Exemple #1
0
def test_df_stability_report_expanding():
    """Smoke-test report generation with ``reference_type="expanding"``.

    No assertions are made; the test passes when the call does not raise.
    """
    report_options = {
        "time_axis": "date",
        "reference_type": "expanding",
        "features": ["date:isActive", "date:eyeColor"],
    }
    # build the report straight from the dataframe held on pytest.test_df
    df_stability_report(pytest.test_df, **report_options)
Exemple #2
0
def test_df_stability_report_rolling():
    """Smoke-test report generation with ``reference_type="rolling"``.

    No assertions are made; the test passes when the call does not raise.
    """
    selected_features = ["date:isActive", "date:latitude"]
    input_df = pytest.test_df

    # the report is produced directly from the dataframe
    df_stability_report(
        input_df,
        time_axis="date",
        reference_type="rolling",
        features=selected_features,
    )
Exemple #3
0
def test_df_stability_report_external():
    """Smoke-test report generation with ``reference_type="external"``.

    The same dataframe (``pytest.test_df``) is passed both as the input and
    as the external reference. No assertions are made; the test passes when
    the call does not raise.
    """
    report_options = {
        "time_axis": "date",
        "reference_type": "external",
        "features": ["date:eyeColor", "date:latitude"],
    }
    # the report is produced directly from the dataframe
    df_stability_report(
        pytest.test_df, reference=pytest.test_df, **report_options
    )
Exemple #4
0
def test_df_stability_report_self():
    """Check that ``time_width``/``time_offset`` end up in the bin specs.

    A report is generated with ``reference_type="self"`` and the first bin
    specification of every requested feature is compared against the
    requested width and offset.
    """
    time_width = "1y"
    time_offset = "2020-1-1"
    features = ["date:eyeColor", "date:latitude"]
    # snapshot the names up front so the checks below use exactly these keys
    checked_features = tuple(features)

    # generate report directly from dataframe
    report = df_stability_report(
        pytest.test_df,
        time_axis="date",
        reference_type="self",
        features=features,
        time_width=time_width,
        time_offset=time_offset,
    )

    # pull the binning specifications out of the histograms in the datastore
    bin_specs = get_bin_specs(report.datastore["hists"])

    # NOTE(review): recent pandas releases reject the ambiguous "y" unit in
    # pd.Timedelta -- confirm against the pandas version this suite targets.
    expected_width = pd.Timedelta(time_width).value
    expected_offset = pd.Timestamp(time_offset).value

    # test that time_width and time_offset got picked up correctly.
    for feature_name in checked_features:
        first_axis_spec = bin_specs[feature_name][0]
        assert expected_width == first_axis_spec["bin_width"]
        assert expected_offset == first_axis_spec["bin_offset"]
Exemple #5
0
def test_df_stability_report():
    """Generate a report with explicit bin specs, then regenerate it twice.

    No assertions are made; the test passes when report generation and both
    ``regenerate`` calls complete without raising.
    """
    features = ['date:isActive', 'date:eyeColor', 'date:latitude']

    # NOTE(review): recent pandas releases reject the ambiguous "y" unit in
    # pd.Timedelta -- confirm against the pandas version this suite targets.
    date_spec = {
        'bin_width': pd.Timedelta('1y').value,
        'bin_offset': pd.Timestamp('2000-1-1').value,
    }
    latitude_spec = {'bin_width': 5., 'bin_offset': 0.}
    bin_specs = {'date': date_spec, 'latitude': latitude_spec}

    # generate report directly from dataframe
    report = df_stability_report(
        pytest.test_df,
        time_axis='date',
        features=features,
        binning='unit',
        bin_specs=bin_specs,
    )

    # regenerate report, changing the plot window settings
    for window_settings in ({'last_n': 4}, {'skip_first_n': 1, 'skip_last_n': 1}):
        report.regenerate(**window_settings)
Exemple #6
0
def test_df_stability_report_self():
    """Verify the requested time binning is reflected in the bin specs.

    Builds a report with ``reference_type='self'`` and asserts that the first
    bin specification of each feature carries the requested ``time_width``
    and ``time_offset``.
    """
    time_width = '1y'
    time_offset = '2020-1-1'
    features = ['date:eyeColor', 'date:latitude']
    # keep an independent copy of the names for the assertions below
    names_to_check = tuple(features)

    # generate report directly from dataframe
    report_options = {
        'time_axis': 'date',
        'reference_type': 'self',
        'features': features,
        'time_width': time_width,
        'time_offset': time_offset,
    }
    report = df_stability_report(pytest.test_df, **report_options)

    # test that time_width and time_offset got picked up correctly.
    histograms = report.datastore['hists']
    bin_specs = get_bin_specs(histograms)

    # NOTE(review): recent pandas releases reject the ambiguous "y" unit in
    # pd.Timedelta -- confirm against the pandas version this suite targets.
    width_ns = pd.Timedelta(time_width).value
    offset_ns = pd.Timestamp(time_offset).value

    for name in names_to_check:
        time_axis_spec = bin_specs[name][0]
        assert width_ns == time_axis_spec['bin_width']
        assert offset_ns == time_axis_spec['bin_offset']
Exemple #7
0
def test_df_stability_report():
    """Build a report with user-supplied bin specs and regenerate it.

    No assertions are made; the test passes when report generation and the
    two ``regenerate`` calls finish without raising.
    """
    features = ["date:isActive", "date:eyeColor", "date:latitude"]

    # NOTE(review): recent pandas releases reject the ambiguous "y" unit in
    # pd.Timedelta -- confirm against the pandas version this suite targets.
    year_width = pd.Timedelta("1y").value
    date_origin = pd.Timestamp("2000-1-1").value
    bin_specs = {
        "date": {"bin_width": year_width, "bin_offset": date_origin},
        "latitude": {"bin_width": 5.0, "bin_offset": 0.0},
    }

    # generate report directly from dataframe
    report_options = {
        "time_axis": "date",
        "features": features,
        "binning": "unit",
        "bin_specs": bin_specs,
    }
    report = df_stability_report(pytest.test_df, **report_options)

    # regenerate report, changing the plot window settings
    report.regenerate(last_n=4)
    report.regenerate(skip_first_n=1, skip_last_n=1)
Exemple #8
0
def test_df_stability_report_expanding():
    """Smoke-test report generation with ``reference_type='expanding'``.

    No assertions are made; the test passes when the call does not raise.
    """
    selected_features = ['date:isActive', 'date:eyeColor']

    # the report is produced directly from the dataframe
    df_stability_report(
        pytest.test_df,
        time_axis='date',
        reference_type='expanding',
        features=selected_features,
    )
Exemple #9
0
def test_df_stability_report_rolling():
    """Smoke-test report generation with ``reference_type='rolling'``.

    No assertions are made; the test passes when the call does not raise.
    """
    report_options = {
        'time_axis': 'date',
        'reference_type': 'rolling',
        'features': ['date:isActive', 'date:latitude'],
    }
    # build the report straight from the dataframe held on pytest.test_df
    df_stability_report(pytest.test_df, **report_options)
Exemple #10
0
def test_df_stability_report_external():
    """Smoke-test report generation with ``reference_type='external'``.

    ``pytest.test_df`` serves as both the input dataframe and the external
    reference. No assertions are made; the test passes when the call does
    not raise.
    """
    selected_features = ['date:eyeColor', 'date:latitude']

    # the report is produced directly from the dataframe
    df_stability_report(
        pytest.test_df,
        time_axis='date',
        reference_type='external',
        reference=pytest.test_df,
        features=selected_features,
    )