Example #1
0
def test_scale_with_exclude_cols():
    """Check ``Scale("StandardScaler")`` with ``lbl`` listed as excluded.

    The test runs in three phases, each comparing entry ``[1]`` of the
    ``ph`` column:

    1. First call on a new stage: output columns are exactly
       ``ph, gt, lbl`` and the scaled value is below the raw one.
    2. Second call on a different frame: the result is expected to be
       larger than in phase 1 (the stage is presumed to reuse the fit
       from phase 1 -- behaviour of ``Scale`` itself is defined elsewhere).
    3. Explicit ``fit_transform`` on a fresh copy of the second frame:
       the result is expected to be smaller than in phase 2.
    """
    df = _some_df1()
    scale_stage = Scale("StandardScaler", exclude_columns=["lbl"])
    res_df = scale_stage(df)
    assert list(res_df.columns) == ["ph", "gt", "lbl"]
    assert "ph" in res_df.columns
    assert "gt" in res_df.columns
    assert res_df["ph"][1] < df["ph"][1]

    # see only transform (no fit) when already fitted
    df2 = _some_df1b()
    res_df2 = scale_stage(df2)
    assert "ph" in res_df2.columns
    assert "gt" in res_df2.columns
    # Sanity check on the fixtures: the second frame holds the larger value.
    assert df['ph'][1] < df2['ph'][1]
    assert res_df2["ph"][1] < df2["ph"][1]
    assert res_df["ph"][1] < res_df2["ph"][1]

    # check fit_transform when already fitted
    df3 = _some_df1b()
    # Refit on the fresh copy (df3), not on df2 which already went through
    # the stage above, so this phase is independent of the previous call.
    res_df3 = scale_stage.fit_transform(df3)
    assert "ph" in res_df3.columns
    assert "gt" in res_df3.columns
    assert res_df3["ph"][1] < df3["ph"][1]
    assert res_df3["ph"][1] < res_df2["ph"][1]
Example #2
0
def test_scale():
    """Check ``Scale("StandardScaler")`` across call, re-call and refit.

    Each phase compares entry ``[1]`` of the ``ph`` column:

    1. First call on a new stage: the scaled value is below the raw one.
    2. Second call on a different frame: the result is expected to be
       larger than in phase 1 (the stage is presumed to reuse the fit
       from phase 1 -- behaviour of ``Scale`` itself is defined elsewhere).
    3. Explicit ``fit_transform`` on a fresh copy of the second frame:
       the result is expected to be smaller than in phase 2.
    """
    df = _some_df2()
    scale_stage = Scale("StandardScaler")
    res_df = scale_stage(df)
    assert 'ph' in res_df.columns
    assert 'gt' in res_df.columns
    assert res_df['ph'][1] < df['ph'][1]

    # see only transform (no fit) when already fitted
    df2 = _some_df2b()
    res_df2 = scale_stage(df2)
    assert 'ph' in res_df2.columns
    assert 'gt' in res_df2.columns
    assert res_df2['ph'][1] < df2['ph'][1]
    assert res_df['ph'][1] < res_df2['ph'][1]

    # check fit_transform when already fitted
    df3 = _some_df2b()
    # Refit on the fresh copy (df3), not on df2 which already went through
    # the stage above, so this phase is independent of the previous call.
    res_df3 = scale_stage.fit_transform(df3)
    assert 'ph' in res_df3.columns
    assert 'gt' in res_df3.columns
    assert res_df3['ph'][1] < df3['ph'][1]
    assert res_df3['ph'][1] < res_df2['ph'][1]
Example #3
0
def test_scale_with_exclude_cols():
    """Check ``Scale("StandardScaler")`` with ``lbl`` excluded and ``exmsg`` set.

    Each phase compares entry ``[1]`` of the ``ph`` column:

    1. First call on a new stage: output columns are exactly
       ``ph, gt, lbl`` and the scaled value is below the raw one.
    2. Second call on a different frame: the result is expected to be
       larger than in phase 1 (the stage is presumed to reuse the fit
       from phase 1 -- behaviour of ``Scale`` itself is defined elsewhere).
    3. Explicit ``fit_transform`` on a fresh copy of the second frame:
       the result is expected to be smaller than in phase 2.
    """
    df = _some_df1()
    scale_stage = Scale("StandardScaler", exclude_columns=['lbl'], exmsg='AA')
    res_df = scale_stage(df)
    assert list(res_df.columns) == ['ph', 'gt', 'lbl']
    assert 'ph' in res_df.columns
    assert 'gt' in res_df.columns
    assert res_df['ph'][1] < df['ph'][1]

    # see only transform (no fit) when already fitted
    df2 = _some_df1b()
    res_df2 = scale_stage(df2)
    assert 'ph' in res_df2.columns
    assert 'gt' in res_df2.columns
    assert res_df2['ph'][1] < df2['ph'][1]
    assert res_df['ph'][1] < res_df2['ph'][1]

    # check fit_transform when already fitted
    df3 = _some_df1b()
    # Refit on the fresh copy (df3), not on df2 which already went through
    # the stage above, so this phase is independent of the previous call.
    res_df3 = scale_stage.fit_transform(df3)
    assert 'ph' in res_df3.columns
    assert 'gt' in res_df3.columns
    assert res_df3['ph'][1] < df3['ph'][1]
    assert res_df3['ph'][1] < res_df2['ph'][1]