예제 #1
0
def test_fit_callable_distance(df):
    clusterer = KMeansClusterer()

    def dist(u, v):
        return 1

    clusterer.fit(df, distance=dist)
예제 #2
0
def test_predict_series(df):
    clusterer = KMeansClusterer()
    clusterer.fit(df)
    new = {'feature1': 2, 'feature2': 2}
    series = pd.Series(data=new)
    clusterer.predict(series)
예제 #3
0
def test_predict_dataframe(df):
    clusterer = KMeansClusterer()
    clusterer.fit(df)
    new = {'feature1': [2], 'feature2': [2]}
    dataframe = pd.DataFrame(data=new)
    clusterer.predict(dataframe)
예제 #4
0
def test_predict_featuresets(df):
    clusterer = KMeansClusterer()
    clusterer.fit(df)
    new = [{'feature1': 2, 'feature2': 2}]
    clusterer.predict(new)
예제 #5
0
def test_predict_dict(df):
    clusterer = KMeansClusterer()
    clusterer.fit(df)
    new = {'feature1': 2, 'feature2': 2}
    clusterer.predict(new)
예제 #6
0
def test_fit_bad_max_iter(df):
    clusterer = KMeansClusterer()
    with pytest.raises(ValueError):
        clusterer.fit(df, max_iter=0)
예제 #7
0
def test_fit_bad_distance(df):
    clusterer = KMeansClusterer()
    with pytest.raises(TypeError):
        clusterer.fit(df, distance=1)
예제 #8
0
def test_fit_bad_data():
    data = [1, 0]
    clusterer = KMeansClusterer()
    with pytest.raises(TypeError):
        clusterer.fit(data)
예제 #9
0
def test_fit_dataframe(df):
    clusterer = KMeansClusterer()
    clusterer.fit(df)
예제 #10
0
def test_fit_tolerance():
    data = pd.DataFrame(data={'feature': [1]})
    clusterer = KMeansClusterer()
    clusterer.fit(data)
예제 #11
0
def test_fit_featureset():
    data = [{'feature1': 2, 'feature2': 3}, {'feature1': 7, 'feature2': 6}]
    clusterer = KMeansClusterer()
    clusterer.fit(data)
예제 #12
0
def test_inertia(df):
    clusterer = KMeansClusterer()
    clusterer.fit(df)
    assert isinstance(clusterer.inertia(), float)
예제 #13
0
def test_get_features(df):
    clusterer = KMeansClusterer()
    clusterer.fit(df)
    assert clusterer.get_features() == ['feature1', 'feature2']
예제 #14
0
def test_predict_bad_input_value(df):
    clusterer = KMeansClusterer()
    clusterer.fit(df)
    with pytest.raises(ValueError):
        clusterer.predict(pd.Series([0, 1, 2]))
예제 #15
0
def test_predict_bad_input_type(df):
    clusterer = KMeansClusterer()
    clusterer.fit(df)
    with pytest.raises(TypeError):
        clusterer.predict([0, 1])