Python find_correlation示例

编程语言: Python

命名空间/包名称: morar.feature_selection

方法/功能: find_correlation

hotexamples.com的示例: 6

Python find_correlation - 共找到 6 个示例。以下是从开源项目中提取的、评价最高的 morar.feature_selection.find_correlation 真实 Python 代码示例。您可以为示例评分，以帮助我们提高示例质量。

示例#1

显示文件

文件： test_feature_selection.py 项目： jwildenhain/morar

def test_find_correlation_threshold_works():
    """Expect an empty result from find_correlation when ``threshold=1.0``.

    The frame has an integer ramp ``x``, a noisy copy of it ``y``, and an
    independent noise column ``z``.
    """
    n_rows = 1000
    ramp = range(n_rows)
    # Draw the jitter before the independent column so the random stream is
    # consumed in the same order as the data is described above.
    jitter = np.random.randn(n_rows)
    noisy_ramp = [value + eps for value, eps in zip(ramp, jitter)]
    independent = np.random.randn(n_rows)
    rows = list(zip(ramp, noisy_ramp, independent))
    frame = pd.DataFrame(rows, columns=["x", "y", "z"])
    flagged = feature_selection.find_correlation(frame, threshold=1.0)
    assert len(flagged) == 0

示例#2

显示文件

文件： test_feature_selection.py 项目： Swarchal/morar

def test_find_correlation_threshold_works():
    """Expect an empty result from find_correlation when ``threshold=1.0``.

    Columns: ``x`` is 0..999, ``y`` is ``x`` plus standard-normal noise, and
    ``z`` is standard-normal noise on its own.
    """
    size = 1000
    base = range(size)
    perturbation = np.random.randn(size)
    perturbed = [b + p for b, p in zip(base, perturbation)]
    unrelated = np.random.randn(size)
    records = list(zip(base, perturbed, unrelated))
    table = pd.DataFrame(records, columns=["x", "y", "z"])
    result = feature_selection.find_correlation(table, threshold=1.0)
    assert len(result) == 0

示例#3

显示文件

文件： test_feature_selection.py 项目： jwildenhain/morar

def test_find_correlation_large_n():
    """Check find_correlation on a 100,000-row frame with one correlated pair.

    ``y`` is ``x`` plus standard-normal noise and ``z`` is independent noise.
    The test expects exactly one entry in the result, naming ``x`` or ``y``
    and never ``z``.
    """
    x = range(100000)
    noise = np.random.randn(100000)
    y = [a + b for a, b in zip(x, noise)]
    z = np.random.randn(100000)
    df = pd.DataFrame(list(zip(x, y, z)), columns=["x", "y", "z"])
    out = feature_selection.find_correlation(df)
    assert len(out) == 1
    # `out[0] == ["x"] or ["y"]` parses as `(out[0] == ["x"]) or ["y"]`, which
    # is always truthy because a non-empty list is truthy; use a membership
    # test so the assertion can actually fail.
    # NOTE(review): assumes the result is a flat list of column-name strings
    # -- confirm against find_correlation.
    assert out[0] in ("x", "y")
    assert "z" not in out

示例#4

显示文件

文件： test_feature_selection.py 项目： jwildenhain/morar

def test_find_correlation_multiple_correlated():
    """Expect two entries, none of them ``z``, when three columns correlate.

    ``xx`` and ``y`` are both built as ``x`` plus the same noise vector;
    ``z`` is independent standard-normal noise.
    """
    n_rows = 1000
    ramp = range(n_rows)
    jitter = np.random.randn(n_rows)
    noisy_y = [value + eps for value, eps in zip(ramp, jitter)]
    noisy_xx = [value + eps for value, eps in zip(ramp, jitter)]
    independent = np.random.randn(n_rows)
    rows = list(zip(ramp, noisy_xx, noisy_y, independent))
    frame = pd.DataFrame(rows, columns=["x", "xx", "y", "z"])
    flagged = feature_selection.find_correlation(frame)
    assert len(flagged) == 2
    assert "z" not in flagged

示例#5

显示文件

文件： test_feature_selection.py 项目： Swarchal/morar

def test_find_correlation_large_n():
    """Check find_correlation on a 100,000-row frame with one correlated pair.

    ``y`` is ``x`` plus standard-normal noise and ``z`` is independent noise.
    The test expects exactly one entry in the result, naming ``x`` or ``y``
    and never ``z``.
    """
    x = range(100000)
    noise = np.random.randn(100000)
    y = [a + b for a, b in zip(x, noise)]
    z = np.random.randn(100000)
    df = pd.DataFrame(list(zip(x, y, z)), columns=["x", "y", "z"])
    out = feature_selection.find_correlation(df)
    assert len(out) == 1
    # `out[0] == ["x"] or ["y"]` parses as `(out[0] == ["x"]) or ["y"]`, which
    # is always truthy because a non-empty list is truthy; use a membership
    # test so the assertion can actually fail.
    # NOTE(review): assumes the result is a flat list of column-name strings
    # -- confirm against find_correlation.
    assert out[0] in ("x", "y")
    assert "z" not in out

示例#6

显示文件

文件： test_feature_selection.py 项目： Swarchal/morar

def test_find_correlation_multiple_correlated():
    """Expect two entries, none of them ``z``, when three columns correlate.

    Columns ``xx`` and ``y`` are each ``x`` plus the same noise vector, and
    ``z`` is separate standard-normal noise.
    """
    size = 1000
    base = range(size)
    perturbation = np.random.randn(size)
    y_values = [b + p for b, p in zip(base, perturbation)]
    xx_values = [b + p for b, p in zip(base, perturbation)]
    unrelated = np.random.randn(size)
    records = list(zip(base, xx_values, y_values, unrelated))
    table = pd.DataFrame(records, columns=["x", "xx", "y", "z"])
    result = feature_selection.find_correlation(table)
    assert len(result) == 2
    assert "z" not in result