Python Checkの例

プログラミング言語: Python

名前空間/パッケージ名: cognito.check

クラス/型: Check

hotexamples.comのコード掲載数: 27

Python Check - 27件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたPythonのcognito.check.Checkの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示 / 非表示

Check(24)

ignore_identifier(4)

is_outlier(4)

encoding_categorical(3)

percentage_missing(3)

remove_columns(3)

remove_records(3)

is_categorical(2)

is_discrete(2)

is_missing(2)

is_continuous(1)

is_identifier(1)

is_working(1)

コード例 #1

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_ignore_identifier_1():
    """Check the columns left by ``ignore_identifier`` on Freedman.csv."""
    data_dir = os.path.join(os.path.dirname(__file__), 'data')
    frame = pd.read_csv(os.path.join(data_dir, 'Freedman.csv'))
    checker = Check()
    remaining = checker.ignore_identifier(frame)
    # The expected list does not contain 'Location'.
    expected_columns = ['population', 'nonwhite', 'density', 'crime']
    assert list(remaining.columns) == expected_columns

コード例 #2

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_remove_columns_1():
    """Check the columns returned by ``remove_columns`` on Freedman.csv."""
    data_dir = os.path.join(os.path.dirname(__file__), 'data')
    frame = pd.read_csv(os.path.join(data_dir, 'Freedman.csv'))
    checker = Check()
    result = checker.remove_columns(frame)
    expected_columns = [
        'Location',
        'population',
        'nonwhite',
        'density',
        'crime',
    ]
    assert list(result.columns) == expected_columns

コード例 #3

ファイルを表示

ファイル: test_modules.py プロジェクト: AishikaBanik98/cognito

def test_remove_records():
    """Compare ``remove_records`` output on Freedman.csv with a stored CSV.

    The result of ``Check.remove_records`` is compared via ``.equals``
    against ``Freedman_remove_records.csv`` from the same data directory.
    """
    data_dir = os.path.join(os.path.dirname(__file__), 'data')
    df = pd.read_csv(os.path.join(data_dir, 'Freedman.csv'))
    expected = pd.read_csv(
        os.path.join(data_dir, 'Freedman_remove_records.csv'))
    check = Check()
    # ``.equals`` already yields a boolean, so assert it directly instead of
    # comparing the result with ``True``.
    assert check.remove_records(df).equals(expected)

コード例 #4

ファイルを表示

ファイル: test_modules.py プロジェクト: AishikaBanik98/cognito

def test_ignore_identifier_2():
    """Assert ``ignore_identifier`` on vgsales.csv differs from a stored CSV.

    The result of ``Check.ignore_identifier`` is compared via ``.equals``
    against ``vgsales_ignore_identifier.csv``; the test passes when the two
    are NOT equal.
    """
    data_dir = os.path.join(os.path.dirname(__file__), 'data')
    df = pd.read_csv(os.path.join(data_dir, 'vgsales.csv'))
    reference = pd.read_csv(
        os.path.join(data_dir, 'vgsales_ignore_identifier.csv'))
    check = Check()
    # ``.equals`` already yields a boolean, so negate it directly instead of
    # comparing the result with ``False``.
    # NOTE(review): asserting inequality with the reference file looks
    # unusual - confirm this is the intended expectation.
    assert not check.ignore_identifier(df).equals(reference)

コード例 #5

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_ignore_identifier_2():
    """Check the columns left by ``ignore_identifier`` on msleep_ggplot.csv."""
    data_dir = os.path.join(os.path.dirname(__file__), 'data')
    frame = pd.read_csv(os.path.join(data_dir, 'msleep_ggplot.csv'))
    checker = Check()
    remaining = checker.ignore_identifier(frame)
    expected_columns = [
        'genus',
        'vore',
        'order',
        'conservation',
        'sleep_total',
        'sleep_rem',
        'sleep_cycle',
        'awake',
        'brainwt',
        'bodywt',
    ]
    assert list(remaining.columns) == expected_columns

コード例 #6

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_encoding_categorical_2():
    """Check ``encoding_categorical`` on the 'sex' column of student.csv.

    The expected value is a pair: a list of integer codes and a mapping from
    code to label.
    """
    checker = Check()
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'student.csv')
    frame = pd.read_csv(csv_path)
    expected_codes = [0, 0, 0, 0, 0, 1, 1, 0]
    # NOTE(review): both codes map to 'F' in the expected mapping - confirm
    # this matches the intended behaviour of encoding_categorical.
    expected_labels = {0: 'F', 1: 'F'}
    encoded = checker.encoding_categorical(frame['sex'])
    assert encoded == (expected_codes, expected_labels)

コード例 #7

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_encoding_categorical_1():
    """Check ``encoding_categorical`` on the 'mfr' column of cereal.csv.

    The expected value is a pair: a list of integer codes and a mapping from
    code to label.
    """
    checker = Check()
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'cereal.csv')
    frame = pd.read_csv(csv_path)
    expected_codes = [1, 2, 0, 0, 3, 1]
    expected_labels = {1: 'Q', 2: 'K', 0: 'N', 3: 'K'}
    encoded = checker.encoding_categorical(frame['mfr'])
    assert encoded == (expected_codes, expected_labels)

コード例 #8

ファイルを表示

ファイル: test_modules.py プロジェクト: AishikaBanik98/cognito

def test_is_categorical():
    """Assert that ``is_categorical`` reports True for Freedman's 'Location'.

    :raises AssertionError: if the comparison with ``True`` fails.
    """
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'Freedman.csv')
    frame = pd.read_csv(csv_path)
    checker = Check()
    verdict = checker.is_categorical(frame['Location'])
    assert verdict == True

コード例 #9

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_encoding_categorical_3():
    """Check ``encoding_categorical`` on the 'Mjob' column of student.csv.

    The expected value is a pair: a list of integer codes and a mapping from
    code to label.
    """
    checker = Check()
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'student.csv')
    frame = pd.read_csv(csv_path)
    expected_codes = [0, 0, 0, 1, 2, 3, 2, 2]
    # NOTE(review): codes 0, 1 and 2 all map to 'at_home' in the expected
    # mapping - confirm this matches the intended behaviour.
    expected_labels = {
        0: 'at_home',
        1: 'at_home',
        2: 'at_home',
        3: 'health',
    }
    encoded = checker.encoding_categorical(frame['Mjob'])
    assert encoded == (expected_codes, expected_labels)

コード例 #10

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_is_outlier_2():
    """Expect ``Check.is_outlier`` to return an empty list with argument 5."""
    series = pd.Series([
        322, 322, 336, 345, 351, 370, 390, 404,
        409, 411, 436, 437, -7, 80000000, 789654123, 0,
    ])
    # is_outlier is called on the class itself, not on an instance.
    found = Check.is_outlier(series, 5)
    assert found == []

コード例 #11

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_is_outlier_6():
    """Expect ``Check.is_outlier`` to return an empty list with argument 5."""
    series = pd.Series([
        30, 171, 184, 201, 212, 250, 265, 270,
        272, 289, 305, 306, 100000, 8, 5, 2000,
    ])
    # is_outlier is called on the class itself, not on an instance.
    found = Check.is_outlier(series, 5)
    assert found == []

コード例 #12

ファイルを表示

def test_percentage_missing():
    """Check the per-column result of ``percentage_missing`` on vgsales.csv."""
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'vgsales.csv')
    frame = pd.read_csv(csv_path)
    checker = Check()
    report = checker.percentage_missing(frame)
    # Only 'Year' and 'Publisher' carry a non-zero expected value.
    expected_report = {
        'Rank': 0.0,
        'Name': 0.0,
        'Platform': 0.0,
        'Year': 1.63,
        'Genre': 0.0,
        'Publisher': 0.35,
        'NA_Sales': 0.0,
        'EU_Sales': 0.0,
        'JP_Sales': 0.0,
        'Other_Sales': 0.0,
        'Global_Sales': 0.0,
    }
    assert report == expected_report

コード例 #13

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_is_discrete_1():
    """Assert that ``is_discrete`` reports True for Freedman's 'crime'."""
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'Freedman.csv')
    frame = pd.read_csv(csv_path)
    checker = Check()
    verdict = checker.is_discrete(frame['crime'])
    assert verdict == True

コード例 #14

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_is_continuous_2():
    """Assert that ``is_continuous`` reports True for Freedman's 'population'."""
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'Freedman.csv')
    frame = pd.read_csv(csv_path)
    checker = Check()
    verdict = checker.is_continuous(frame['population'])
    assert verdict == True

コード例 #15

ファイルを表示

def test_remove_records_2():
    """Expect ``remove_records`` on msleep_ggplot.csv to have length 61."""
    data_dir = os.path.join(os.path.dirname(__file__), 'data')
    frame = pd.read_csv(os.path.join(data_dir, 'msleep_ggplot.csv'))
    checker = Check()
    kept = checker.remove_records(frame)
    assert len(kept) == 61

コード例 #16

ファイルを表示

ファイル: test_modules.py プロジェクト: AishikaBanik98/cognito

def test_ignore_identifier_3():
    """Print the result of ``ignore_identifier`` on msleep_ggplot.csv."""
    data_dir = os.path.join(os.path.dirname(__file__), 'data')
    frame = pd.read_csv(os.path.join(data_dir, 'msleep_ggplot.csv'))
    checker = Check()
    # NOTE(review): nothing is asserted here; the result is only printed.
    remaining = checker.ignore_identifier(frame)
    print(remaining)

コード例 #17

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_remove_records_1():
    """Expect ``remove_records`` on Freedman.csv to have length 110."""
    data_dir = os.path.join(os.path.dirname(__file__), 'data')
    frame = pd.read_csv(os.path.join(data_dir, 'Freedman.csv'))
    checker = Check()
    kept = checker.remove_records(frame)
    assert len(kept) == 110

コード例 #18

ファイルを表示

ファイル: test_modules.py プロジェクト: AishikaBanik98/cognito

def test_is_outlier():
    """Print ``is_outlier`` for Freedman's 'crime' column with argument 3."""
    data_dir = os.path.join(os.path.dirname(__file__), 'data')
    frame = pd.read_csv(os.path.join(data_dir, 'Freedman.csv'))
    checker = Check()
    # NOTE(review): nothing is asserted here; the result is only printed.
    found = checker.is_outlier(frame['crime'], 3)
    print(found)

コード例 #19

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_is_outlier_4():
    """Expect ``Check.is_outlier`` with argument 2 to return ``[22005]``."""
    series = pd.Series(
        [4551, 7875, 931, 1322, 7795, 22005, 78, 95, 9874, 12365])
    # is_outlier is called on the class itself, not on an instance.
    found = Check.is_outlier(series, 2)
    assert found == [22005]

コード例 #20

ファイルを表示

def test_percentage_missing_2():
    """Check the per-column result of ``percentage_missing`` on msleep_ggplot.csv."""
    data_dir = os.path.join(os.path.dirname(__file__), 'data')
    frame = pd.read_csv(os.path.join(data_dir, 'msleep_ggplot.csv'))
    checker = Check()
    report = checker.percentage_missing(frame)
    expected_report = {
        'name': 0.0,
        'genus': 0.0,
        'vore': 8.43,
        'order': 0.0,
        'conservation': 34.94,
        'sleep_total': 0.0,
        'sleep_rem': 26.51,
        'sleep_cycle': 61.45,
        'awake': 0.0,
        'brainwt': 32.53,
        'bodywt': 0.0,
    }
    assert report == expected_report

コード例 #21

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_is_missing_3():
    """Assert that ``is_missing`` does not equal True for Freedman's 'nonwhite'."""
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'Freedman.csv')
    frame = pd.read_csv(csv_path)
    checker = Check()
    verdict = checker.is_missing(frame['nonwhite'])
    assert verdict != True

コード例 #22

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_is_discrete_3():
    """Assert that ``is_discrete`` reports False for Freedman's 'Location'."""
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'Freedman.csv')
    frame = pd.read_csv(csv_path)
    checker = Check()
    verdict = checker.is_discrete(frame['Location'])
    assert verdict == False

コード例 #23

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_is_working():
    """Print whatever ``is_working`` returns for a fresh ``Check`` instance."""
    checker = Check()
    # NOTE(review): nothing is asserted here; the value is only printed.
    status = checker.is_working()
    print(status)

コード例 #24

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_is_identifier_3():
    """Assert that ``is_identifier`` reports False for Freedman's 'nonwhite'."""
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'Freedman.csv')
    frame = pd.read_csv(csv_path)
    checker = Check()
    verdict = checker.is_identifier(frame['nonwhite'])
    assert verdict == False

コード例 #25

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_is_categorical_1():
    """Assert that ``is_categorical`` reports True for Freedman's 'Location'."""
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'Freedman.csv')
    frame = pd.read_csv(csv_path)
    checker = Check()
    verdict = checker.is_categorical(frame['Location'])
    assert verdict == True

コード例 #26

ファイルを表示

ファイル: test_modules.py プロジェクト: vandana-11/cognito

def test_is_missing_4():
    """Assert that ``is_missing`` reports True for Freedman's 'density'."""
    csv_path = os.path.join(os.path.dirname(__file__), 'data', 'Freedman.csv')
    frame = pd.read_csv(csv_path)
    checker = Check()
    verdict = checker.is_missing(frame['density'])
    assert verdict == True

コード例 #27

ファイルを表示

def test_percentage_missing_1():
    """Check the per-column result of ``percentage_missing`` on Freedman.csv."""
    data_dir = os.path.join(os.path.dirname(__file__), 'data')
    frame = pd.read_csv(os.path.join(data_dir, 'Freedman.csv'))
    checker = Check()
    report = checker.percentage_missing(frame)
    # 'population' and 'density' share the same non-zero expected value.
    expected_report = {
        'Location': 0.0,
        'population': 9.09,
        'nonwhite': 0.0,
        'density': 9.09,
        'crime': 0.0,
    }
    assert report == expected_report