Python Prep 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: prep_ml.pre_processor

클래스/타입: Prep

hotexamples.com에서의 예제들: 12

Python Prep - 12개의 예제를 찾았습니다. 이 예제들은 오픈소스 프로젝트에서 추출한 prep_ml.pre_processor.Prep의 실제 사용 예제 중 평가가 가장 높은 Python 예제입니다. 예제를 평가하시면 예제 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

from_dict(11)

from_json(1)

자주 사용되는 메소드들

예제 #1

0

파일 보기

파일: test_prep_ml.py 프로젝트: vi3m/prep-ml

def test_json_error():
    """Check that ``Prep.from_json`` rejects a malformed JSON document.

    The payload spells the boolean as the Python literal ``True`` instead of
    JSON ``true``, so it is not valid JSON. The test expects
    ``JSONDeserializationError`` with a message containing
    ``'Error parsing json'``.
    """
    json_ob = '''{
        "EMPLOYEE_ID": {
            "required": True
        }
    }'''
    with pytest.raises(JSONDeserializationError) as e:
        Prep.from_json(json_ob, df)
    # The message check must live outside the ``with`` block: statements
    # placed after the raising call inside the block are never executed.
    assert 'Error parsing json' in str(e.value)

예제 #2

0

파일 보기

파일: test_prep_ml.py 프로젝트: vi3m/prep-ml

def test_mapper_schema_new_key():
    """Check that a schema entry with an unrecognised key is rejected.

    ``error_ob`` carries an extra ``"some_new_key"`` field. The test expects
    ``Prep.from_dict`` to raise ``IncorrectSchemaError`` with a message
    containing ``'Unknown keys found in schema.'``.
    """
    error_ob = {
        "EMPLOYEE_ID": [{
            "required": True,
            "encoding": None,
            "alias": "EMP_ID",
            "imputation": None,
            "enforce_type": None,
            "derived_eq": None,
            "some_new_key": None
        }]
    }
    # Control call: the module-level schema must build without raising.
    Prep.from_dict(prep_ob, df)
    with pytest.raises(IncorrectSchemaError) as e:
        Prep.from_dict(error_ob, df)
    # The message check must live outside the ``with`` block: statements
    # placed after the raising call inside the block are never executed.
    assert 'Unknown keys found in schema.' in str(e.value)

예제 #3

0

파일 보기

파일: test_prep_ml.py 프로젝트: vi3m/prep-ml

def test_required_features():
    """Verify the list of required features reported after processing."""
    prep = Prep.from_dict(prep_ob, df)
    prep.get_data()
    required = prep.get_required_features()
    assert required == [
        'EMPLOYEE_ID', 'AGE', 'GENDER', 'RATING', 'DESIGNATION', 'PROMOTED'
    ]

예제 #4

0

파일 보기

파일: test_prep_ml.py 프로젝트: vi3m/prep-ml

def test_alias_features():
    """Verify the list of aliased features reported after processing."""
    prep = Prep.from_dict(prep_ob, df)
    prep.get_data()
    aliased = prep.get_alias_features()
    assert aliased == ['EMPLOYEE_ID', 'AGE']

예제 #5

0

파일 보기

파일: test_prep_ml.py 프로젝트: vi3m/prep-ml

def test_mapper_schema_failed():
    """Check that a schema whose column value is a bare string is rejected.

    The test expects ``Prep.from_dict`` to raise ``IncorrectSchemaError``
    with a message containing ``'Error with mapper schema.'``.
    """
    error_ob = {"EMPLOYEE_ID": "FAIL_VALUE"}
    # Control call: the module-level schema must build without raising.
    Prep.from_dict(prep_ob, df)
    with pytest.raises(IncorrectSchemaError) as e:
        Prep.from_dict(error_ob, df)
    # The message check must live outside the ``with`` block: statements
    # placed after the raising call inside the block are never executed.
    assert 'Error with mapper schema.' in str(e.value)

예제 #6

0

파일 보기

파일: test_prep_ml.py 프로젝트: vi3m/prep-ml

def test_imputation_process():
    """Verify the processed frame contains no null values."""
    prep = Prep.from_dict(prep_ob, df)
    processed = prep.get_data()
    has_missing = processed.isnull().values.any()
    assert not has_missing

예제 #7

0

파일 보기

파일: test_prep_ml.py 프로젝트: vi3m/prep-ml

def test_data_missing_exception():
    """Check that building a ``Prep`` without any data source fails.

    ``Prep.from_dict`` is called with the schema only. The test expects
    ``DataMissingError`` with a message containing
    ``'Missing file_path and/or dataframe.'``.
    """
    with pytest.raises(DataMissingError) as e:
        Prep.from_dict(prep_ob)
    # The message check must live outside the ``with`` block: statements
    # placed after the raising call inside the block are never executed.
    assert 'Missing file_path and/or dataframe.' in str(e.value)

예제 #8

0

파일 보기

파일: test_prep_ml.py 프로젝트: vi3m/prep-ml

def test_derived_features():
    """Verify FIRST_NAME and LAST_NAME are not both present in the output.

    The check passes as soon as at least one of the two columns is absent
    from the processed frame.
    """
    prep = Prep.from_dict(prep_ob, df)
    processed = prep.get_data()
    columns = processed.columns.tolist()
    # NOTE(review): this tolerates one of the two columns remaining; confirm
    # whether the intent was that neither column survives.
    assert any(name not in columns for name in ['FIRST_NAME', 'LAST_NAME'])

예제 #9

0

파일 보기

파일: test_prep_ml.py 프로젝트: vi3m/prep-ml

def test_derived_features():
    """Verify the list of derived features reported after processing."""
    prep = Prep.from_dict(prep_ob, df)
    prep.get_data()
    derived = prep.get_derived_features()
    assert derived == ['DOB']

예제 #10

0

파일 보기

파일: test_prep_ml.py 프로젝트: vi3m/prep-ml

def test_imputation_features():
    """Verify the list of imputed features reported after processing."""
    prep = Prep.from_dict(prep_ob, df)
    prep.get_data()
    imputed = prep.get_imputation_features()
    assert imputed == ['RATING']

예제 #11

0

파일 보기

파일: test_prep_ml.py 프로젝트: vi3m/prep-ml

def test_encode_features():
    """Verify the list of encoded features reported after processing."""
    prep = Prep.from_dict(prep_ob, df)
    prep.get_data()
    encoded = prep.get_encode_features()
    assert encoded == ['GENDER', 'DESIGNATION', 'PROMOTED']

예제 #12

0

파일 보기

        "required":
        True,
        "alias":
        "DOB",
        "derived_eq":
        "(pd.Timestamp('now') - pd.to_datetime(df.AGE, format='%m/%d/%Y')).astype('<m8[Y]')"
    },
    "GENDER": {
        "required": True,
        "encoding": 'ohe'
    },
    "RATING": {
        "required": True,
        "imputation": 'most_frequent'
    },
    "DESIGNATION": {
        "required": True,
        "encoding": 'label'
    },
    "PROMOTED": {
        "required": True,
        "encoding": 'label'
    }
}

# Read the CSV fixture into a DataFrame (path is relative to the working
# directory the script is run from).
df = pd.read_csv('tests/MOCK_DATA.csv')

# Build a Prep from the schema dict and the loaded frame, then fetch the
# processed data.
p = Prep.from_dict(prep_ob, df)
rdf = p.get_data()
# Print the resulting column names followed by the first rows for inspection.
print(rdf.columns.to_list())
print(rdf.head())