Python LabelEncoder.transform 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: cuml.dask.preprocessing.LabelEncoder

클래스/타입: LabelEncoder

메소드/함수: transform

hotexamples.com에서의 예제들: 4

Python LabelEncoder.transform - 4개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python cuml.dask.preprocessing.LabelEncoder.LabelEncoder.transform의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

LabelEncoder(7)

transform(4)

fit(2)

fit_transform(2)

inverse_transform(2)

예제 #1

파일 보기

def test_labelencoder_unfitted(client):
    """Check that ``transform`` on an unfitted encoder raises NotFittedError.

    The input is a series of 10 random integers drawn from ``range(10)``,
    split into one partition per entry reported by ``client.has_what()``.
    """
    values = cudf.Series(np.random.choice(10, (10, )))
    n_parts = len(client.has_what())
    df = dask_cudf.from_cudf(values, npartitions=n_parts)

    # No call to fit() on purpose: the encoder has learned nothing yet.
    encoder = LabelEncoder()
    with pytest.raises(NotFittedError):
        encoder.transform(df).compute()

예제 #2

파일 보기

def test_unfitted_inverse_transform(client):
    """Check ``inverse_transform`` raises NotFittedError when unfitted.

    The input is a series of 10 random integers drawn from ``range(10)``,
    split into one partition per entry reported by ``client.has_what()``.
    """
    tmp = cudf.Series(np.random.choice(10, (10, )))
    df = dask_cudf.from_cudf(tmp, npartitions=len(client.has_what()))
    le = LabelEncoder()

    # Call inverse_transform (not transform): this test exists to cover the
    # decoding path; the unfitted transform() case has its own test.
    with pytest.raises(NotFittedError):
        le.inverse_transform(df)

예제 #3

파일 보기

def test_labelencoder_unseen(client):
    """Check that encoding values absent during fitting raises KeyError.

    The encoder is fitted on 10 random integers drawn from ``range(10)``
    and then asked to encode ``-100`` and ``-120``, which cannot be among
    the fitted values.
    """
    df = dask_cudf.from_cudf(cudf.Series(np.random.choice(10, (10, ))),
                             npartitions=len(client.has_what()))
    le = LabelEncoder().fit(df)
    assert le._fitted

    # Build the unseen input outside the raises block so that only the
    # transform call itself can satisfy the expected KeyError.
    tmp = dask_cudf.from_cudf(cudf.Series([-100, -120]),
                              npartitions=len(client.has_what()))
    with pytest.raises(KeyError):
        le.transform(tmp).compute()

예제 #4

파일 보기

def test_labelencoder_transform(length, cardinality, client):
    """Fit an encoder on random data and compare input with encoded output.

    A series of ``length`` integers drawn from ``range(cardinality)`` is
    fitted and then encoded in full. Both the original and the encoded
    values are passed through ``_arr_to_similarity_mat`` (defined outside
    this block), and the element-wise equality pattern of each matrix
    against its own transpose must be identical for the two.
    """
    source = cudf.Series(np.random.choice(cardinality, (length, )))
    n_parts = len(client.has_what())
    df = dask_cudf.from_cudf(source, npartitions=n_parts)

    le = LabelEncoder().fit(df)
    assert le._fitted

    encoded = le.transform(df)

    original_mat = _arr_to_similarity_mat(df.compute().to_numpy())
    encoded_host = cp.asnumpy(encoded.compute().to_numpy())
    encoded_mat = _arr_to_similarity_mat(encoded_host)

    equal_in_encoded = encoded_mat == encoded_mat.T
    equal_in_original = original_mat == original_mat.T
    assert (equal_in_encoded == equal_in_original).all()