Python Series.from_categoricalの例

プログラミング言語: Python

名前空間/パッケージ名: cudf.dataframe

クラス/型: Series

メソッド/関数: from_categorical

hotexamples.comのコード掲載数: 6

Python Series.from_categorical - 6件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたPythonのcudf.dataframe.Series.from_categoricalの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示 / 非表示

Series(30)

from_pandas(16)

astype(16)

to_array(15)

from_masked_array(11)

quantile(6)

from_categorical(6)

replace(5)

fillna(4)

groupby(4)

ceil(3)

_concat(3)

to_pandas(2)

set_mask(2)

sum(1)

sum_of_squares(1)

sort_values(1)

scale(1)

std(1)

min(1)

product(1)

nunique(1)

nsmallest(1)

nlargest(1)

max(1)

floor(1)

argsort(1)

applymap(1)

append(1)

abs(1)

unique(1)

コード例 #1

ファイルを表示

ファイル: test_categorical.py プロジェクト: yongsheng268/rapidsai-cudf

def test_categorical_set_categories():
    """Compare ``cat.set_categories`` between pandas and ``Series.from_categorical``.

    Two scenarios are exercised in order: extending the category list with a
    new entry, then shrinking it so that an existing category is dropped.
    """
    source = pd.Categorical(['a', 'a', 'b', 'c', 'a'], categories=['a', 'b', 'c'])
    pandas_series = pd.Series(source)
    series_under_test = Series.from_categorical(source)

    scenarios = (
        ('a', 'b', 'c', 'd'),  # adding category
        ('a', 'b'),            # removing category
    )
    for wanted in scenarios:
        # Fresh list per call so each side receives its own argument object.
        expect = pandas_series.cat.set_categories(list(wanted))
        got = series_under_test.cat.set_categories(list(wanted))
        assert_eq(expect, got)

コード例 #2

ファイルを表示

def test_categorical_set_categories():
    """Verify that changing categories gives the same result as pandas.

    The same categorical backs both a pandas Series and a Series created via
    ``Series.from_categorical``; ``set_categories`` is then applied to each
    and the outcomes are compared with ``assert_eq``.
    """
    values = ["a", "a", "b", "c", "a"]
    cat = pd.Categorical(values, categories=["a", "b", "c"])
    reference = pd.Series(cat)
    candidate = Series.from_categorical(cat)

    def check(categories):
        # Reference result first, then the candidate, then the comparison.
        expect = reference.cat.set_categories(list(categories))
        got = candidate.cat.set_categories(list(categories))
        assert_eq(expect, got)

    # adding category
    check(["a", "b", "c", "d"])

    # removing category
    check(["a", "b"])

コード例 #3

ファイルを表示

 def _make_dictionary_series(self):
     """Make a dictionary-encoded series from this node.

     Reads the dictionary metadata from ``self.field_schema['dictionary']``,
     looks up the dictionary with the matching id in
     ``self.schema['dictionaries']``, and uses its first column's ``DATA``
     as the categories of the resulting series. ``self.data`` supplies the
     codes.

     Returns:
         The value of ``Series.from_categorical(cat, codes=self.data)``.

     Raises:
         MetadataParsingError: If the dictionary index type is not ``'int'``,
             or if no dictionary with the referenced id exists in the schema.
     """
     assert self.is_dictionary
     # create dictionary-encoded column
     dict_meta = self.field_schema['dictionary']
     dictid = dict_meta['id']   # original note: start from 1
     if dict_meta['indexType']['name'] != 'int':
         msg = 'non integer type index for dictionary'
         raise MetadataParsingError(msg)
     ordered = dict_meta['isOrdered']
     # find dictionary
     for dictionary in self.schema['dictionaries']:
         if dictionary['id'] == dictid:
             break
     else:
         # Without this branch a missing id would silently fall through to
         # the last dictionary in the list (or to an unbound local when the
         # list is empty) and produce a series with the wrong categories.
         msg = 'no dictionary with id {!r} found in schema'.format(dictid)
         raise MetadataParsingError(msg)
     categories = dictionary['data']['columns'][0]['DATA']
     # make dummy categorical: it carries only categories/ordering, the
     # actual codes are passed separately below
     cat = pd.Categorical([], categories=categories, ordered=ordered)
     # make the series
     return Series.from_categorical(cat, codes=self.data)

コード例 #4

ファイルを表示

def test_categorical_unique_count(nelem):
    """Check ``unique_count()`` against the number of pandas unique values.

    ``nelem`` is the number of random alphanumeric characters drawn to build
    the categorical data.
    """
    from string import ascii_letters, digits

    # Seed the generator so the drawn sample is reproducible.
    np.random.seed(12)
    alphabet = list(ascii_letters + digits)
    sample = np.random.choice(alphabet, nelem)
    pd_cat = pd.Categorical(pd.Series(sample, dtype='category'))

    # Column built through Series.from_categorical.
    gdf = DataFrame()
    gdf['a'] = Series.from_categorical(pd_cat)
    observed = gdf['a'].unique_count()

    # Equivalent pandas column used as the reference.
    pdf = pd.DataFrame()
    pdf['a'] = pd_cat
    reference_values = pdf['a'].unique()

    assert observed == len(reference_values)

コード例 #5

ファイルを表示

def test_categorical_unique(num_elements):
    """Check that ``unique()`` yields the same values as pandas after sorting.

    ``num_elements`` is the number of random alphanumeric characters drawn to
    build the categorical data.
    """
    from string import ascii_letters, digits

    # Seed the generator so the drawn sample is reproducible.
    np.random.seed(12)
    symbols = list(ascii_letters + digits)
    drawn = np.random.choice(symbols, num_elements)
    pd_cat = pd.Categorical(pd.Series(drawn, dtype='category'))

    # Column built through Series.from_categorical.
    gdf = DataFrame()
    gdf['a'] = Series.from_categorical(pd_cat)
    gdf_uniques = gdf['a'].unique()
    got_sorted = np.sort(gdf_uniques)

    # Equivalent pandas column used as the reference.
    pdf = pd.DataFrame()
    pdf['a'] = pd_cat
    pdf_uniques = pdf['a'].unique()
    expect_sorted = np.sort(pdf_uniques)

    # Sorting both sides makes the comparison independent of result order.
    np.testing.assert_array_equal(expect_sorted, got_sorted)

コード例 #6

ファイルを表示

def test_categorical_value_counts(num_elements):
    """Check that ``value_counts()`` agrees with pandas for categorical data.

    ``num_elements`` is the number of random alphanumeric characters drawn to
    build the categorical data. Both results are converted to plain dicts
    before being compared.
    """
    from string import ascii_letters, digits

    # Seed the generator so the drawn sample is reproducible.
    np.random.seed(12)
    pool = list(ascii_letters + digits)
    picks = np.random.choice(pool, num_elements)
    pd_cat = pd.Categorical(pd.Series(picks, dtype='category'))

    # Column built through Series.from_categorical.
    gdf = DataFrame()
    gdf['a'] = Series.from_categorical(pd_cat)
    gdf_counts = gdf['a'].value_counts()

    # Equivalent pandas column used as the reference.
    pdf = pd.DataFrame()
    pdf['a'] = pd_cat
    pdf_counts = pdf['a'].value_counts()

    # Compare as dictionaries of value -> count.
    expected = pdf_counts.to_dict()
    actual = gdf_counts.to_pandas().to_dict()
    assert expected == actual