Esempio n. 1
0
    def testToCPU(self):
        """Check that a GPU -> CPU round trip keeps DataFrame metadata.

        Index/columns values, dtypes and the ``gpu`` flag of the op are
        compared on the untiled objects first, then on the first chunk after
        tiling. Finally, ``to_cpu`` applied to the tiled CPU result is
        expected to return the very same object.
        """
        values = np.random.rand(10, 10)
        row_labels = np.random.randint(-100, 100, size=(10, ))
        col_labels = [np.random.bytes(10) for _ in range(10)]
        raw = pd.DataFrame(values, index=row_labels, columns=col_labels)

        source = from_pandas_df(raw)
        restored = to_cpu(to_gpu(source))

        # Tileable-level metadata must survive the round trip.
        for attr in ('index_value', 'columns_value'):
            self.assertEqual(getattr(source, attr), getattr(restored, attr))
        self.assertFalse(restored.op.gpu)
        pd.testing.assert_series_equal(source.dtypes, restored.dtypes)

        restored = restored.tiles()
        source = get_tiled(source)

        self.assertEqual(source.nsplits, restored.nsplits)

        # Chunk-level metadata, checked on the first chunk only.
        src_chunk = source.chunks[0]
        dst_chunk = restored.chunks[0]
        self.assertEqual(src_chunk.index_value, dst_chunk.index_value)
        self.assertEqual(src_chunk.columns_value, dst_chunk.columns_value)
        self.assertFalse(dst_chunk.op.gpu)
        pd.testing.assert_series_equal(src_chunk.dtypes, dst_chunk.dtypes)

        # Asking for a CPU version of the CPU result must hand back the same
        # object rather than a new one.
        same = to_cpu(restored)
        self.assertIs(restored, same)
Esempio n. 2
0
    def testToCPUExecution(self):
        """Execute a GPU -> CPU round trip for a DataFrame and a Series.

        Each tileable is built from pandas data, passed through ``to_gpu``
        and ``to_cpu``, executed with ``concat=True``, and the first returned
        item is compared against the original pandas object.
        """
        values = np.random.rand(20, 30)
        descending_index = np.arange(20, 0, -1)
        expected_frame = pd.DataFrame(values, index=descending_index)

        # DataFrame case.
        frame = from_pandas_df(expected_frame, chunk_size=(13, 21))
        frame_on_cpu = to_cpu(to_gpu(frame))

        outputs = self.executor.execute_dataframe(frame_on_cpu, concat=True)
        actual_frame = outputs[0]
        self.assertIsInstance(actual_frame, pd.DataFrame)
        pd.testing.assert_frame_equal(actual_frame, expected_frame)

        # Series case, using the first column of the frame above.
        expected_series = expected_frame.iloc[:, 0]
        column = from_pandas_series(expected_series, chunk_size=(13, 21))
        column_on_cpu = to_cpu(to_gpu(column))

        outputs = self.executor.execute_dataframe(column_on_cpu, concat=True)
        actual_series = outputs[0]
        self.assertIsInstance(actual_series, pd.Series)
        pd.testing.assert_series_equal(actual_series, expected_series)
Esempio n. 3
0
def test_to_cpu():
    """Check that a GPU -> CPU round trip keeps DataFrame metadata.

    The comparison covers index/columns values, dtypes and the op's ``gpu``
    flag, on the untiled objects and then on the first chunk after tiling.
    The last assertion expects ``to_cpu`` on the tiled CPU result to return
    that same object.
    """
    values = np.random.rand(10, 10)
    row_labels = np.random.randint(-100, 100, size=(10, ))
    col_labels = [np.random.bytes(10) for _ in range(10)]
    raw = pd.DataFrame(values, index=row_labels, columns=col_labels)

    source = from_pandas_df(raw)
    on_gpu = to_gpu(source)
    restored = to_cpu(on_gpu)

    # Tileable-level checks.
    assert source.index_value == restored.index_value
    assert source.columns_value == restored.columns_value
    assert restored.op.gpu is False
    pd.testing.assert_series_equal(source.dtypes, restored.dtypes)

    tiled_pair = tile(source, restored)
    source, restored = tiled_pair

    assert source.nsplits == restored.nsplits

    # Chunk-level checks on the first chunk of each side.
    src_chunk = source.chunks[0]
    dst_chunk = restored.chunks[0]
    assert src_chunk.index_value == dst_chunk.index_value
    assert src_chunk.columns_value == dst_chunk.columns_value
    assert dst_chunk.op.gpu is False
    pd.testing.assert_series_equal(src_chunk.dtypes, dst_chunk.dtypes)

    # Converting an object that is already on CPU should be a no-op that
    # returns the identical object.
    same = to_cpu(restored)
    assert restored is same