def test_client(tmpdir, data):
    """Check that ``ParquetClient`` discovers parquet files under ``tmpdir``.

    Every item of ``data`` is converted with ``pa.Table.from_pandas`` and
    written to ``<tmpdir>/pq/<key>.parquet``.  A client constructed on
    ``tmpdir`` must then list ``pq`` as its only database, and that database
    must list the tables ``close`` and ``open``.
    """
    # construct with a path to a file
    pq_dir = tmpdir / 'pq'
    pq_dir.mkdir()

    for name, frame in data.items():
        target = pq_dir / "{}.parquet".format(name)
        pq.write_table(pa.Table.from_pandas(frame), str(target))

    client = ParquetClient(tmpdir)
    databases = client.list_databases()
    assert databases == ['pq']

    tables = client.database().pq.list_tables()
    assert tables == ['close', 'open']
def parquet(tmpdir, data):
    """Write ``data`` as parquet files and return a database rooted there.

    ``pyarrow`` is obtained through ``pytest.importorskip``, so the caller is
    skipped when it is not installed.  Every item of ``data`` is written to
    ``<tmpdir>/pq/<key>.parquet``; the return value is
    ``ParquetClient(tmpdir).database()``.
    """
    # Imports stay local so that a missing pyarrow skips instead of erroring.
    pa = pytest.importorskip('pyarrow')
    import pyarrow.parquet as pq  # noqa: E402
    from ibis.file.parquet import ParquetClient

    # create single files
    pq_dir = tmpdir.mkdir('pq')
    for name, frame in data.items():
        target = pq_dir / "{}.parquet".format(name)
        pq.write_table(pa.Table.from_pandas(frame), str(target))

    client = ParquetClient(tmpdir)
    return client.database()
def test_write(transformed, tmpdir):
    """Round-trip an expression through ``insert`` on a parquet client.

    A three-column projection of ``transformed`` is inserted as
    ``foo.parquet`` into a freshly created directory.  The file is then read
    back through ``ParquetClient`` and compared with the frame obtained from
    executing ``transformed`` itself.
    """
    expected = transformed.execute()

    out_dir = tmpdir / 'new_dir'
    out_dir.mkdir()
    target = out_dir / 'foo.parquet'
    assert not target.exists()

    projection = transformed[['time', 'ticker', 'avg']]
    writer = ibis.parquet.connect(out_dir)
    writer.insert('foo.parquet', projection)
    # The projection is executed after the insert; its result is not used.
    projection.execute()
    assert target.exists()

    # readback
    database = ParquetClient(str(out_dir)).database()
    nested = database.list_databases()
    assert nested == []

    roundtrip = database.foo.execute()
    tm.assert_frame_equal(roundtrip, expected)

    # The written file must still be present after reading it back.
    assert (out_dir / 'foo.parquet').exists()
def test_write(transformed, tmpdir):
    """Round-trip an expression through ``insert`` using ``execute``.

    A three-column projection of ``transformed`` is inserted as
    ``foo.parquet`` into a freshly created directory.  The file is then read
    back through ``ParquetClient`` and compared with the frame returned by
    ``execute(transformed)``.
    """
    expected = execute(transformed)

    out_dir = tmpdir / 'new_dir'
    out_dir.mkdir()
    target = out_dir / 'foo.parquet'
    assert not target.exists()

    projection = transformed[['time', 'ticker', 'avg']]
    writer = ibis.parquet.connect(out_dir)
    writer.insert('foo.parquet', projection)
    # The projection is executed after the insert; its result is not used.
    execute(projection)
    assert target.exists()

    # readback
    database = ParquetClient(str(out_dir)).database()
    nested = database.list_databases()
    assert nested == []

    roundtrip = database.foo.execute()
    tm.assert_frame_equal(roundtrip, expected)

    # The written file must still be present after reading it back.
    assert (out_dir / 'foo.parquet').exists()