Ejemplo n.º 1
0
def dataset_num_files_1(tmpdir_factory):
    """Create a test dataset from ``range(99)`` using ``num_files=1``.

    Args:
        tmpdir_factory: Object whose ``mktemp(name)`` result exposes a
            ``strpath`` attribute (presumably pytest's ``tmpdir_factory``
            fixture -- the decorator is not visible here, confirm).

    Returns:
        A ``SyntheticDataset`` carrying the ``file://`` URL, the local
        directory path, and the value returned by ``create_test_dataset``.
    """
    root_dir = tmpdir_factory.mktemp("data").strpath
    dataset_url = 'file://' + root_dir
    created = create_test_dataset(dataset_url, range(99), num_files=1)
    return SyntheticDataset(url=dataset_url, path=root_dir, data=created)
Ejemplo n.º 2
0
def dataset_0_3_8_10_11_20_23(tmpdir_factory):
    """Create a test dataset for the ids 0, 3, 8, 10, 11, 20 and 23.

    The ids are handed to ``create_test_dataset`` together with
    ``num_files=1``.

    Args:
        tmpdir_factory: Object whose ``mktemp(name)`` result exposes a
            ``strpath`` attribute (presumably pytest's ``tmpdir_factory``
            fixture -- the decorator is not visible here, confirm).

    Returns:
        A ``SyntheticDataset`` carrying the ``file://`` URL, the local
        directory path, and the value returned by ``create_test_dataset``.
    """
    root_dir = tmpdir_factory.mktemp("data").strpath
    dataset_url = 'file://' + root_dir
    created = create_test_dataset(
        dataset_url,
        [0, 3, 8, 10, 11, 20, 23],
        num_files=1,
    )
    return SyntheticDataset(url=dataset_url, path=root_dir, data=created)
Ejemplo n.º 3
0
def hello_world_dataset(tmpdir_factory):
    """Generate the hello-world dataset in a fresh temporary directory.

    Args:
        tmpdir_factory: Object whose ``mktemp(name)`` result exposes a
            ``strpath`` attribute (presumably pytest's ``tmpdir_factory``
            fixture -- the decorator is not visible here, confirm).

    Returns:
        A ``SyntheticDataset`` carrying the ``file://`` URL and the local
        directory path, with ``data`` set to ``None``.

    Raises:
        AssertionError: If no ``_SUCCESS`` entry exists in the directory
            after generation.
    """
    root_dir = tmpdir_factory.mktemp("data").strpath
    dataset_url = 'file://' + root_dir

    # Presumably writes the dataset under ``root_dir``; the check below
    # relies on a '_SUCCESS' entry being present afterwards.
    generate_hello_world_dataset(dataset_url)

    result = SyntheticDataset(url=dataset_url, path=root_dir, data=None)

    # Verify that generation left its '_SUCCESS' marker behind.
    success_marker = os.path.join(root_dir, '_SUCCESS')
    assert os.path.exists(success_marker)

    return result
Ejemplo n.º 4
0
def pycarbon_dataset(tmpdir_factory):
    """Generate the pycarbon dataset in a fresh temporary directory.

    The dataset URL is built by prepending ``LOCAL_FILE_PREFIX`` to the
    temporary directory path.

    Args:
        tmpdir_factory: Object whose ``mktemp(name)`` result exposes a
            ``strpath`` attribute (presumably pytest's ``tmpdir_factory``
            fixture -- the decorator is not visible here, confirm).

    Returns:
        A ``SyntheticDataset`` carrying the prefixed URL and the local
        directory path, with ``data`` set to ``None``.

    Raises:
        AssertionError: If no ``_SUCCESS`` entry exists in the directory
            after generation.
    """
    root_dir = tmpdir_factory.mktemp("data").strpath
    dataset_url = LOCAL_FILE_PREFIX + root_dir

    # Presumably writes the dataset under ``root_dir``; the check below
    # relies on a '_SUCCESS' entry being present afterwards.
    generate_pycarbon_dataset(dataset_url)

    result = SyntheticDataset(url=dataset_url, path=root_dir, data=None)

    # Verify that generation left its '_SUCCESS' marker behind.
    success_marker = os.path.join(root_dir, '_SUCCESS')
    assert os.path.exists(success_marker)

    return result
Ejemplo n.º 5
0
 def _dataset_generator():
     """Create a test dataset for every fifth id in ``range(0, 99, 5)``.

     Uses ``tmpdir_factory`` from the enclosing scope to obtain a fresh
     directory, and calls ``create_test_dataset`` without ``num_files``.

     Returns:
         A ``SyntheticDataset`` carrying the ``file://`` URL, the local
         directory path, and the value returned by ``create_test_dataset``.
     """
     root_dir = tmpdir_factory.mktemp("data").strpath
     dataset_url = 'file://' + root_dir
     created = create_test_dataset(dataset_url, range(0, 99, 5))
     return SyntheticDataset(url=dataset_url, path=root_dir, data=created)
Ejemplo n.º 6
0
 def _dataset_generator():
     """Create a test dataset for the ids 0, 3, 8, 10, 11, 20 and 23.

     Uses ``tmpdir_factory`` from the enclosing scope to obtain a fresh
     directory, and passes ``num_files=1`` to ``create_test_dataset``.

     Returns:
         A ``SyntheticDataset`` carrying the ``file://`` URL, the local
         directory path, and the value returned by ``create_test_dataset``.
     """
     root_dir = tmpdir_factory.mktemp("data").strpath
     dataset_url = 'file://' + root_dir
     created = create_test_dataset(
         dataset_url,
         [0, 3, 8, 10, 11, 20, 23],
         num_files=1,
     )
     return SyntheticDataset(url=dataset_url, path=root_dir, data=created)
Ejemplo n.º 7
0
 def _dataset_generator():
     """Create a test dataset from ``range(99)`` using ``num_files=1``.

     Uses ``tmpdir_factory`` from the enclosing scope to obtain a fresh
     directory.

     Returns:
         A ``SyntheticDataset`` carrying the ``file://`` URL, the local
         directory path, and the value returned by ``create_test_dataset``.
     """
     root_dir = tmpdir_factory.mktemp("data").strpath
     dataset_url = 'file://' + root_dir
     created = create_test_dataset(dataset_url, range(99), num_files=1)
     return SyntheticDataset(url=dataset_url, path=root_dir, data=created)