Example #1
0
def load_datasets(dataset_name, save_path="data/", url=None):
    if dataset_name == "synthetic":
        gene_dataset = SyntheticDataset()
    elif dataset_name == "cortex":
        gene_dataset = CortexDataset()
    elif dataset_name == "brain_large":
        gene_dataset = BrainLargeDataset(save_path=save_path)
    elif dataset_name == "retina":
        gene_dataset = RetinaDataset(save_path=save_path)
    elif dataset_name == "cbmc":
        gene_dataset = CbmcDataset(save_path=save_path)
    elif dataset_name == "brain_small":
        gene_dataset = BrainSmallDataset(save_path=save_path)
    elif dataset_name == "hemato":
        gene_dataset = HematoDataset(save_path="data/HEMATO/")
    elif dataset_name == "pbmc":
        gene_dataset = PbmcDataset(save_path=save_path)
    elif dataset_name[-5:] == ".loom":
        gene_dataset = LoomDataset(filename=dataset_name, save_path=save_path, url=url)
    elif dataset_name[-5:] == ".h5ad":
        gene_dataset = AnnDataset(dataset_name, save_path=save_path, url=url)
    elif ".csv" in dataset_name:
        gene_dataset = CsvDataset(dataset_name, save_path=save_path)
    else:
        raise Exception("No such dataset available")
    return gene_dataset
Example #2
0
def load_datasets(dataset_name, save_path='data/', url=None):
    if dataset_name == 'synthetic':
        gene_dataset = SyntheticDataset()
    elif dataset_name == 'cortex':
        gene_dataset = CortexDataset()
    elif dataset_name == 'brain_large':
        gene_dataset = BrainLargeDataset(save_path=save_path)
    elif dataset_name == 'retina':
        gene_dataset = RetinaDataset(save_path=save_path)
    elif dataset_name == 'cbmc':
        gene_dataset = CbmcDataset(save_path=save_path)
    elif dataset_name == 'brain_small':
        gene_dataset = BrainSmallDataset(save_path=save_path)
    elif dataset_name == 'hemato':
        gene_dataset = HematoDataset(save_path='data/HEMATO/')
    elif dataset_name == 'pbmc':
        gene_dataset = PbmcDataset(save_path=save_path)
    elif dataset_name[-5:] == ".loom":
        gene_dataset = LoomDataset(filename=dataset_name,
                                   save_path=save_path,
                                   url=url)
    elif dataset_name[-5:] == ".h5ad":
        gene_dataset = AnnDataset(dataset_name, save_path=save_path, url=url)
    elif ".csv" in dataset_name:
        gene_dataset = CsvDataset(dataset_name, save_path=save_path)
    else:
        raise "No such dataset available"
    return gene_dataset
Example #3
0
def test_brain_small():
    brain_small_dataset = BrainSmallDataset(save_path='tests/data/')
    base_benchmark(brain_small_dataset)
Example #4
0
def test_brain_small(save_path):
    brain_small_dataset = BrainSmallDataset(save_path=save_path)
    base_benchmark(brain_small_dataset)
Example #5
0
        (70000, -1)).numpy())

mnist_labels = (torch.cat(
    [mnist_train.dataset.targets, mnist_test.dataset.targets], axis=0).reshape(
        (70000, -1)).numpy())

np.savez(f'{data_dir}/MNIST.npz', features=mnist_features, labels=mnist_labels)
del mnist_train, mnist_test, mnist_features, mnist_labels

# %% how to load data from npz
# data = np.load(f'{data_dir}/MNIST.npz')

# %% BrainSmall
os.chdir(data_dir)
brain_small_dataset = BrainSmallDataset(
    save_path=f'{data_dir}/BrainSmall/',
    save_path_10X=f'{data_dir}/BrainSmall/')

brain_small_features = brain_small_dataset.X.toarray()
brain_small_labels = brain_small_dataset.labels

np.savez(f'{data_dir}/BrainSmall.npz',
         features=brain_small_features,
         labels=brain_small_labels)
del brain_small_dataset, brain_small_features, brain_small_labels

# %%
dataset_objects = [
    BrainLargeDataset, CortexDataset, PbmcDataset, RetinaDataset,
    HematoDataset, CbmcDataset, BrainSmallDataset, SmfishDataset
]