def initialize_seq_data_set(self):
     seq_data_and_labels_fname = self.data_config["data_fname"]
     self.data_key = self.data_config["data_key"]
     self.label_key = self.data_config["label_key"]
     self.data_set = init_seq_dataset(
         seq_data_and_labels_fname=seq_data_and_labels_fname
     )
import copy
import time

import numpy as np
import pandas as pd
import torch

from src.helper.data import DataHandler
from src.models.ae import GeneSetAE, VanillaAE
from src.models.custom_networks import GeneSetAE_v2
from src.utils.torch.data import init_seq_dataset
from src.utils.torch.general import get_device

gene_set_dataset = init_seq_dataset(
    "../../data/cd4/cd4_rna_seq_pbmc_10k/gene_kegg_pathway_data_and_labels.csv"
)
gene_set_adjacencies = pd.read_csv(
    "../../data/cd4/cd4_rna_seq_pbmc_10k/gene_kegg_pathway_adj_filtered_nCD4.csv",
    index_col=0,
)
geneset_adj_matrix = torch.from_numpy(np.array(gene_set_adjacencies))

geneset_ae = GeneSetAE(
    input_dim=5785,
    hidden_dims=[512, 512, 512, 512, 512, 512],
    latent_dim=256,
    geneset_adjacencies=geneset_adj_matrix,
)

# geneset_ae = VanillaAE(input_dim=5785, latent_dim=256, hidden_dims=[2048, 1024, 512, 256, 256])
 def initialize_seq_data_set_2(self):
     seq_data_and_labels_fname = self.seq_data_config_2["data_fname"]
     self.seq_data_key_2 = self.seq_data_config_2["data_key"]
     self.seq_label_key_2 = self.seq_data_config_2["label_key"]
     self.seq_data_set_2 = init_seq_dataset(
         seq_data_and_labels_fname=seq_data_and_labels_fname)