Example #1
0
    # del train_df
    gc.collect()

    print('preparing indexes and group')
    train_indexes = list(group.index)[-TRAIN_SAMPLES:]
    valid_indexes = list(group.index)[:-TRAIN_SAMPLES]
    train_group = group[group.index.isin(train_indexes)]
    valid_group = group[group.index.isin(valid_indexes)]
    del group, train_indexes, valid_indexes
    print(len(train_group), len(valid_group))

    # print('preparing questions concepts')
    # q_concepts = load_questions_part_and_tags('./data/questions.csv', params.n_question)

    print('preparing training dataloader')
    train_dataset = DS.AKTDataset(train_group, n_skill, max_seq=params.max_seq)
    train_dataloader = DataLoader(train_dataset,
                                  batch_size=params.batch_size,
                                  shuffle=True,
                                  num_workers=12)
    del train_group

    print('preparing validation dataloader')
    valid_dataset = DS.AKTDataset(valid_group, n_skill, max_seq=params.max_seq)
    valid_dataloader = DataLoader(valid_dataset,
                                  batch_size=params.batch_size,
                                  shuffle=False,
                                  num_workers=12)
    del valid_group
    ###############################