Esempio n. 1
0
def load_real_fake_data_ML_1m(file_index=24):
    data = []
    real = MD.load_user_item_matrix_1m()
    #real = MD.load_user_item_matrix_100k()
    #real = load_user_item_matrix_1m_masked(file_index=17)
    real = real[0:int(real.shape[0] / 2), :]
    #fake = load_user_item_matrix_100k()
    #fake = simulate_data(real.shape)
    fake = load_user_item_matrix_1m_masked(file_index=file_index)
    #fake = MD.load_user_item_matrix_100k_masked(file_index=1)
    fake = fake[int(fake.shape[0] / 2):, :]
    #fake = real
    #fake = np.random.randint(5, size=real.shape)
    #print(fake)
    data = np.zeros(shape=(real.shape[0] + fake.shape[0], real[0].shape[0]))
    labels = np.zeros(shape=(real.shape[0] + fake.shape[0], ))
    for user_index, user in enumerate(real):
        data[user_index, :] = user
        labels[user_index] = 1
    for user_index, user in enumerate(fake):
        data[len(real) + user_index, :] = user
        labels[len(real) + user_index] = 0

    from Utils import shuffle_two_arrays
    data, labels = shuffle_two_arrays(data, labels)
    return data, labels
Esempio n. 2
0
def load_real_fake_data_ML_100k():
    from MovieLensData import load_user_item_matrix_100k, load_user_item_matrix_100k_masked
    data = []
    real = load_user_item_matrix_100k()
    #fake = load_user_item_matrix_100k()
    #fake = simulate_data(real.shape)
    fake = load_user_item_matrix_100k_masked(file_index=1)
    #fake = np.random.randint(5, size=real.shape)
    print(fake)
    data = np.zeros(shape=(len(real) + len(fake), len(real[0])))
    labels = np.zeros(shape=(len(real) + len(fake), ))
    for user_index, user in enumerate(real):
        data[user_index, :] = user
        labels[user_index] = 1
    for user_index, user in enumerate(fake):
        data[len(real) + user_index, :] = user
        labels[len(real) + user_index] = 0

    from Utils import shuffle_two_arrays
    data, labels = shuffle_two_arrays(data, labels)
    return data, labels
Esempio n. 3
0
def load_real_fake_data_libimseti(file_index=-1):
    import LibimSeTiData as LD
    real, _, valid_movies = LD.load_libimseti_data_subset(small=True)

    real = real[0:int(real.shape[0] / 2), :]
    fake = LD.load_libimseti_data_subset_masked(file_index=file_index,
                                                small=True,
                                                valid_movies=valid_movies)[0]
    fake = fake[int(fake.shape[0] / 2):, :]

    data = np.zeros(shape=(real.shape[0] + fake.shape[0], real[0].shape[0]))
    labels = np.zeros(shape=(real.shape[0] + fake.shape[0], ))
    for user_index, user in enumerate(real):
        data[user_index, :] = user
        labels[user_index] = 1
    for user_index, user in enumerate(fake):
        data[len(real) + user_index, :] = user
        labels[len(real) + user_index] = 0

    from Utils import shuffle_two_arrays
    data, labels = shuffle_two_arrays(data, labels)
    return data, labels