Example #1
0
train_fname = 'bAbI_Data/'+str(train_foldername)+'/'+str(train_filename)

valid_foldername = 'en-valid-10k'
valid_filename = dataset + '_valid'
valid_fname = 'bAbI_Data/'+str(valid_foldername)+'/'+str(valid_filename)

test_foldername = 'en-valid-10k'
test_filename = dataset + '_test'
test_fname = 'bAbI_Data/'+str(test_foldername)+'/'+str(test_filename)

vec_fname = 'bAbI_Data/model.vec'

unk_thres = 0
pre_embed = False

train_data_BOW, valid_data_BOW, test_data_BOW, train_data_pe, valid_data_pe, test_data_pe, vocab = data_transform.get_data(
    train_fname, valid_fname, test_fname, vec_fname=vec_fname, unk_thres = unk_thres, pre_embed=pre_embed)
# print(train_data_pe[0:5])


# In[25]:


databag = []
model = torch.load('saved_models/' + model_name)
def test_visualize(model,test_dt_bow,test_dt_pe):
    this_story = []
    test_shape = test_dt_bow.shape
    n_corr = 0;
    count = 0;
    lim = 2000
    with open('variables/word2idx','rb') as handle:
Example #2
0
#Loading data
print("load...")
if data_type == "txt":
    data = np.loadtxt(fname, dtype='float64')
elif data_type == "dat":
    data = np.fromfile(fname, dtype='float64')
elif data_type == "csv":
    data = np.genfromtxt(fname, delimiter=',', dtype='float64')
'''

    Transform Data in data_transform.py

'''
data_transform.load_data(data)
data_transform.main()
data = data_transform.get_data()
'''

    Parameter Part and Global variable

'''
#declare variables

training = parameter.forward_training
training['Data'] = data[int(np.floor(data.shape[0] * training['Region'])):int(
    np.floor(data.shape[0] * training['Region']) +
    np.floor(data.shape[0] * training['Rate']))]
training['BatchSize'] = int(np.floor(training['Data'].shape[0]))
inputLen = parameter.forward_inputLen

##input
Example #3
0
def get_data(folder_name, qa_name, unk_thres=0, pre_embed=False):
    train_foldername = folder_name
    train_filename = qa_name + '_train'
    train_fname = 'bAbI_Data/' + str(train_foldername) + '/' + str(
        train_filename)

    valid_foldername = folder_name
    valid_filename = qa_name + '_valid'
    valid_fname = 'bAbI_Data/' + str(valid_foldername) + '/' + str(
        valid_filename)

    test_foldername = folder_name
    test_filename = qa_name + '_test'
    test_fname = 'bAbI_Data/' + str(test_foldername) + '/' + str(test_filename)

    vec_fname = 'bAbI_Data/model.vec'

    unk_thres = 0
    pre_embed = pre_embed

    train_data_BOW, valid_data_BOW, test_data_BOW, train_data_pe, valid_data_pe, test_data_pe, vocab = data_transform.get_data(
        train_fname,
        valid_fname,
        test_fname,
        vec_fname=vec_fname,
        unk_thres=unk_thres,
        pre_embed=pre_embed)
    print('Train data size : ', train_data_BOW.shape)
    print('Valid data size : ', valid_data_BOW.shape)
    print('Test data size : ', test_data_BOW.shape)
    print('Vocab size : ', len(vocab))
    return train_data_BOW, valid_data_BOW, test_data_BOW, train_data_pe, valid_data_pe, test_data_pe, vocab