hidden1 = 300 #hidden layer 1
hidden2 = 100 #hidden layer 2
acti_type='tanh'                                                    #activation type
epoch = 100                                                               #epochs number
advertiser = '2997'
if len(sys.argv) > 1:
    advertiser = sys.argv[1]
train_file='../../make-ipinyou-data/' + advertiser + '/train.fm.txt'             #training file
test_file='../../make-ipinyou-data/' + advertiser + '/test.fm.txt'                   #test file
fm_model_file='../../make-ipinyou-data/' + advertiser + '/fm.model.txt'                   #fm model file
#feats = ut.feats_len(train_file)                                           #feature size

if len(sys.argv) > 2:
    train_file=train_file+'.10.txt'
    print train_file
train_size=ut.file_len(train_file)                    #training size
test_size=ut.file_len(test_file)                      #test size
n_batch=train_size/batch_size                                        #number of batches
x_dim=133465

#best parameters
if advertiser=='2997': #best 0.615759999486
    hidden0=200
    hidden1=300
    hidden2=100
    lr=0.001
    lambda1=0.0000001
    dropout=0.98
    lambda1=0
elif advertiser=='3386':
    train_size=ut.file_len(train_file)                    #training size
Esempio n. 2
0
acti_type='tanh'                                                    #activation type
epoch = 100                                                               #epochs number
advertiser = '2997'
if len(sys.argv) > 1:
    advertiser = sys.argv[1]
train_file='../data/train.fm.txt'             #training file
test_file='../data/test.fm.txt'                   #test file
fm_model_file='../data/fm.model.txt'                   #fm model file
#feats = ut.feats_len(train_file)                                           #feature size
if len(sys.argv) > 2 and advertiser=='all':
    train_file=train_file+'.5.txt'
elif len(sys.argv) > 2:
    train_file=train_file+'.10.txt'
print(train_file)

train_size=ut.file_len(train_file)                    #training size
test_size=ut.file_len(test_file)                      #test size
n_batch=train_size/batch_size                                        #number of batches
x_drop=1

if advertiser=='2997':#
    lr=0.001
    x_drop=dropout=0.5
    hidden1=300
    hidden2=100
    lambda1=0.0
    lambda_fm=0.1

    
    
Esempio n. 3
0
fi = open(train_file, 'r')
for line in fi:
    if line.strip() != '':
		s = line.strip().replace(':', ' ').split(' ')
		fi=[]
		for f in range(1, len(s), 2):
			if int(s[f+1])==1:
				fi.append(int(s[f]))
		farr.append(fi)
		yarr.append(int(s[0]))
		train_size+=1
farr = numpy.array(farr, dtype = numpy.int32)
yarr = numpy.array(yarr, dtype = numpy.int32)


test_size=ut.file_len(test_file)                      #test size
n_batch=train_size/batch_size                                        #number of batches
x_dim=133465

if advertiser == '2997':
    lr=0.05
if advertiser== '3386':                                       #number of batches
    x_dim=0
    
if sys.argv[2]=='mod' and advertiser=='2997':
    lr=0.1
    lambda1=0.00
    


    
rng.seed(1234)
batch_size=10                                                          #batch size
lr=0.01 # 0.002                                                                #learning rate
lambda1=0.001  # 100 # 3 # .1                                                        #regularisation rate
hidden1 = 300 #hidden layer 1
hidden2 = 100 #hidden layer 2
acti_type='tanh'                                                    #activation type
epoch = 100                                                               #epochs number
advertiser = '2997'
if len(sys.argv) > 1:
    advertiser = sys.argv[1]
train_file='../../make-ipinyou-data/' + advertiser + '/train.fm.txt'             #training file
test_file='../../make-ipinyou-data/' + advertiser + '/test.fm.txt'                   #test file
fm_model_file='../../make-ipinyou-data/' + advertiser + '/fm.model.txt'                   #fm model file
#feats = ut.feats_len(train_file)                                           #feature size
train_size=ut.file_len(train_file)
test_size=ut.file_len(test_file)
# train_size=312437        #ut.file_len(train_file)                    #training size
# test_size=156063         #ut.file_len(test_file)                      #test size
n_batch=train_size/batch_size                                        #number of batches



name_field = {'weekday':0, 'hour':1, 'useragent':2, 'IP':3, 'region':4, 'city':5, 'adexchange':6, 'domain':7, 'slotid':8,
       'slotwidth':9, 'slotheight':10, 'slotvisibility':11, 'slotformat':12, 'creative':13, 'advertiser':14, 'slotprice':15}

feat_field = {}
feat_weights = {}
w_0 = 0
feat_num = 0
k = 0