Example #1
0
import pandas
import sys
from chchao.like_test import like_test

profile = pandas.read_csv('data/TCSS555/Train/Profile/Profile.csv')
relation = pandas.read_csv('data/TCSS555/Train/Relation/Relation.csv')
a = []
b = []
_a = []
_b = []
n_size = 9500
n_train = 8500
knn = 5
x = like_test()

for i in range(0, n_size):
	l = x.lr_formating(relation, profile['userid'][i])
	a.append(l)
	b.append(x.lr_age_format(profile['age'][i]))
	if 1 in a[i]:
		_a.append(a[i])
		_b.append(b[i])
	sys.stdout.write("training : %4d/%04d\r"%(i,n_size))
	sys.stdout.flush()

print("knn : %d"%knn)
print("n_train : %d"%n_train)
print("len(_a):%d len(_b):%d"%(len(_a), len(_b)))

# from sklearn.decomposition import TruncatedSVD
Example #2
0
try:
	relation = pandas.read_csv(input_dir+'relation/relation.csv')
	print("reading relation.csv successed.")
except:
	print("Error: reading relation.csv failed.")
	exit()

try:
	oxford_csv = pandas.read_csv(input_dir+'oxford.csv')
	print("reading oxford.csv successed.")
except:
	print("Warning: reading oxford.csv failed.")


baseline = baseline()
like_test = like_test()

cf = open('/home/itadmin/MLProject/clf_age_SGDC_liketext.pickle', 'rb')
age_predict = pickle.load(cf)

# cf = open('/home/itadmin/MLProject/clf_like_mnb_gender.pickle', 'rb')
# g_predict = pickle.load(cf)
g_predict = gender()

len_profile = len(profile)



try:
	ope_p = text_ope_knn_test()
except: