def sMotif4567():
    """Return per-motif frequencies of the ids given by ``judgeSemMo_13types``.

    Loads the pickled ``"lmtimeCategory3"`` records via
    ``functions.readPickle`` after changing the process working directory to
    the motif data folder (a side effect callers should be aware of).  For
    every record whose motif id (field 2) is 4, 5, 6 or 7, the first element
    of each entry in field 5 is collected into a sequence, summarised with
    ``orderSum`` and classified with ``judgeSemMo_13types``.

    Returns:
        A ``(4, 13)`` float array.  Row ``k`` holds the counts for motif id
        ``k + 4`` divided by that row's total.  A row with no matching
        records is returned as all zeros instead of NaN.
    """
    fdir = "E:/Senior/Graduation project/YahooFlickr/NewYorktemp/Motifs/Motif_UserName"
    os.chdir(fdir)
    cateNumber = 3
    username = functions.readPickle("lmtimeCategory" + str(cateNumber))

    motif_ids = (4, 5, 6, 7)
    matrix = np.zeros((len(motif_ids), 13))
    for record in username:
        moid = record[2]
        if moid not in motif_ids:
            continue
        seq = [entry[0] for entry in record[5]]
        osum = orderSum(seq)
        # The returned id is used 1-based (presumably 1..13 -- TODO confirm).
        sid = judgeSemMo_13types(osum[1], osum[2], osum[3])
        matrix[moid - 4, sid - 1] += 1

    # Normalise each row to sum to 1.  Rows with a zero total are skipped so
    # that an unobserved motif does not trigger 0/0 and fill the row with NaN.
    row_totals = matrix.sum(axis=1, keepdims=True)
    return np.divide(
        matrix,
        row_totals,
        out=np.zeros_like(matrix),
        where=row_totals != 0,
    )
def userAnalysis(matrix, names, nsimi, sample):
    """Print the name, matrix row and raw records of each sampled user.

    Loads the pickled ``"lmtimeCategory3"`` records via
    ``functions.readPickle`` after changing the process working directory to
    the motif data folder (a side effect callers should be aware of).

    Args:
        matrix: Indexable by the values in ``sample``; ``matrix[ind]`` is
            printed for each sampled index.
        names: Indexable by the values in ``sample``; ``names[ind]`` is
            printed and compared against each record's name.
        nsimi: Unused; kept so existing call sites keep working.
        sample: Iterable of indices into ``matrix`` and ``names``.
    """
    fdir = "E:/Senior/Graduation project/YahooFlickr/NewYorktemp/Motifs/Motif_UserName"
    os.chdir(fdir)
    cateNumber = 3
    username = functions.readPickle("lmtimeCategory" + str(cateNumber))

    for ind in sample:
        print(ind)
        target = names[ind]
        print(target)
        print(matrix[ind])
        for record in username:
            # Field 0 carries the user name followed by a three-character
            # suffix, which is stripped before comparing.
            if record[0][:-3] == target:
                print(record)
        # NOTE(review): the original indentation was lost; the separator is
        # assumed to be printed once per sampled user -- confirm.
        print('-' * 40)
def userMatrixNew():
    """Build one summed feature vector per user name.

    Loads the pickled ``"lmtimeCategory3"`` records via
    ``functions.readPickle`` after changing the process working directory to
    the motif data folder.  Records whose motif id (field 2) equals 1 are
    skipped.  For every other record the outputs of ``topoVec4``,
    ``temVec13`` and ``semaSeqVec13`` are concatenated with ``np.hstack`` and
    accumulated under the record's name (field 0 without its last three
    characters).

    Returns:
        A tuple ``(matarray, nameArray)``: the accumulated vectors stacked
        into an array, and the matching names, both in first-seen order.
    """
    fdir = "E:/Senior/Graduation project/YahooFlickr/NewYorktemp/Motifs/Motif_UserName"
    os.chdir(fdir)
    cateNumber = 3
    username = functions.readPickle("lmtimeCategory" + str(cateNumber))

    per_user = {}
    for record in username:
        moid = record[2]
        hlocations = record[3]
        name = record[0][:-3]
        if moid == 1:
            continue

        stamps = record[4]
        lmtime = record[5]
        seq = [entry[0] for entry in lmtime]
        # Indexed on purpose: hlocations is read position-by-position for as
        # many entries as lmtime has.
        seqtime = [stamps[hlocations[pos]] for pos in range(len(lmtime))]

        vector = np.hstack((topoVec4(moid), temVec13(seqtime), semaSeqVec13(seq)))
        if name not in per_user:
            per_user[name] = vector
        else:
            # In-place add into the array stored for this user.
            per_user[name] += vector

    matarray = np.array(list(per_user.values()))
    nameArray = np.array(list(per_user.keys()))
    return matarray, nameArray
def tMotif4567():
    """Return per-motif frequencies of the ids given by ``judgeTempMo_13types``.

    Loads the pickled ``"lmtimeCategory3"`` records via
    ``functions.readPickle`` after changing the process working directory to
    the motif data folder (a side effect callers should be aware of).  For
    every record whose motif id (field 2) is 4, 5, 6 or 7, the values of
    field 4 at the first three positions listed in field 3 are classified
    with ``judgeTempMo_13types``.

    Returns:
        A ``(4, 13)`` float array.  Row ``k`` holds the counts for motif id
        ``k + 4`` divided by that row's total.  A row with no matching
        records is returned as all zeros instead of NaN.
    """
    fdir = "E:/Senior/Graduation project/YahooFlickr/NewYorktemp/Motifs/Motif_UserName"
    os.chdir(fdir)
    cateNumber = 3
    username = functions.readPickle("lmtimeCategory" + str(cateNumber))

    motif_ids = (4, 5, 6, 7)
    matrix = np.zeros((len(motif_ids), 13))
    for record in username:
        moid = record[2]
        if moid not in motif_ids:
            continue
        hlocations = record[3]
        times = record[4]
        # The returned id is used 1-based (presumably 1..13 -- TODO confirm).
        motemtype = judgeTempMo_13types(
            times[hlocations[0]],
            times[hlocations[1]],
            times[hlocations[2]],
        )
        matrix[moid - 4, motemtype - 1] += 1

    # Normalise each row to sum to 1.  Rows with a zero total are skipped so
    # that an unobserved motif does not trigger 0/0 and fill the row with NaN.
    row_totals = matrix.sum(axis=1, keepdims=True)
    return np.divide(
        matrix,
        row_totals,
        out=np.zeros_like(matrix),
        where=row_totals != 0,
    )
import functions
import url

# Parse every (item[0], item[1]) pair listed in url.urls and hand the parsed
# fields to functions.add2Pickle.
for item in url.urls:
    # The parsed URL gets its own name: binding it to ``url`` would shadow the
    # imported ``url`` module for the rest of the file.
    title, summary, entry_url, category = functions.parseEntry(item[0], item[1])
    functions.add2Pickle(title, summary, entry_url, category)

# NOTE(review): the original indentation was lost; the dump is assumed to run
# once, after all entries have been added -- confirm.
print(functions.readPickle())
def obtain_data():
    """Return the result of ``functions.readPickle()`` converted with ``str``."""
    stored = functions.readPickle()
    return str(stored)