def __init__(self, pageph, hitph):
    """Build every helper object and lookup table this instance relies on.

    Args:
        pageph: stored unchanged on ``self.pageph``; not otherwise used
            here (presumably a path to page data -- confirm with callers).
        hitph: stored unchanged on ``self.hitph``; not otherwise used
            here (presumably a path to hit data -- confirm with callers).

    The statement order matters: ``self.hits`` and ``self.pageranker``
    are created empty before ``initPageranker()`` / ``inithits()`` run,
    and ``self.length`` is measured only after those calls.
    """
    # Plain constructor arguments.
    self.pageph = pageph
    self.hitph = hitph

    # Helper built from the 'ICTCLAS50/' directory
    # (presumably the ICTCLAS word segmenter -- confirm).
    self.ict = Ictclas('ICTCLAS50/')

    # Score statistics list.
    self.hitdoclist = Hitlist()

    # Word store, used to obtain a wordID.
    self.wordbar = wordbar('../store/wordbar')

    # hithash: construct the hasher, then initialise it.
    self.hithasher = InitHashWid(
        '../store/sortedwidhits',
        '../store/hithash',
    )
    self.hithasher.initHashWid()

    # Rank totals: the summed score of each single doc.
    self.ranktotal = InitRankTotal(
        '../store/sorteddochits',
        '../store/tranks',
    )
    self.ranktotal.initTotalRank()

    # Empty containers first, then the pagerank and hits initialisers.
    self.hits = []
    self.pageranker = []
    self.initPageranker()
    self.inithits()

    # Expose the hasher's table directly and record the number of hits.
    self.hithash = self.hithasher.hithash
    self.length = len(self.hits)
    # print 'length of hits is', self.length

    # Sorting helper.
    self.sorter = sorter()