def __init__(self, queryFile, candidatePath, mu, corpusFile, sigma, lamda):
    """Set up empty containers, thresholds and the two similarity helpers.

    Args:
        queryFile: Accepted for interface compatibility; this constructor
            does not read it (``self.query`` starts out as an empty dict).
            NOTE(review): presumably loaded later by another method --
            confirm against the rest of the class.
        candidatePath: Stored unchanged as ``self.candidate``.
        mu: Stored as ``self.mu`` and also forwarded to ``Distance``.
        corpusFile: Forwarded to ``Distance`` together with ``mu``.
        sigma: Similarity threshold.
        lamda: Cluster threshold.
    """
    # Containers start empty; nothing is loaded from disk in this method
    # except whatever Distance(...) does with corpusFile.
    self.query = {}
    self.candidate = candidatePath
    self.tweet = {}

    self.mu = mu
    self.sigma = sigma  # similarity threshold
    self.lamda = lamda  # cluster threshold

    self.jaccInstance = Jaccard()
    self.klInstance = Distance(mu, corpusFile)

    # Parenthesised form prints the same text under Python 2 and Python 3;
    # the bare `print "..."` statement is a SyntaxError on Python 3.
    print("corpus read done!")