# Disabled example: compare the phonetic codes of two entries.
#query = pattern.getPhoneticCode()
#document = searchEntry5.getPhoneticCode()
#print query
#print document
#print " "
#print pattern.data.comparePhoneticCodeLists(query, document)

# Disabled example: successor variety calls on a small word list.
#varList = ["halten", "hielt", "gehalt", "haltbar"]
#so = Stemmer("")
#print so.successorVariety ("gehalten", varList)

#varObject = Phonetics("")
#sv = varObject.calcSuccVarietyList(varList)
#print sv
#svm = varObject.calcSuccVarietyMerge(sv)
#print svm
#print varObject.calcSuccVarietyCount(svm)

# Disabled example: keyword-based language check.
#text = Advas(["die Kinder freuen sich über die Kastanien"], "")
#keywordList = ["die", "der", "das", "sich"]
#print text.isLanguageByKeywords (keywordList)

# Disabled example: synonym lookups against a local thesaurus file.
#text = Advas(["Schule"], "")
#print text.getSynonyms("/home/frank/projekte/openthesaurus/openthesaurus.txt", "")
#print text.isSynonymOf("Bildungszentrum", "/home/frank/projekte/openthesaurus/openthesaurus.txt", "")

# -- ngram stemmer
# Run the n-gram stemmer on a small list of related German word forms and
# print whatever it returns.
stemmerObject = Stemmer("")
# NOTE(review): 2 and 0.4 are presumably the n-gram size and a similarity
# threshold -- confirm against Stemmer.ngramStemmer.
# Parenthesised single-argument print behaves the same on Python 2 and is
# also valid syntax on Python 3.
print(stemmerObject.ngramStemmer(
    ["halten", "hielt", "halter", "halt", "gehalten"], 2, 0.4))