def __init__(self, session, config, parent):
    """Initialise the normalizer and create the stemmer for its language.

    The stemming language is read from the 'language' setting, with
    'english' passed to get_setting as the fallback value.

    Raises:
        ConfigFileException: if a stemmer cannot be created for the
            configured language.
    """
    SimpleNormalizer.__init__(self, session, config, parent)
    lang = self.get_setting(session, 'language', 'english')
    try:
        self.stemmer = Stemmer.Stemmer(lang)
    except Exception:
        # Catch Exception rather than everything, so that
        # KeyboardInterrupt / SystemExit are not misreported as a
        # configuration error.
        raise ConfigFileException("Unknown stemmer language: "
                                  "%s" % (lang))
def getStemmer(language):
    """Build a Stemmer for a language name or a country code.

    A value found in availableStemmers is used as-is; anything else is
    looked up in country_codes. Returns None when the lookup yields
    nothing usable.
    """
    if language in availableStemmers:
        resolved = language
    else:
        resolved = country_codes.get(language)

    # Guard clause: no usable language name means no stemmer.
    if not resolved:
        return None
    return stemmer.Stemmer(resolved)
def __init__(self, session, config, parent):
    """Initialise the normalizer, its punctuation regex and its stemmer.

    The stemming language is read from the 'language' setting, with
    'english' passed to get_setting as the fallback value.

    Raises:
        ConfigFileException: if a stemmer cannot be created for the
            configured language.
    """
    SimpleNormalizer.__init__(self, session, config, parent)
    lang = self.get_setting(session, 'language', 'english')
    # Raw string literals keep the pattern text identical to the previous
    # non-raw form while avoiding invalid escape sequences such as "\s"
    # in a normal string literal.
    # Alternatives, in order: an apostrophe not preceded by "s";
    # one of - . , followed by whitespace or end of string;
    # one of - . , ' at the start of the string or after whitespace;
    # any single character from the final symbol class.
    self.punctuationRe = re.compile(
        r"((?<!s)'|[-.,]((?=\s)|$)|(^|(?<=\s))[-.,']|"
        r'[~`!@+=\#\&\^*()\[\]{}\\|":;<>?/])')
    try:
        self.stemmer = Stemmer.Stemmer(lang)
    except Exception:
        # Catch Exception rather than everything, so that
        # KeyboardInterrupt / SystemExit are not misreported as a
        # configuration error.
        raise ConfigFileException("Unknown stemmer language: %s" % (lang))
def __init__(self, session, config, parent):
    """Initialise the normalizer and create the stemmer for its language.

    The stemming language is read from the 'language' setting, with
    'english' passed to get_setting as the fallback value.

    Raises:
        MissingDependencyException: if the module-level Stemmer name is
            None (reported against "zopyx.txng3.ext").
        ConfigFileException: if a stemmer cannot be created for the
            configured language.
    """
    SimpleNormalizer.__init__(self, session, config, parent)
    if Stemmer is None:
        raise MissingDependencyException(self.objectType,
                                         "zopyx.txng3.ext"
                                         )
    lang = self.get_setting(session, 'language', 'english')
    try:
        self.stemmer = Stemmer.Stemmer(lang)
    except Exception:
        # Catch Exception rather than everything, so that
        # KeyboardInterrupt / SystemExit are not misreported as a
        # configuration error.
        raise ConfigFileException("Unknown stemmer language: "
                                  "%s" % (lang))
def stemmer(self):
    """Return a Stemmer for self.language, or `broken` if unavailable.

    `broken` is returned when the module-level `stemmer` name is None.
    """
    return broken if stemmer is None else stemmer.Stemmer(self.language)