Пример #1
0
 def __init__(self, session, config, parent):
     """Initialise the normalizer and build its stemmer.

     Runs the ``SimpleNormalizer`` initialiser, reads the ``language``
     setting (falling back to ``'english'``) and stores a
     ``Stemmer.Stemmer`` built for it on ``self.stemmer``.

     Raises:
         ConfigFileException: if the stemmer cannot be constructed for
             the configured language.
     """
     SimpleNormalizer.__init__(self, session, config, parent)
     lang = self.get_setting(session, 'language', 'english')
     try:
         self.stemmer = Stemmer.Stemmer(lang)
     except Exception:
         # Not a bare ``except:`` -- KeyboardInterrupt and SystemExit must
         # propagate rather than be reported as a configuration problem.
         raise ConfigFileException("Unknown stemmer language: "
                                   "%s" % (lang))
Пример #2
0
def getStemmer(language):
    """Build a Stemmer for a language name or a country code.

    A value found in ``availableStemmers`` is used as given; any other
    value is looked up in ``country_codes``. Returns ``None`` when that
    leaves nothing usable.
    """
    name = language
    if name not in availableStemmers:
        # Not a known stemmer name: treat it as a country code.
        name = country_codes.get(name)
    if not name:
        return None
    return stemmer.Stemmer(name)
Пример #3
0
 def __init__(self, session, config, parent):
     """Initialise the normalizer, its punctuation pattern and stemmer.

     Runs the ``SimpleNormalizer`` initialiser, reads the ``language``
     setting (falling back to ``'english'``), compiles the punctuation
     regular expression onto ``self.punctuationRe`` and stores a
     ``Stemmer.Stemmer`` for the language on ``self.stemmer``.

     Raises:
         ConfigFileException: if the stemmer cannot be constructed for
             the configured language.
     """
     SimpleNormalizer.__init__(self, session, config, parent)
     lang = self.get_setting(session, 'language', 'english')
     # Raw string literals: the resulting pattern text is the same as
     # before, but it no longer relies on Python passing unrecognised
     # escapes (\s, \#, \[ ...) through, which newer interpreters warn on.
     self.punctuationRe = re.compile(
         r"((?<!s)'|[-.,]((?=\s)|$)|(^|(?<=\s))[-.,']|"
         r'[~`!@+=\#\&\^*()\[\]{}\\|":;<>?/])')
     try:
         self.stemmer = Stemmer.Stemmer(lang)
     except Exception:
         # Not a bare ``except:`` -- KeyboardInterrupt and SystemExit must
         # propagate rather than be reported as a configuration problem.
         raise ConfigFileException("Unknown stemmer language: %s" %
                                   (lang))
Пример #4
0
 def __init__(self, session, config, parent):
     """Initialise the normalizer and build its stemmer.

     Runs the ``SimpleNormalizer`` initialiser, checks that the
     ``Stemmer`` module is available, reads the ``language`` setting
     (falling back to ``'english'``) and stores a ``Stemmer.Stemmer``
     for it on ``self.stemmer``.

     Raises:
         MissingDependencyException: if the module-level ``Stemmer`` name
             is ``None``.
         ConfigFileException: if the stemmer cannot be constructed for
             the configured language.
     """
     SimpleNormalizer.__init__(self, session, config, parent)
     if Stemmer is None:
         raise MissingDependencyException(self.objectType,
                                          "zopyx.txng3.ext"
                                          )
     lang = self.get_setting(session, 'language', 'english')
     try:
         self.stemmer = Stemmer.Stemmer(lang)
     except Exception:
         # Not a bare ``except:`` -- KeyboardInterrupt and SystemExit must
         # propagate rather than be reported as a configuration problem.
         raise ConfigFileException("Unknown stemmer language: "
                                   "%s" % (lang))
Пример #5
0
 def stemmer(self):
     """Return a new stemmer for ``self.language``.

     When the module-level ``stemmer`` name is ``None``, the module-level
     ``broken`` object is returned instead.
     """
     if stemmer is not None:
         return stemmer.Stemmer(self.language)
     return broken