def find_tokens(self, tokens, **kwargs):
    """Tokenize via _Parser.find_tokens and re-join "'s" before time-of-day words.

    The caller's keyword arguments are forwarded to _Parser.find_tokens;
    "abbreviations" and "replace" are only filled in when the caller did not
    supply them. Returns a list with one rewritten string per item produced
    by the base tokenizer.
    """
    # 's in Dutch preceded by a vowel indicates plural ("auto's"): don't replace.
    kwargs.setdefault("abbreviations", ABBREVIATIONS)
    kwargs.setdefault("replace", {"'n": " 'n"})
    sentences = _Parser.find_tokens(self, tokens, **kwargs)
    # Undo the split "' s" when it precedes ochtends/morgens/middags/avonds,
    # so the output reads "'s ochtends" and so on.
    time_of_day = r"' s (ochtends|morgens|middags|avonds)"
    return [re.sub(time_of_day, "'s \\1", sentence) for sentence in sentences]
def find_tokens(self, tokens, **kwargs):
    """Run the base tokenizer, then repair "' s" in front of time-of-day words.

    Keyword arguments are passed through to _Parser.find_tokens, with
    "abbreviations" and "replace" defaulted when absent. The result is a new
    list holding each tokenized string after the regex substitution.
    """
    # 's in Dutch preceded by a vowel indicates plural ("auto's"): don't replace.
    kwargs.setdefault("abbreviations", ABBREVIATIONS)
    kwargs.setdefault("replace", {"'n": " 'n"})
    tokenized = _Parser.find_tokens(self, tokens, **kwargs)
    # Matches a detached "' s" followed by ochtends/morgens/middags/avonds.
    split_genitive = re.compile(r"' s (ochtends|morgens|middags|avonds)")
    repaired = []
    for sentence in tokenized:
        repaired.append(split_genitive.sub("'s \\1", sentence))
    return repaired
def find_tokens(self, tokens, **kwargs):
    """Tokenize via _Parser.find_tokens and turn "&rsquo ;" back into "’".

    "abbreviations" and "replace" default to ABBREVIATIONS and replacements
    unless the caller passes its own. Returns a list of the tokenizer's
    items; only unicode items are rewritten, all others are kept as they are.
    """
    kwargs.setdefault("abbreviations", ABBREVIATIONS)
    kwargs.setdefault("replace", replacements)
    sentences = _Parser.find_tokens(self, tokens, **kwargs)
    restored = []
    for sentence in sentences:
        # NOTE(review): "&rsquo ;" is presumably a placeholder introduced by
        # `replacements` and split apart by tokenization - confirm.
        if isinstance(sentence, unicode):
            sentence = sentence.replace("&rsquo ;", u"’")
        restored.append(sentence)
    return restored
def find_tokens(self, tokens, **kwargs):
    """Tokenize via _Parser.find_tokens and strip the placeholder markers.

    "abbreviations" and "replace" default to ABBREVIATIONS and replacements
    unless supplied by the caller. In every returned string,
    " &contraction ;" becomes "'" and "XXX -" becomes "-".
    """
    kwargs.setdefault("abbreviations", ABBREVIATIONS)
    kwargs.setdefault("replace", replacements)
    sentences = _Parser.find_tokens(self, tokens, **kwargs)
    cleaned = []
    for sentence in sentences:
        # NOTE(review): both markers are presumably inserted by
        # `replacements` before tokenization - confirm.
        sentence = sentence.replace(" &contraction ;", u"'")
        sentence = sentence.replace("XXX -", "-")
        cleaned.append(sentence)
    return cleaned
def find_tokens(self, tokens, **kwargs):
    """Run the base tokenizer and undo the contraction/hyphen placeholders.

    Caller-supplied keyword arguments win; otherwise "abbreviations" and
    "replace" fall back to ABBREVIATIONS and replacements. Returns a list in
    which " &contraction ;" has been replaced by "'" and "XXX -" by "-".
    """
    kwargs.setdefault("abbreviations", ABBREVIATIONS)
    kwargs.setdefault("replace", replacements)
    tokenized = _Parser.find_tokens(self, tokens, **kwargs)
    # The contraction marker is restored first, then the hyphen marker.
    return [
        sentence.replace(" &contraction ;", u"'").replace("XXX -", "-")
        for sentence in tokenized
    ]
def find_tokens(self, tokens, **kwargs):
    """Tokenize via _Parser.find_tokens and turn "&rsquo ;" back into "’".

    "abbreviations" and "replace" default to ABBREVIATIONS and replacements
    unless the caller provides them. Returns a list of the tokenizer's
    items; str items get the substitution, non-str items pass through.
    """
    kwargs.setdefault("abbreviations", ABBREVIATIONS)
    kwargs.setdefault("replace", replacements)
    tokenized = _Parser.find_tokens(self, tokens, **kwargs)
    restored = []
    for item in tokenized:
        if not isinstance(item, str):
            # Non-string items are kept exactly as the base tokenizer returned them.
            restored.append(item)
            continue
        restored.append(item.replace("&rsquo ;", "’"))
    return restored
def find_tokens(self, tokens, **kwargs):
    """Delegate to _Parser.find_tokens with this module's defaults filled in.

    "abbreviations" falls back to ABBREVIATIONS and "replace" to REPLACEMENTS
    when the caller does not pass them; every other keyword argument is
    forwarded unchanged. Returns whatever _Parser.find_tokens returns.
    """
    defaults = (
        ("abbreviations", ABBREVIATIONS),
        ("replace", REPLACEMENTS),
    )
    for option, value in defaults:
        # setdefault leaves any caller-supplied value untouched.
        kwargs.setdefault(option, value)
    return _Parser.find_tokens(self, tokens, **kwargs)
def find_tokens(self, tokens, **kwargs):
    """Call _Parser.find_tokens, defaulting "abbreviations" and "replace".

    Values the caller passes for either option take precedence over
    ABBREVIATIONS and REPLACEMENTS. The base tokenizer's result is returned
    as-is.
    """
    kwargs.setdefault("abbreviations", ABBREVIATIONS)
    kwargs.setdefault("replace", REPLACEMENTS)
    tokenized = _Parser.find_tokens(self, tokens, **kwargs)
    return tokenized
def find_tokens(self, tokens, **kwargs):
    """Call Parser.find_tokens, defaulting "abbreviations" and "replace".

    "abbreviations" falls back to ABBREVIATIONS and "replace" to CONTRACTIONS
    unless the caller passes its own values. The result of Parser.find_tokens
    is returned unchanged.
    """
    kwargs.setdefault("abbreviations", ABBREVIATIONS)
    kwargs.setdefault("replace", CONTRACTIONS)
    tokenized = Parser.find_tokens(self, tokens, **kwargs)
    return tokenized