def gen_tokenized_content(self):
    """Return the content tokens after filtering.

    The raw tokens come from ``self._pure_tokenize_content()`` and are
    handed to ``TextPreprocesser.filter``; whatever that call returns is
    returned to the caller unchanged.
    """
    raw_tokens = self._pure_tokenize_content()
    return TextPreprocesser.filter(raw_tokens)
def gen_tokenized_title(self):
    """Return the title tokens after filtering.

    The raw tokens come from ``self._pure_tokenize_title()`` and are
    handed to ``TextPreprocesser.filter``; whatever that call returns is
    returned to the caller unchanged.
    """
    raw_tokens = self._pure_tokenize_title()
    return TextPreprocesser.filter(raw_tokens)