def process(self, context, word_string):
    """Put spaces around every character accepted by ChineseLanguage.

    Each element yielded by iterating ``word_string`` is checked with
    ``ChineseLanguage.is_language``; accepted elements are wrapped in a
    space on each side, everything else is kept untouched.

    :param context: passed through to ``YLogger.debug`` only.
    :param word_string: the text to split.
    :return: the padded text, stripped at both ends, with every run of
        space characters collapsed into a single space.
    """
    YLogger.debug(context, "Splitting Chinese into parsable words...")
    spaced = "".join(
        (" %s " % symbol) if ChineseLanguage.is_language(symbol) else symbol
        for symbol in word_string
    )
    # Adjacent padded characters leave doubled spaces behind; squeeze them.
    return re.sub(' +', ' ', spaced.strip())
def process(self, context, word_string):
    """Separate characters recognised by ChineseLanguage with spaces.

    :param context: forwarded to ``YLogger.debug``; not otherwise used.
    :param word_string: the text whose characters are inspected one by one.
    :return: ``word_string`` with each recognised character surrounded by
        single spaces, no leading/trailing whitespace, and no repeated
        space characters.
    """
    YLogger.debug(context, "Splitting Chinese into parsable words...")
    fragments = [
        (" %s " % glyph) if ChineseLanguage.is_language(glyph) else glyph
        for glyph in word_string
    ]
    trimmed = "".join(fragments).strip()
    # Only runs of the plain space character are collapsed here.
    return re.sub(' +', ' ', trimmed)
def process(self, bot, clientid, word_string):
    """Space out characters that ChineseLanguage.is_language accepts.

    :param bot: not used by this method.
    :param clientid: not used by this method.
    :param word_string: the text to split, examined element by element.
    :return: the text with each accepted character wrapped in spaces,
        stripped at both ends and with runs of spaces reduced to one.
    """
    if logging.getLogger().isEnabledFor(logging.DEBUG):
        logging.debug("Splitting Chinese into parsable words...")

    def pad(symbol):
        # Only accepted characters get a space on each side.
        if ChineseLanguage.is_language(symbol):
            return " %s " % symbol
        return symbol

    joined = "".join(map(pad, word_string))
    return re.sub(' +', ' ', joined.strip())
def __init__(self, word, userid='*'):
    """Initialise the node and store a space-separated form of ``word``.

    The base ``PatternNode`` initialiser is called with ``userid``. Every
    character of ``word`` accepted by ``ChineseLanguage.is_language`` is
    then wrapped in spaces; the result is stripped, runs of spaces are
    collapsed to one, and the final text is kept in ``self._word``.

    :param word: the word text for this node.
    :param userid: passed to ``PatternNode.__init__``; defaults to ``'*'``.
    """
    PatternNode.__init__(self, userid)
    padded = "".join(
        (" %s " % symbol) if ChineseLanguage.is_language(symbol) else symbol
        for symbol in word
    )
    # Neighbouring padded characters produce doubled spaces; squeeze them.
    self._word = re.sub(' +', ' ', padded.strip())
def process(self, context, word_string):
    """Join space-separated tokens, gluing together those ChineseLanguage accepts.

    ``word_string`` is split on single spaces. A token accepted by
    ``ChineseLanguage.is_language`` is emitted with no surrounding spaces;
    any other token is emitted with a space on each side.

    :param context: forwarded to ``YLogger.debug`` only.
    :param word_string: the space-separated text to merge.
    :return: the merged text with every whitespace run collapsed to one
        space and leading/trailing whitespace removed.
    """
    YLogger.debug(context, "Merging Chinese into understandable words...")
    pieces = (
        token if ChineseLanguage.is_language(token) else " " + token + " "
        for token in word_string.split(" ")
    )
    squeezed = re.sub(r'\s+', ' ', "".join(pieces))
    return squeezed.strip()
def process(self, context, word_string):
    """Merge space-separated tokens, removing spaces around accepted tokens.

    ``word_string`` is split on single spaces. Tokens accepted by
    ``ChineseLanguage.is_language`` are concatenated directly; all other
    tokens are padded with one space on each side so they stay separated.

    :param context: forwarded to ``YLogger.debug`` only.
    :param word_string: the space-separated text to merge.
    :return: the merged text with whitespace runs collapsed to a single
        space and leading/trailing whitespace stripped.
    """
    YLogger.debug(context, "Merging Chinese into understandable words...")
    # The accumulator used to be named ``str``, hiding the builtin type for
    # the rest of the method; build the pieces and join them once instead.
    pieces = [
        word if ChineseLanguage.is_language(word) else " " + word + " "
        for word in word_string.split(" ")
    ]
    merged = re.sub(r'\s+', ' ', "".join(pieces))
    return merged.strip()
def process(self, bot, clientid, word_string):
    """Merge space-separated tokens, removing spaces around accepted tokens.

    ``word_string`` is split on single spaces. Tokens accepted by
    ``ChineseLanguage.is_language`` are concatenated directly; all other
    tokens are padded with one space on each side so they stay separated.

    :param bot: not used by this method.
    :param clientid: not used by this method.
    :param word_string: the space-separated text to merge.
    :return: the merged text with whitespace runs collapsed to a single
        space and leading/trailing whitespace stripped.
    """
    if logging.getLogger().isEnabledFor(logging.DEBUG):
        logging.debug("Merging Chinese into understandable words...")
    # The accumulator used to be named ``str``, hiding the builtin type for
    # the rest of the method; build the pieces and join them once instead.
    pieces = [
        word if ChineseLanguage.is_language(word) else " " + word + " "
        for word in word_string.split(" ")
    ]
    merged = re.sub(r'\s+', ' ', "".join(pieces))
    return merged.strip()
def test_is_language(self):
    """Check ChineseLanguage.is_language against a small table of samples.

    The empty string, a Latin letter and the integer 32 must be rejected;
    a single Chinese character must be accepted.
    """
    # (assertion, sample) pairs, evaluated in order.
    expectations = (
        (self.assertFalse, ""),
        (self.assertFalse, "H"),
        (self.assertTrue, "你"),
        (self.assertFalse, 32),
    )
    for check, sample in expectations:
        check(ChineseLanguage.is_language(sample))
def test_is_language(self):
    """Check that is_language rejects "" and "H" and accepts a Chinese character."""
    for rejected in ("", "H"):
        self.assertFalse(ChineseLanguage.is_language(rejected))
    self.assertTrue(ChineseLanguage.is_language("你"))