def test_is_uni_word():
    """Check ``rsre_char.is_uni_word`` on word and non-word characters.

    Expected to be classified as word characters: the letter ``a``, the
    underscore, the character with ordinal 0xE4 (spelled both as a plain
    and as a unicode literal) and U+03A0.  Expected to be rejected: ``.``,
    a space and ``EM_SPACE``.
    """
    # Each list is iterated exactly once; looping over shorter prefixes of
    # the same lists as well would only repeat identical assertions.
    word_chars = ["a", "_", "\xe4", u"\u00e4", u"\u03a0"]
    # NOTE(review): EM_SPACE is defined outside this block; passing it to
    # ord() implies it is a one-character string -- confirm.
    non_word_chars = [".", " ", EM_SPACE]

    for char in word_chars:
        assert rsre_char.is_uni_word(ord(char))
    for char in non_word_chars:
        assert not rsre_char.is_uni_word(ord(char))
def test_is_word():
    """Compare ``is_word`` and ``is_uni_word`` on the same code points.

    ``is_word`` must accept ``A`` and ``_`` and reject ``UPPER_PI``,
    ``LOWER_PI`` and ``,``.  ``is_uni_word`` must accept ``A``, ``_``,
    ``UPPER_PI`` and ``LOWER_PI`` and reject only ``,``.
    """
    letter_a = ord('A')
    underscore = ord('_')
    comma = ord(',')

    # is_word: accepts 'A' and '_', rejects both PI code points and ','.
    for code in (letter_a, underscore):
        assert rsre_char.is_word(code)
    for code in (UPPER_PI, LOWER_PI, comma):
        assert not rsre_char.is_word(code)
    #
    # is_uni_word: additionally accepts both PI code points.
    for code in (letter_a, underscore, UPPER_PI, LOWER_PI):
        assert rsre_char.is_uni_word(code)
    assert not rsre_char.is_uni_word(comma)