예제 #1
0
def normalize(orig_string):
    """Return a lowercased, stripped form of ``orig_string`` for comparison.

    The input is lowercased and passed through ``strip_non_alnum`` (which,
    per the original docstring, removes non-alphanumeric characters). If
    that leaves nothing, the original string is returned unchanged (and
    therefore not lowercased) so the result is never blanked out by
    normalization.
    """
    # NOTE: stop-word / short-token filtering and unaccent() are not applied.
    # `or` falls back to the untouched input when stripping yields an
    # empty (falsy) result.
    return strip_non_alnum(orig_string.lower()) or orig_string
예제 #2
0
def normalize(orig_string):
    """Lowercase ``orig_string`` and strip it, keeping the input if nothing is left.

    The lowercased text is run through ``strip_non_alnum`` (described by the
    original docstring as removing non-alphanumeric characters). When the
    stripped result is empty, the caller gets ``orig_string`` back exactly
    as passed in, without lowercasing.
    """
    # NOTE: stop-word / short-token filtering and unaccent() are not applied.
    cleaned = strip_non_alnum(orig_string.lower())
    return cleaned if cleaned else orig_string
예제 #3
0
def normalize(orig_string):
    """Return ``orig_string`` lowercased with non-alphanumeric characters stripped.

    Stripping is delegated to ``strip_non_alnum``. If the stripped result is
    empty, the original string is returned untouched (not lowercased), so a
    string made up only of stripped characters does not become blank.
    """
    cleaned = strip_non_alnum(orig_string.lower())
    if cleaned:
        return cleaned
    # Stripping removed everything: fall back to the caller's input as-is.
    return orig_string
예제 #4
0
파일: similarity.py 프로젝트: totyc/picard
def normalize(orig_string):
    """Produce a simplified form of ``orig_string``.

    The string is lowercased, then handed to ``strip_non_alnum`` to drop
    non-alphanumeric characters. An empty result means stripping would have
    blanked the string; in that case the original, unmodified
    ``orig_string`` is returned instead.
    """
    lowered = orig_string.lower()
    # An empty stripped result is falsy, so `or` selects the original input.
    return strip_non_alnum(lowered) or orig_string