Пример #1
0
def topinyin_sentence(sentence):
    """Convert a sentence into a list of simplified pinyin items.

    The sentence is stripped of surrounding whitespace and handed to
    ``PinyinHelper.convertToPinyinFromSentence``. Every item it returns is
    passed through ``utils.simplify_pinyin``, except the item '〇', which is
    mapped directly to 'ling'.

    Returns a list with one entry per item produced by the converter.
    """
    syllables = PinyinHelper.convertToPinyinFromSentence(sentence.strip())
    return [
        'ling' if syllable == '〇' else utils.simplify_pinyin(syllable)
        for syllable in syllables
    ]
Пример #2
0
def translate(cn):
    """Convert ``cn`` to toneless pinyin and normalise a few spellings.

    The result of ``PinyinHelper.convertToPinyinFromSentence`` (requested
    with ``PinyinFormat.WITHOUT_TONE``) is patched in place: items equal to
    'lve', 'nve' or 'r' are rewritten to 'lue', 'nue' and 'er' respectively.
    All other items are left untouched. The patched sequence is returned.
    """
    # Exact-match rewrites; anything not listed here is kept as is.
    replacements = {'lve': 'lue', 'nve': 'nue', 'r': 'er'}
    ret = PinyinHelper.convertToPinyinFromSentence(
        cn, pinyinFormat=PinyinFormat.WITHOUT_TONE)
    for index, syllable in enumerate(ret):
        if syllable in replacements:
            ret[index] = replacements[syllable]
    return ret
Пример #3
0
def topinyin(s):
    """
    Convert ``s`` into a list of simplified pinyin items.

    ``s`` is expected to consist entirely of Chinese characters. It is
    normalised with ``util.as_text`` and converted with
    ``PinyinHelper.convertToPinyinFromSentence``; each item is normalised
    with ``util.as_text`` and then passed through ``util.simplify_pinyin``,
    except the item '〇', which becomes 'ling'.

    If the concatenated output contains a comma, the normalised input and
    the concatenated output are printed and the process exits through
    ``sys.exit()``.
    """
    text = util.as_text(s)
    result = []
    for raw in PinyinHelper.convertToPinyinFromSentence(text):
        syllable = util.as_text(raw)
        if syllable != '〇':
            result.append(util.simplify_pinyin(syllable))
        else:
            result.append('ling')

    joined = ''.join(result)
    if ',' in joined:
        # A comma in the output is treated as fatal: dump the offending
        # input/output pair and stop the program.
        print(text)
        print(joined)
        sys.exit()
    return result
Пример #4
0
def topinyin(s):
    """
    Return the simplified pinyin items for ``s`` as a list.

    ``s`` should contain only Chinese characters. Both the input and every
    item returned by ``PinyinHelper.convertToPinyinFromSentence`` are
    normalised with ``util.as_text``. The item '〇' is emitted as 'ling';
    every other item goes through ``util.simplify_pinyin``.

    When the joined result contains ',', the normalised input and the
    joined result are printed and ``sys.exit()`` is called.
    """
    s = util.as_text(s)
    # The inner generator is lazy, so each item is normalised and simplified
    # one at a time, in order.
    normalised = (
        util.as_text(item)
        for item in PinyinHelper.convertToPinyinFromSentence(s)
    )
    result = [
        'ling' if item == '〇' else util.simplify_pinyin(item)
        for item in normalised
    ]

    flattened = ''.join(result)
    if ',' not in flattened:
        return result

    # Unexpected comma: report the input and output, then terminate.
    print(s)
    print(flattened)
    sys.exit()
    return result
Пример #5
0
def readdatafromfile(filename):
    """Load and return the JSON document stored in ``filename``.

    The file is opened in binary mode so that decoding does not depend on
    the platform's default text encoding; ``json.load`` detects UTF-8,
    UTF-16 or UTF-32 from the raw bytes itself (binary input is supported
    by ``json.load`` from Python 3.6 on).

    Raises whatever ``open`` raises for an unreadable path and whatever
    ``json.load`` raises for malformed content.
    """
    with open(filename, 'rb') as infile:
        return json.load(infile)


# Accumulated counts: result[pinyin_key][word] -> summed number.
result = {}
# Running maximum / minimum over the accumulated per-word counts.
max_num = 0.
min_num = 100000000000000.

# word.txt: every useful line has the form "<word>=<number>".
# The file is opened in a ``with`` block so the handle is closed
# deterministically instead of being left to the garbage collector.
with open('./word.txt') as word_file:
    for line in word_file:
        line = util.as_text(line.strip())
        if '=' not in line:
            # Lines without a separator carry no entry; skip them.
            continue
        # NOTE: a line with more than one '=' raises ValueError here.
        word, num = line.split('=')
        num = float(num)
        # ``cut`` is defined outside this view; presumably a segmentation
        # callable for the converter -- confirm.
        pinyin_list = PinyinHelper.convertToPinyinFromSentence(
            word, segment=cut)
        # The lookup key is the comma-joined pinyin list, simplified as a whole.
        pinyins = ','.join(pinyin_list)
        pinyins = util.simplify_pinyin(pinyins)
        result.setdefault(pinyins, {}).setdefault(word, 0)
        result[pinyins][word] += num
        max_num = max(max_num, result[pinyins][word])
        min_num = min(min_num, result[pinyins][word])

# phrase.txt: lines of the form "<phrase>=<something>"; only the part before
# '=' is used and every phrase is given a fixed weight of 1.0.
# NOTE(review): the remainder of this loop body is not visible here, so what
# happens with ``num`` and ``pinyin_list`` afterwards cannot be stated.
for line in open('./phrase.txt'):
    line = util.as_text(line.strip())
    # Skip lines that have no '=' separator.
    if '=' not in line:
        continue
    # The value after '=' is deliberately discarded.
    word, _ = line.split('=')
    num = 1.
    # ``cut`` comes from outside this view; presumably a segmentation
    # callable -- confirm.
    pinyin_list = PinyinHelper.convertToPinyinFromSentence(word, segment=cut)
Пример #6
0
def topinyin_single(word):
    """Return the simplified pinyin of ``word`` as one concatenated string.

    ``word`` is stripped of surrounding whitespace and converted with
    ``PinyinHelper.convertToPinyinFromSentence``; each returned item is
    passed through ``utils.simplify_pinyin`` and the pieces are joined
    without a separator. Any '〇' left in the joined string is replaced by
    'ling'.
    """
    pylist = PinyinHelper.convertToPinyinFromSentence(word.strip())
    joined = ''.join([utils.simplify_pinyin(py) for py in pylist])
    # str.replace returns a new string (strings are immutable); the previous
    # code discarded that return value, so '〇' was never actually replaced.
    return joined.replace('〇', 'ling')
Пример #7
0
def readdatafromfile(filename):
    """Read ``filename`` and return the parsed JSON value it contains.

    The file is read as bytes rather than text, so the result does not
    depend on the locale's default encoding: ``json.load`` works out
    whether the bytes are UTF-8, UTF-16 or UTF-32 (binary input is accepted
    by ``json.load`` from Python 3.6 on).

    Errors from ``open`` (unreadable path) and from ``json.load``
    (malformed content) propagate to the caller.
    """
    with open(filename, 'rb') as source:
        return json.load(source)

# Nested mapping of accumulated counts: pinyin key -> {word: total}.
result = {}
# Largest and smallest accumulated per-word totals seen so far.
max_num = 0.
min_num = 100000000000000.


# Read "<word>=<number>" entries from word.txt. Using ``with`` guarantees
# the file handle is closed when the loop finishes or raises.
with open('./word.txt') as word_file:
    for line in word_file:
        line = util.as_text(line.strip())
        if '=' not in line:
            # No separator means no entry on this line.
            continue
        # NOTE: more than one '=' on a line makes this unpacking raise
        # ValueError.
        word, num = line.split('=')
        num = float(num)
        # ``cut`` is not defined in the visible code; presumably a
        # segmentation callable passed to the converter -- confirm.
        pinyin_list = PinyinHelper.convertToPinyinFromSentence(
            word, segment=cut)
        # Key entries by the comma-joined, simplified pinyin string.
        pinyins = util.simplify_pinyin(','.join(pinyin_list))
        result.setdefault(pinyins, {}).setdefault(word, 0)
        result[pinyins][word] += num
        max_num = max(max_num, result[pinyins][word])
        min_num = min(min_num, result[pinyins][word])

# Walk phrase.txt, whose useful lines look like "<phrase>=<something>". Only
# the text before '=' is kept; each phrase is assigned a constant weight 1.0.
# NOTE(review): this loop continues past the visible code, so the later use of
# ``num`` and ``pinyin_list`` is unknown from here.
for line in open('./phrase.txt'):
    line = util.as_text(line.strip())
    # Lines lacking an '=' separator are ignored.
    if '=' not in line:
        continue
    # Right-hand side of '=' is intentionally thrown away.
    word, _ = line.split('=')
    num = 1.
    # ``cut`` is defined elsewhere; presumably a segmentation callable --
    # confirm.
    pinyin_list = PinyinHelper.convertToPinyinFromSentence(word, segment=cut)