def topinyin_sentence(sentence):
    """Convert a sentence into a list of simplified pinyin strings.

    Surrounding whitespace is stripped from ``sentence`` before it is handed
    to ``PinyinHelper.convertToPinyinFromSentence``.  Every item the
    converter yields is passed through ``utils.simplify_pinyin``, except an
    item equal to '〇', which is emitted as 'ling' instead.

    Returns:
        A list with one entry per item produced by the converter.
    """
    syllables = PinyinHelper.convertToPinyinFromSentence(sentence.strip())
    return [
        'ling' if syllable == '〇' else utils.simplify_pinyin(syllable)
        for syllable in syllables
    ]
def translate(cn):
    """Convert ``cn`` to toneless pinyin and rewrite three specific spellings.

    The sequence returned by ``PinyinHelper.convertToPinyinFromSentence``
    (called with ``PinyinFormat.WITHOUT_TONE``) is patched in place and then
    returned: 'lve' becomes 'lue', 'nve' becomes 'nue', and 'r' becomes 'er'.
    All other entries are left untouched.
    """
    # (spelling produced by the converter, spelling to return)
    rewrites = (('lve', 'lue'), ('nve', 'nue'), ('r', 'er'))

    ret = PinyinHelper.convertToPinyinFromSentence(
        cn, pinyinFormat=PinyinFormat.WITHOUT_TONE)
    for index, syllable in enumerate(ret):
        for found, wanted in rewrites:
            if syllable == found:
                # No replacement value is itself a key, so one match is final.
                ret[index] = wanted
                break
    return ret
def topinyin(s):
    """Convert ``s`` into a list of simplified pinyin strings.

    ``s`` is expected to consist entirely of Chinese characters.

    The input is normalised with ``util.as_text`` and converted with
    ``PinyinHelper.convertToPinyinFromSentence``.  Each item is normalised
    with ``util.as_text`` and then simplified with ``util.simplify_pinyin``;
    an item equal to '〇' is emitted as 'ling' instead.

    If the concatenated result contains a comma, the normalised input and
    the concatenated result are printed and the process exits via
    ``sys.exit()``.

    Returns:
        The list of simplified pinyin strings.
    """
    text = util.as_text(s)

    result = []
    for raw in PinyinHelper.convertToPinyinFromSentence(text):
        syllable = util.as_text(raw)
        result.append(
            'ling' if syllable == '〇' else util.simplify_pinyin(syllable))

    joined = ''.join(result)
    if ',' in joined:
        # Sanity check: dump the offending input/output pair and abort.
        print(text)
        print(joined)
        sys.exit()
    return result
def readdatafromfile(filename):
    """Open ``filename`` and return its content parsed as JSON."""
    with open(filename) as outfile:
        return json.load(outfile)


# Maps a simplified, comma-joined pinyin string to a dict of
# {word: accumulated numeric value} for every word with that reading.
result = {}
# Largest / smallest accumulated per-word value seen while reading word.txt.
max_num = 0.
min_num = 100000000000000.

# Each useful line of word.txt has the form "<word>=<number>".
for line in open('./word.txt'):
    line = util.as_text(line.strip())
    if '=' not in line:
        # Lines without a separator carry no data.
        continue
    # Unpacking into two names raises ValueError if the line has more than
    # one '='.
    word, num = line.split('=')
    num = float(num)
    # `cut` is not defined in the visible code; presumably a word-segmentation
    # callable -- TODO confirm.
    pinyin_list = PinyinHelper.convertToPinyinFromSentence(word, segment=cut)
    pinyins = ','.join(pinyin_list)
    pinyins = util.simplify_pinyin(pinyins)
    # Create the nested entries on first sight, then accumulate the value.
    result.setdefault(pinyins, {})
    result[pinyins].setdefault(word, 0)
    result[pinyins][word] += num
    max_num = max(max_num, result[pinyins][word])
    min_num = min(min_num, result[pinyins][word])

# Lines of phrase.txt also contain '='; the part after it is ignored and
# every phrase gets the fixed value 1.
for line in open('./phrase.txt'):
    line = util.as_text(line.strip())
    if '=' not in line:
        continue
    word, _ = line.split('=')
    num = 1.
    # NOTE(review): the visible code ends here; `num` and `pinyin_list` are
    # not used within the visible lines -- the rest of the loop body may be
    # missing from this view.
    pinyin_list = PinyinHelper.convertToPinyinFromSentence(word, segment=cut)
def topinyin_single(word):
    """Convert ``word`` into one concatenated simplified-pinyin string.

    Surrounding whitespace is stripped from ``word`` before it is handed to
    ``PinyinHelper.convertToPinyinFromSentence``.  Every item the converter
    yields is passed through ``utils.simplify_pinyin`` and the results are
    joined without a separator.  Any '〇' remaining in the joined string is
    replaced with 'ling'.

    Returns:
        The joined pinyin string.
    """
    pylist = PinyinHelper.convertToPinyinFromSentence(word.strip())
    joined = ''.join(utils.simplify_pinyin(py) for py in pylist)
    # str.replace returns a new string (str is immutable).  The previous code
    # discarded that return value, so '〇' was never turned into 'ling'.
    return joined.replace('〇', 'ling')