import numpy as np

# jieba_utils is assumed to be a project-local wrapper around jieba segmentation;
# word_vector_model is assumed to be a trained gensim Word2Vec model loaded
# elsewhere in this module, e.g. Word2Vec.load('word2vec.model').
import jieba_utils


def comment_to_word_vectors(comment):
    """Segment a comment and return the word vectors of the words known to the model."""
    words = []
    sentence_words = jieba_utils.cut(comment)
    for word in sentence_words:
        if word in word_vector_model.wv:
            words.append(word_vector_model.wv[word])
    return words
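# Illustrative sketch (not part of the original source): stack the vectors
# returned by comment_to_word_vectors() into a 2-D numpy array for a
# downstream classifier. Assumes word_vector_model is a gensim Word2Vec
# model, so word_vector_model.wv.vector_size gives the embedding dimension.
def comment_to_matrix(comment):
    vectors = comment_to_word_vectors(comment)
    if not vectors:
        # No segmented word was in the vocabulary; return a single zero row
        # so callers always receive a 2-D array.
        return np.zeros((1, word_vector_model.wv.vector_size))
    return np.array(vectors)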
def test(comment):
    """Debug helper: segment a comment and report which words are missing from the model."""
    sentence_words = jieba_utils.cut(comment)
    print(sentence_words)
    words = []
    for word in sentence_words:
        if word in word_vector_model.wv:
            words.append(word_vector_model.wv[word])
        else:
            print(word, ' is not in the model')
    return words
def comment_to_indices(comment, word_to_index):
    """Convert a comment into a list of word indices; unknown words map to len(word_to_index)."""
    indices = []
    size = len(word_to_index)
    # Materialize the segmentation so it can be both joined for printing and
    # iterated again below, in case jieba_utils.cut returns a generator.
    words = list(jieba_utils.cut(comment))
    print('Comment: {}\n Terms: {}'.format(comment, ','.join(words)))
    for word in words:
        if word in word_to_index:
            indices.append(word_to_index[word])
        else:
            indices.append(size)  # out-of-vocabulary words share the last index
    return indices
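# Illustrative sketch (not part of the original source): pad or truncate the
# index sequences returned by comment_to_indices() to a fixed length, as is
# typically needed before feeding them to an embedding layer. The padding
# index is left as a parameter; len(word_to_index) + 1 (one past the
# out-of-vocabulary index used above) is one reasonable choice.
def pad_indices(indices, max_length, padding_index):
    if len(indices) >= max_length:
        return indices[:max_length]
    return indices + [padding_index] * (max_length - len(indices))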
def comment_to_one_hot(comment, word_index_dict):
    """Convert a comment into a list of one-hot vectors, one per segmented word."""
    data = []
    words = jieba_utils.cut(comment)
    for word in words:
        # One extra slot at the end is reserved for out-of-vocabulary words.
        data_one_hot = np.zeros(len(word_index_dict) + 1)
        if word in word_index_dict:
            index = word_index_dict[word]
            data_one_hot[index] = 1
        else:
            data_one_hot[-1] = 1
        data.append(data_one_hot.tolist())
    return data
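# Illustrative usage (hypothetical input text, not from the original source):
# each row of the returned list is a one-hot vector of length
# len(word_index_dict) + 1, with the last slot marking out-of-vocabulary words.
#
#   one_hot_rows = comment_to_one_hot('這部電影很好看', word_to_index)
#   one_hot_matrix = np.array(one_hot_rows)  # shape: (num_words, len(word_to_index) + 1)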
def build_up_word_list(comments, word_list_file_name=None, output_file_name=None):
    """Load a word list from a file, or build one by segmenting the given comments."""
    if word_list_file_name:
        print('Loading word list from file ' + word_list_file_name)
        with open(word_list_file_name, 'r', encoding='utf-8') as fr:
            word_list = [line.strip() for line in fr.readlines() if len(line.strip()) != 0]
    else:
        wordset = set()
        print('No word list file specified, creating new word list.')
        for comment in comments:
            words = jieba_utils.cut(comment)
            wordset.update(words)
        word_list = list(wordset)
    if output_file_name:
        with open(output_file_name, 'w+', encoding='utf-8') as fw:
            for word in word_list:
                fw.write(word + '\n')
        print('Word list saved to ' + output_file_name + '.')
    return word_list
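# Helper sketch (not part of the original source): build the word -> index
# mapping consumed by comment_to_indices() and comment_to_one_hot() from the
# word list returned by build_up_word_list(). Index len(word_list) is then
# implicitly reserved for out-of-vocabulary words by those functions.
def build_word_to_index(word_list):
    return {word: index for index, word in enumerate(word_list)}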
def comment_to_n_of_words(comment):
    return jieba_utils.cut(comment)