def get_sentence_examples(self, questions):
    for index, data in enumerate(questions):
        guid = 'test-%d' % index
        text_a = tokenization.convert_to_unicode(str(data))
        text_b = None
        # label = str(0)
        label = self.labels[0]  # placeholder label taken from the collected training labels
        yield InputExample(guid=guid, text_a=text_a, text_b=text_b, label=label)
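# Note on get_sentence_examples(): it reuses self.labels[0] as a dummy label, so
# get_train_examples() (which populates self.labels) must have been called first.
# A hypothetical prediction-time call, assuming `processor` is an instance of this class:
#
#     examples = list(processor.get_sentence_examples(["text to classify"]))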
def get_test_examples(self, data_dir):
    file_path = os.path.join(data_dir, 'cnews.test.txt')
    with open(file_path, 'r', encoding="utf-8") as f:
        reader = f.readlines()
    # random.shuffle(reader)  # do not shuffle the test set, so results stay comparable
    examples = []
    for index, line in enumerate(reader):
        guid = 'test-%d' % index
        split_line = line.strip().split("\t")
        text_a = tokenization.convert_to_unicode(split_line[1])
        text_b = None
        label = split_line[0]
        examples.append(InputExample(guid=guid, text_a=text_a, text_b=text_b, label=label))
    return examples
def get_dev_examples(self, data_dir):
    file_path = os.path.join(data_dir, 'sentiment_valid.txt')
    with open(file_path, 'r', encoding="utf-8") as f:
        reader = f.readlines()
    random.shuffle(reader)
    examples = []
    for index, line in enumerate(reader):
        guid = 'dev-%d' % index
        split_line = line.strip().split('\t')
        text_a = tokenization.convert_to_unicode(split_line[1])
        text_b = None
        label = split_line[0]
        examples.append(InputExample(guid=guid, text_a=text_a, text_b=text_b, label=label))
    return examples
def get_train_examples(self, data_dir):
    file_path = os.path.join(data_dir, 'train.txt')
    with open(file_path, 'r', encoding="utf-8") as f:
        reader = f.readlines()
    random.seed(0)
    random.shuffle(reader)  # note: the training set must be shuffled
    examples, self.labels = [], []
    for index, line in enumerate(reader):
        guid = 'train-%d' % index
        split_line = line.strip().split("\t")
        text_a = tokenization.convert_to_unicode(split_line[1])
        text_b = None
        label = split_line[0]
        examples.append(InputExample(guid=guid, text_a=text_a, text_b=text_b, label=label))
        self.labels.append(label)
    return examples
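# A BERT run_classifier-style DataProcessor also exposes a get_labels() method.
# A minimal sketch, assuming self.labels has been filled by get_train_examples()
# above; the real class may define the label list differently (e.g. hard-coded
# category names).
def get_labels(self):
    """Return the distinct labels collected from the training file."""
    return sorted(set(self.labels))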