예제 #1
0
 def get_sentence_examples(self, questions):
     """Lazily yield one InputExample for each entry of ``questions``.

     Each entry is read at positions 0 and 1; both values are passed
     through ``str()`` and ``tokenization.convert_to_unicode`` to form
     ``text_a`` and ``text_b``. No label is read from the input: every
     example carries the placeholder label ``'0'``. The guid is
     ``'test-<index>'`` where index is the entry's position.
     """
     # The label is the same constant string for every yielded example.
     placeholder_label = str(0)
     for position, pair in enumerate(questions):
         first_text = tokenization.convert_to_unicode(str(pair[0]))
         second_text = tokenization.convert_to_unicode(str(pair[1]))
         yield InputExample(guid='test-%d' % position,
                            text_a=first_text,
                            text_b=second_text,
                            label=placeholder_label)
예제 #2
0
 def get_dev_examples(self, data_dir):
     """Load ``dev.csv`` from ``data_dir`` and return a list of InputExample.

     The file is read with ``pd.read_csv`` using UTF-8 encoding. For each
     row, column 0 becomes ``text_a`` and column 1 becomes ``text_b``
     (both via ``str()`` and ``tokenization.convert_to_unicode``), and
     column 2 is stringified into ``label``.
     """
     csv_path = os.path.join(data_dir, 'dev.csv')
     # Iterate the raw value array so each row is indexed positionally.
     rows = pd.read_csv(csv_path, encoding='utf-8').values
     # NOTE: guids use the 'test-' prefix even though these are dev rows.
     return [
         InputExample(guid='test-%d' % row_no,
                      text_a=tokenization.convert_to_unicode(str(row[0])),
                      text_b=tokenization.convert_to_unicode(str(row[1])),
                      label=str(row[2]))
         for row_no, row in enumerate(rows)
     ]