def _create_examples(self, lines, set_type):
    """Turns parsed rows into a list of `InputExample` objects.

    The row at index 0 is skipped (presumably a header row). For every other
    row, columns 3 and 4 supply the two text segments. When `set_type` is
    "test", the guid is taken verbatim from column 0 and the label is the
    placeholder "0"; otherwise the guid is "<set_type>-<row index>" and the
    label is read from column 0.

    Args:
      lines: Iterable of rows; each row is indexed by column position.
      set_type: Name of the split being built, e.g. "test".

    Returns:
      A list with one `InputExample` per row after the first.
    """

    def _normalize(raw_text):
        # Text segments are lower-cased according to the do_lower_case flag.
        return tokenization.preprocess_text(
            raw_text, lower=FLAGS.do_lower_case)

    collected = []
    for row_idx, row in enumerate(lines):
        if row_idx == 0:
            continue
        sentence_a = _normalize(row[3])
        sentence_b = _normalize(row[4])
        if set_type != "test":
            example_id = "%s-%s" % (set_type, row_idx)
            # The label goes through preprocess_text with its default
            # `lower` setting, not the flag-controlled one.
            gold_label = tokenization.preprocess_text(row[0])
        else:
            # Test rows carry their own id in column 0; the label is a
            # fixed placeholder.
            example_id = row[0]
            gold_label = "0"
        collected.append(
            InputExample(
                guid=example_id,
                text_a=sentence_a,
                text_b=sentence_b,
                label=gold_label,
            )
        )
    return collected
def _create_examples(self, lines, set_type):
    """Turns parsed rows into a list of `InputExample` objects.

    The row at index 0 is skipped (presumably a header row). For every other
    row, column 0 supplies the guid, columns 8 and 9 supply the two text
    segments, and the last column supplies the label. When `set_type` is
    "test", the label is the fixed placeholder "contradiction" instead.

    Args:
      lines: Iterable of rows; each row is indexed by column position.
      set_type: Name of the split being built, e.g. "test".

    Returns:
      A list with one `InputExample` per row after the first.
    """

    def _normalize(raw_text):
        # Lower-casing is controlled by the do_lower_case flag.
        return tokenization.preprocess_text(
            raw_text, lower=FLAGS.do_lower_case)

    def _row_to_example(row):
        # Note(mingdachen): We will rely on this guid for GLUE submission.
        example_id = _normalize(row[0])
        premise = _normalize(row[8])
        hypothesis = _normalize(row[9])
        if set_type == "test":
            gold_label = "contradiction"
        else:
            # The label goes through preprocess_text with its default
            # `lower` setting, not the flag-controlled one.
            gold_label = tokenization.preprocess_text(row[-1])
        return InputExample(
            guid=example_id,
            text_a=premise,
            text_b=hypothesis,
            label=gold_label,
        )

    return [
        _row_to_example(row)
        for row_idx, row in enumerate(lines)
        if row_idx != 0
    ]