Example #1
0
    def encode_fn(e: QCKCompactEntry) -> OrderedDict:
        """Encode one compact entry through ``encode_two_inputs``.

        The entry is unpacked into ``(query, candidate, qk_out_entry)``. The
        query, the candidate and the entry's ``kdp`` are bundled into a dict
        that is handed to ``data_id_man.assign`` to obtain the payload's
        ``data_id``. ``is_correct`` is always set to 0 here.
        """
        # candidate is expected to be a QCKCandidate.
        query, candidate, qk_out_entry = e

        id_info = {
            'query': query,
            'candidate': candidate,
            'kdp': qk_out_entry.kdp,
        }

        # Gather the payload fields in the order they are passed below, so the
        # tokenizer cache and the id manager are touched in a fixed sequence.
        passage_tokens = qk_out_entry.passage_tokens
        query_tokens = cache_tokenizer.tokenize(query.text)
        candidate_tokens = cache_tokenizer.tokenize(candidate.text)
        data_id = data_id_man.assign(id_info)

        payload = PayloadAsTokens(
            passage=passage_tokens,
            text1=query_tokens,
            text2=candidate_tokens,
            data_id=data_id,
            is_correct=0,
        )
        return encode_two_inputs(max_seq_length, tokenizer, payload)
Example #2
0
 def encode(inst: PayloadAsTokens) -> OrderedDict:
     """Encode ``inst`` with the enclosing scope's sequence length and tokenizer.

     Thin adapter: forwards ``max_seq_length``, ``tokenizer`` and ``inst`` to
     ``encode_two_inputs`` and returns its result unchanged.
     """
     encoded = encode_two_inputs(max_seq_length, tokenizer, inst)
     return encoded
Example #3
0
def encode_two_inputs_w_score(max_seq_length, tokenizer,
                              inst: Payload) -> OrderedDict:
    """Encode ``inst`` as two inputs and attach its score as ``rel_score``.

    ``inst`` is first converted with ``get_payload_as_token`` and encoded via
    ``encode_two_inputs``. The resulting mapping then gets one extra entry,
    ``'rel_score'``, built by ``create_float_feature`` from a single-element
    list holding ``inst.kdp_score``.
    """
    token_payload = get_payload_as_token(inst)
    encoded = encode_two_inputs(max_seq_length, tokenizer, token_payload)

    score_values = [inst.kdp_score]
    encoded['rel_score'] = create_float_feature(score_values)
    return encoded
Example #4
0
 def encode_fn(self, inst: PayloadAsTokens) -> OrderedDict:
     """Encode ``inst`` using this object's sequence length and tokenizer.

     Reads ``self.max_seq_length`` and ``self.tokenizer`` and forwards them,
     together with ``inst``, to ``encode_two_inputs``.
     """
     seq_length = self.max_seq_length
     tokenizer = self.tokenizer
     return encode_two_inputs(seq_length, tokenizer, inst)
Example #5
0
 def encode(inst: Payload) -> OrderedDict:
     """Convert ``inst`` with ``convert_sub_token`` and encode the result.

     The converted payload is passed to ``encode_two_inputs`` along with the
     enclosing scope's ``max_seq_length`` and ``tokenizer``.
     """
     sub_token_payload = convert_sub_token(tokenizer, inst)
     encoded = encode_two_inputs(max_seq_length, tokenizer, sub_token_payload)
     return encoded