def encode_fn(e: QCKCompactEntry) -> OrderedDict:
    """Encode one ``(query, candidate, qk_out_entry)`` entry as features.

    The entry is unpacked into its three parts. A data id is assigned
    through ``data_id_man.assign`` for a record holding the query, the
    candidate and ``qk_out_entry.kdp``; the query and candidate texts are
    tokenized with ``cache_tokenizer``; and the resulting
    ``PayloadAsTokens`` is handed to ``encode_two_inputs``.

    NOTE(review): ``cache_tokenizer``, ``data_id_man``, ``max_seq_length``
    and ``tokenizer`` are free names resolved outside this function; their
    definitions are not visible from here.
    """
    # Bare annotation only: gives static tooling the candidate's type.
    cand: QCKCandidate
    query, cand, qk_entry = e

    # Record handed to the data-id manager for this instance.
    id_info = {
        'query': query,
        'candidate': cand,
        'kdp': qk_entry.kdp,
    }

    passage_tokens = qk_entry.passage_tokens
    query_tokens = cache_tokenizer.tokenize(query.text)
    cand_tokens = cache_tokenizer.tokenize(cand.text)

    payload = PayloadAsTokens(
        passage=passage_tokens,
        text1=query_tokens,
        text2=cand_tokens,
        data_id=data_id_man.assign(id_info),
        is_correct=0,  # this encoder always writes 0 here
    )
    return encode_two_inputs(max_seq_length, tokenizer, payload)
def encode(inst: PayloadAsTokens) -> OrderedDict:
    """Encode an already-tokenized payload via ``encode_two_inputs``.

    ``max_seq_length`` and ``tokenizer`` are free names resolved outside
    this function; ``inst`` is forwarded unchanged.
    """
    encoded = encode_two_inputs(
        max_seq_length,
        tokenizer,
        inst,
    )
    return encoded
def encode_two_inputs_w_score(max_seq_length, tokenizer, inst: Payload) -> OrderedDict:
    """Encode ``inst`` with ``encode_two_inputs`` and attach its score.

    ``inst`` is first converted with ``get_payload_as_token``; the encoded
    features are then extended with a ``'rel_score'`` entry built by
    ``create_float_feature`` from the single value ``inst.kdp_score``.

    Returns the features mapping produced by ``encode_two_inputs`` with
    the extra ``'rel_score'`` key set.
    """
    token_payload = get_payload_as_token(inst)
    encoded = encode_two_inputs(max_seq_length, tokenizer, token_payload)

    # The score is wrapped in a one-element list before conversion.
    score_feature = create_float_feature([inst.kdp_score])
    encoded['rel_score'] = score_feature
    return encoded
def encode_fn(self, inst: PayloadAsTokens) -> OrderedDict:
    """Encode a tokenized payload using this object's settings.

    Forwards ``self.max_seq_length``, ``self.tokenizer`` and ``inst`` to
    ``encode_two_inputs`` and returns its result unchanged.
    """
    seq_len = self.max_seq_length
    tok = self.tokenizer
    return encode_two_inputs(seq_len, tok, inst)
def encode(inst: Payload) -> OrderedDict:
    """Convert ``inst`` with ``convert_sub_token`` and encode the result.

    ``tokenizer`` and ``max_seq_length`` are free names resolved outside
    this function. The converted payload is passed to
    ``encode_two_inputs``, whose return value is returned as-is.
    """
    # Conversion runs first; its output is what actually gets encoded.
    token_inst = convert_sub_token(tokenizer, inst)
    encoded = encode_two_inputs(max_seq_length, tokenizer, token_inst)
    return encoded