def __init__(self, scp_file, utt2label_file, M):
    """Read the lookup tables and cache every feature matrix by its key.

    Args:
        scp_file: Path passed to ``ako.read_key_len`` and
            ``ko.read_mat_scp`` (presumably a Kaldi ``feats.scp`` --
            TODO confirm).
        utt2label_file: Path passed to ``ako.read_key_label``.
        M: Stored unchanged as ``self.M``; this constructor does not use it
            for anything else.
    """
    self.M = M
    self.scp_file = scp_file

    # Lookup tables produced by the project's reader helpers.
    self.utt2len = ako.read_key_len(scp_file)
    self.utt2label = ako.read_key_label(utt2label_file)

    # Feature generator yielding (key, matrix) pairs. It is iterated to the
    # end right below, so if it is a one-shot generator it is left exhausted
    # on ``self.feat_gen`` afterwards.
    self.feat_gen = ko.read_mat_scp(scp_file)
    self.utt2mat = {utt: feats for utt, feats in self.feat_gen}
def __init__(self, scp_file, utt2label_file, M):
    """Read all features once and stack them into two arrays.

    After construction ``self.feat_mat`` holds the row-wise stack
    (``np.vstack``) of ``slice(mat, M)`` for every (key, mat) pair read from
    ``scp_file``, and ``self.label_mat`` holds the concatenation
    (``np.hstack``) of each key's label repeated ``len(mat)`` times.

    Args:
        scp_file: Path passed to ``ako.read_key_len`` and
            ``ko.read_mat_scp`` (presumably a Kaldi ``feats.scp`` --
            TODO confirm).
        utt2label_file: Path passed to ``ako.read_key_label``; the result is
            indexed by the keys coming out of ``scp_file``.
        M: Stored as ``self.M`` and forwarded as the second argument of
            ``slice`` for every matrix.
    """
    self.M = M
    self.scp_file = scp_file
    self.utt2len = ako.read_key_len(scp_file)
    self.utt2label = ako.read_key_label(utt2label_file)
    self.feat_gen = ko.read_mat_scp(scp_file)  # feature generator

    # Per-utterance pieces, collected in generator order and joined once at
    # the end.
    feat_chunks = []
    label_chunks = []
    for utt, frames in self.feat_gen:
        # NOTE(review): `slice` is called as slice(matrix, M), which only
        # makes sense if a project helper shadows the builtin -- its
        # definition is not visible here; confirm it returns len(frames)
        # rows so features and labels stay aligned.
        feat_chunks.append(slice(frames, M))
        utt_label = self.utt2label[utt]
        label_chunks.append(np.repeat(utt_label, len(frames)))

    self.label_mat = np.hstack(label_chunks)
    self.feat_mat = np.vstack(feat_chunks)
# Ad-hoc script that exercises the adv_kaldi_io reader helpers against one
# hard-coded data directory and prints two of the results.
from __future__ import print_function

import adv_kaldi_io as ako

# Inputs: feature index, key -> label file, and one key to fetch on its own.
test_scp = '/export/b19/jlai/cstr/spoof/baseline/v1/data/train_cqcc/feats.scp'
test_utt2label = '/export/b19/jlai/cstr/spoof/baseline/v1/data/train_cqcc/utt2label'
test_key = 'M0001-T_1000027'

# Results are kept in module-level names but not printed.
all_key = ako.read_all_key(test_scp)
mat = ako.read_mat_key(test_scp, test_key)

length = ako.read_total_len(test_scp)
print(length)  # 938016 (value noted by the original author)

label = ako.read_key_label(test_utt2label)

key_map = ako.read_key_len(test_scp)
print(key_map)