Esempio n. 1
0
def count_total_size(input_path, out_path):
    """Count the items yielded by the index generator for ``input_path``.

    The count is cached as a pickle at ``out_path``: when that file already
    exists its content is loaded and returned without reading
    ``input_path``. Passing ``out_path=""`` skips writing the cache.

    Args:
        input_path: Path handed to ``index_sequence_maker.index_generator``.
        out_path: Location of the pickle cache, or ``""`` for no caching.

    Returns:
        The number of items produced by the generator, or whatever value
        was stored in an existing cache file.
    """
    if os.path.exists(out_path):
        # The cache is written with "wb", so it must be read back in binary
        # mode; the ``with`` block also closes the handle deterministically.
        # NOTE: unpickling executes arbitrary code -- only use trusted caches.
        with open(out_path, "rb") as cache_file:
            return cPickle.load(cache_file)

    generator = index_sequence_maker.index_generator(input_path)
    # Generator expression: count without building a throwaway list.
    total_size = sum(1 for _ in generator)
    if out_path != "":
        with open(out_path, "wb") as cache_file:
            cPickle.dump(total_size, cache_file)
    return total_size
Esempio n. 2
0
def make_counter(input_path, output_path):
    """Build (or load) a ``collections.Counter`` of index occurrences.

    When ``output_path`` already exists, the pickled object stored there is
    returned and ``input_path`` is not read. Otherwise every value yielded
    by ``index_sequence_maker.index_generator(input_path)`` is counted, the
    resulting counter is pickled to ``output_path`` and then returned.

    Args:
        input_path: Path handed to ``index_sequence_maker.index_generator``.
        output_path: Location of the pickle cache.

    Returns:
        A ``collections.Counter`` mapping each index to its number of
        occurrences, or whatever value was stored in an existing cache file.
    """
    if os.path.exists(output_path):
        # Binary mode matches the "wb" used when writing; ``with`` closes
        # the handle instead of leaking it.
        # NOTE: unpickling executes arbitrary code -- only use trusted caches.
        with open(output_path, "rb") as cache_file:
            return cPickle.load(cache_file)

    # Counter consumes the iterable directly; no manual defaultdict needed.
    indices = index_sequence_maker.index_generator(input_path)
    ret = collections.Counter(indices)
    with open(output_path, "wb") as cache_file:
        cPickle.dump(ret, cache_file)
    return ret
Esempio n. 3
0
def find_train_max(input_path, output_path):
    """Find (or load) the largest index in the sequence at ``input_path``.

    When ``output_path`` already exists, the pickled value stored there is
    returned and ``input_path`` is not read. Otherwise the generator from
    ``index_sequence_maker.index_generator(input_path)`` is scanned, and the
    maximum is pickled to ``output_path`` and returned.

    Args:
        input_path: Path handed to ``index_sequence_maker.index_generator``.
        output_path: Location of the pickle cache.

    Returns:
        The largest index seen, or ``-1`` when the generator yields nothing
        greater than ``-1`` (including when it yields nothing at all); on a
        cache hit, whatever value was stored in the cache file.
    """
    if os.path.exists(output_path):
        # Binary mode matches the "wb" used when writing; ``with`` closes
        # the handle instead of leaking it.
        # NOTE: unpickling executes arbitrary code -- only use trusted caches.
        with open(output_path, "rb") as cache_file:
            return cPickle.load(cache_file)

    # -1 is the starting value, so it is also the result for an empty input.
    max_index = -1
    for index in index_sequence_maker.index_generator(input_path):
        if index > max_index:
            max_index = index
    with open(output_path, "wb") as cache_file:
        cPickle.dump(max_index, cache_file)
    return max_index
 def index_sequence_generator(self, path):
     """Return ``index_sequence_maker.index_generator`` for this object's file.

     The ``path`` argument is accepted but not used: the generator is always
     created from ``self.index_sequence_file_path``.
     NOTE(review): confirm that ignoring ``path`` is intentional.
     """
     make_generator = index_sequence_maker.index_generator
     return make_generator(self.index_sequence_file_path)
Esempio n. 5
0
def save_dataset(input_path, output_path):
    """Collect the index sequence into a NumPy array and pickle it.

    This function does not check for an existing file: the sequence is
    always re-read and ``output_path`` is always (over)written.

    Args:
        input_path: Path handed to ``index_sequence_maker.index_generator``.
        output_path: Destination file for the pickled array.

    Returns:
        The ``numpy`` array built from every value the generator yields.
    """
    indices = index_sequence_maker.index_generator(input_path)
    dataset = np.array(list(indices))
    # Close the file explicitly so the pickle is flushed to disk before
    # returning, rather than relying on garbage collection of the handle.
    with open(output_path, "wb") as out_file:
        cPickle.dump(dataset, out_file)
    return dataset