예제 #1
0
    def split_data(self):
        """Route every clip in ``self.data`` into a training or validation pool.

        Each clip is indexed by ``'clip_id'`` (and, for training clips, by
        ``'sentence'``). The clip id is passed to
        ``Partition.clip_id_to_side`` and the returned side decides the pool:

        * ``'L'``          -> ``self.valid_pool``
        * ``'R'`` or ``'C'`` -> ``self.train_pool``

        A clip whose side is none of these values is placed in neither pool.
        Both pools are reset to empty lists at the start of every call.
        """
        # Start from empty pools so repeated calls do not accumulate clips.
        self.train_pool = []
        self.valid_pool = []

        partition = Partition()

        # Clip ids collected per split, in the order the clips are visited.
        # NOTE(review): these lists and train_corpus are not read in the
        # visible part of this method -- confirm they are consumed further
        # down (or elsewhere) before treating them as dead code.
        train_clips = []
        valid_clips = []

        # Sentences of the training clips only; validation sentences are
        # not collected here.
        train_corpus = []

        for clip in self.data:
            side = partition.clip_id_to_side(clip['clip_id'])
            if side == 'L':
                # Side 'L' is held out for validation.
                self.valid_pool.append(clip)
                valid_clips.append(clip['clip_id'])
            elif side == 'R' or side == 'C':
                # Sides 'R' and 'C' both feed the training set.
                self.train_pool.append(clip)
                train_clips.append(clip['clip_id'])
                train_corpus.append(clip['sentence'])