def build_vocabulary(config):
    """Build a vocabulary from the training captions and return it.

    Loads the caption data named by ``config.train_caption_file`` via
    ``COCO``, applies ``filter_by_cap_len(config.max_caption_length)`` to
    it, and builds a ``Vocabulary(config.vocabulary_size)`` from the
    result of ``all_captions()``.

    Note that the vocabulary is NOT written to ``config.vocabulary_file``
    by this function: the save call is currently commented out, so the
    caller only receives the in-memory object.

    Args:
        config: Object exposing ``train_caption_file``,
            ``max_caption_length`` and ``vocabulary_size`` attributes.

    Returns:
        The ``Vocabulary`` instance after ``build`` has been called on it.
    """
    caption_data = COCO(config.train_caption_file)
    # Presumably drops captions longer than the configured maximum --
    # TODO confirm against COCO.filter_by_cap_len.
    caption_data.filter_by_cap_len(config.max_caption_length)

    vocab = Vocabulary(config.vocabulary_size)
    training_captions = caption_data.all_captions()
    vocab.build(training_captions)

    # Persistence is disabled for now; re-enable if the file is needed:
    # vocab.save(config.vocabulary_file)
    return vocab