# Testing phase.
def test(data_manager, lda):
    """Run the testing steps using the given data manager and LDA object.

    Wraps ``data_manager`` and ``lda`` in a ``TestingDataManager`` and then
    calls, in order, its image document-topic matrix step, its textual
    document-topic matrix step and its ranking step. Returns nothing.
    """
    evaluator = TestingDataManager(data_manager, lda)
    evaluator.create_testing_img_document_topic_matrix()
    evaluator.create_testing_textual_document_topic_matrix()
    evaluator.create_ranking()


if __name__ == '__main__':
    # Build the vocabulary: either the custom one or the gensim one.
    textual_dictionary = TextualDictionary()
    # textual_dictionary.create_custom_vocabulary()
    textual_dictionary.create_gensim_dictionary()

    data_manager = DataManager(textual_dictionary)
    data_manager.count_textual_training_img_ids()
    # data_manager.load_testing_img_ids()

    # Initialize the text corpus for training; it is sized by the number
    # of textual training image ids held by the data manager.
    corpus = ConcatenatedCorpus(
        len(data_manager.textual_train_image_ids),
        textual_dictionary,
    )

    # Initialize LDA and start training.
    lda = ConcatenatedLDA(data_manager, corpus)
    lda.train_lda()

    # NOTE(review): `teaser` is not defined in the visible part of this
    # file, while `test` above takes the same arguments -- confirm whether
    # `teaser` is defined/imported elsewhere or `test` was intended.
    teaser(data_manager, lda)