class Test_WikiVectorSummary(unittest.TestCase):
    """Run WikiVectorSummaryCython over the wiki vectors and the WordNet table."""

    def setUp(self):
        """Record the input file paths and create the wiki-vector InputFile.

        Sets ``self.word_net_file_name`` (read later by the test) and
        ``self.input_module`` (an ``InputFile`` for the wiki vector file).
        """
        wiki_vector_file_name = APP_ROOT + '/../../Data/jawiki_vector/jawiki_vector_delete_first.txt'
        self.word_net_file_name = APP_ROOT + '/../../Data/wnjpn-all.tab'
        # Alternative inputs (the `_part` variants of the same files):
        # wiki_vector_file_name = APP_ROOT + '/../../Data/jawiki_vector/jawiki_vector_part.txt'
        # self.word_net_file_name = APP_ROOT + '/../../Data/wnjpn-all_part.tab'
        self.input_module = InputFile(wiki_vector_file_name)

    def test_summary_class(self):
        """Build the summary and write every resulting entry to its own file.

        Steps:
            1. Load the wiki vectors through ``self.input_module``.
            2. Load the WordNet file as tab-separated data and build the
               "all" and "split" dictionaries with ``SplitSynonymClass``.
            3. Feed both dictionaries and the vectors to
               ``WikiVectorSummaryCython`` and call ``get_similler_word()``.
            4. Write each value of ``get_split_dict()`` and of
               ``get_wiki_average_vector()`` to one file per key.

        The test makes no assertions; it fails only if one of the steps raises.
        """
        self.input_module.input_fast_large_file()
        wiki_vector = self.input_module.get_vector()

        # Re-point the input module at the WordNet table.
        self.input_module = InputFile(self.word_net_file_name)
        self.input_module.input_special_format_file("\t")
        test_data = self.input_module.get_file_data()

        self.split_synonym_class = SplitSynonymClass(test_data)
        self.split_synonym_class.make_dict()
        all_dict = self.split_synonym_class.get_all_dict()
        split_dict = self.split_synonym_class.get_split_dict()

        self.wiki_vector_summary = WikiVectorSummaryCython(
            all_dict, split_dict, wiki_vector)
        self.wiki_vector_summary.get_similler_word()

        split_dict = self.wiki_vector_summary.get_split_dict()
        self._write_values(
            split_dict, APP_ROOT + "/../../Data/wn_summary_all/", ".txt")

        class_average_vector = self.wiki_vector_summary.get_wiki_average_vector()
        self._write_values(
            class_average_vector,
            APP_ROOT + "/../../Data/wn_summary_all_class_average/",
            ".txt_vector.txt")

    @staticmethod
    def _write_values(mapping, path_prefix, suffix):
        """Write ``str(value)`` plus a newline to ``path_prefix + key + suffix``.

        One file is written per item of ``mapping``. The target directory must
        already exist, because ``open`` does not create it.
        """
        for key, value in mapping.items():
            # Write through the handle instead of rebinding sys.stdout: the
            # file is closed even if writing fails, and whatever stream the
            # test runner installed as sys.stdout is left untouched.
            with open(path_prefix + key + suffix, 'w') as out_file:
                out_file.write(str(value) + "\n")
class Test_WikiVectorSummary(unittest.TestCase):
    """Run WikiVectorSummaryCython over the wiki vectors and the WordNet table."""

    def setUp(self):
        """Store the data file paths and build the InputFile for the wiki vectors.

        After this runs, ``self.word_net_file_name`` holds the WordNet table
        path and ``self.input_module`` wraps the wiki vector file.
        """
        wiki_vector_file_name = APP_ROOT + '/../../Data/jawiki_vector/jawiki_vector_delete_first.txt'
        self.word_net_file_name = APP_ROOT + '/../../Data/wnjpn-all.tab'
        # Alternative inputs (the `_part` variants of the same files):
        # wiki_vector_file_name = APP_ROOT + '/../../Data/jawiki_vector/jawiki_vector_part.txt'
        # self.word_net_file_name = APP_ROOT + '/../../Data/wnjpn-all_part.tab'
        self.input_module = InputFile(wiki_vector_file_name)

    def test_summary_class(self):
        """Build the summary dictionaries and dump them to per-key text files.

        Loads the wiki vectors, builds the "all" and "split" dictionaries from
        the tab-separated WordNet file, runs
        ``WikiVectorSummaryCython.get_similler_word()``, then writes each value
        of ``get_split_dict()`` and ``get_wiki_average_vector()`` to a file
        named after its key. The output directories must already exist.

        The test makes no assertions; it fails only if one of the steps raises.
        """
        self.input_module.input_fast_large_file()
        wiki_vector = self.input_module.get_vector()

        # Switch the input module over to the WordNet table.
        self.input_module = InputFile(self.word_net_file_name)
        self.input_module.input_special_format_file("\t")
        test_data = self.input_module.get_file_data()

        self.split_synonym_class = SplitSynonymClass(test_data)
        self.split_synonym_class.make_dict()
        all_dict = self.split_synonym_class.get_all_dict()
        split_dict = self.split_synonym_class.get_split_dict()

        self.wiki_vector_summary = WikiVectorSummaryCython(all_dict, split_dict, wiki_vector)
        self.wiki_vector_summary.get_similler_word()

        # Write directly to each file rather than rebinding sys.stdout: the
        # handle is closed even on error, and the stream installed by the test
        # runner is never replaced with sys.__stdout__.
        split_dict = self.wiki_vector_summary.get_split_dict()
        for k, v in split_dict.items():
            with open(APP_ROOT + "/../../Data/wn_summary_all/" + k + ".txt", 'w') as fo:
                fo.write(str(v) + "\n")

        class_average_vector = self.wiki_vector_summary.get_wiki_average_vector()
        for k, v in class_average_vector.items():
            with open(APP_ROOT + "/../../Data/wn_summary_all_class_average/" + k + ".txt_vector.txt", 'w') as fo:
                fo.write(str(v) + "\n")
def test_summary_class(self):
    """Build the summary dictionaries and dump them to per-key text files.

    Loads the wiki vectors through ``self.input_module``, builds the "all"
    and "split" dictionaries from the tab-separated file named by
    ``self.word_net_file_name``, runs
    ``WikiVectorSummaryCython.get_similler_word()``, then writes each value
    of ``get_split_dict()`` and ``get_wiki_average_vector()`` to a file named
    after its key. The output directories must already exist.

    The test makes no assertions; it fails only if one of the steps raises.
    """
    self.input_module.input_fast_large_file()
    wiki_vector = self.input_module.get_vector()

    # Switch the input module over to the WordNet table.
    self.input_module = InputFile(self.word_net_file_name)
    self.input_module.input_special_format_file("\t")
    test_data = self.input_module.get_file_data()

    self.split_synonym_class = SplitSynonymClass(test_data)
    self.split_synonym_class.make_dict()
    all_dict = self.split_synonym_class.get_all_dict()
    split_dict = self.split_synonym_class.get_split_dict()

    self.wiki_vector_summary = WikiVectorSummaryCython(all_dict, split_dict, wiki_vector)
    self.wiki_vector_summary.get_similler_word()

    # Write directly to each file rather than rebinding sys.stdout: the handle
    # is closed even on error, and the stream installed by the test runner is
    # never replaced with sys.__stdout__.
    split_dict = self.wiki_vector_summary.get_split_dict()
    for k, v in split_dict.items():
        with open(APP_ROOT + "/../../Data/wn_summary_all/" + k + ".txt", 'w') as fo:
            fo.write(str(v) + "\n")

    class_average_vector = self.wiki_vector_summary.get_wiki_average_vector()
    for k, v in class_average_vector.items():
        with open(APP_ROOT + "/../../Data/wn_summary_all_class_average/" + k + ".txt_vector.txt", 'w') as fo:
            fo.write(str(v) + "\n")
def test_make_dict(self):
    """Check the two dictionaries SplitSynonymClass builds from the input file.

    Reads ``self.input_module`` as tab-separated data, builds the
    dictionaries, then verifies one known entry and the total size of both
    the "all" dictionary and the "split" dictionary. Finally prints one
    entry of the split dictionary.
    """
    loader = self.input_module
    loader.input_special_format_file("\t")
    rows = loader.get_file_data()

    self.split_synonym_class = SplitSynonymClass(rows)
    synonyms = self.split_synonym_class
    synonyms.make_dict()

    # "All" dictionary: spot-check one key, then the entry count.
    word_lookup = synonyms.get_all_dict()
    self.assertEqual(word_lookup['木っ葉'], "00377169-n")
    self.assertEqual(len(synonyms.get_all_dict()), 146517)

    # "Split" dictionary: spot-check one key, then the entry count.
    grouped_words = synonyms.get_split_dict()
    self.assertEqual(
        grouped_words['02927303-a'],
        ['アメリカ大陸の', '北アメリカの', '南アメリカの', '南北アメリカ原産の'],
    )
    self.assertEqual(len(synonyms.get_split_dict()), 75771)

    print(grouped_words["00377169-n"])
class Test_SplitSynonymClass(unittest.TestCase):
    """Tests for SplitSynonymClass using the WordNet tab file."""

    def setUp(self):
        """Create ``self.input_module``, an InputFile for the WordNet tab file."""
        self.input_module = InputFile(APP_ROOT + '/../../Data/wnjpn-all.tab')

    def test_make_dict(self):
        """Build both dictionaries and verify a known entry and size of each.

        The input file is read as tab-separated data. After the assertions,
        one entry of the split dictionary is printed.
        """
        source = self.input_module
        source.input_special_format_file("\t")
        parsed_rows = source.get_file_data()

        self.split_synonym_class = SplitSynonymClass(parsed_rows)
        builder = self.split_synonym_class
        builder.make_dict()

        # Checks on the "all" dictionary.
        everything = builder.get_all_dict()
        self.assertEqual(everything['木っ葉'], "00377169-n")
        self.assertEqual(len(builder.get_all_dict()), 146517)

        # Checks on the "split" dictionary.
        by_id = builder.get_split_dict()
        self.assertEqual(
            by_id['02927303-a'],
            ['アメリカ大陸の', '北アメリカの', '南アメリカの', '南北アメリカ原産の'],
        )
        self.assertEqual(len(builder.get_split_dict()), 75771)

        print(by_id["00377169-n"])
def test_summary_class(self):
    """Run the summary pipeline and write each result entry to its own file.

    Steps:
        1. Load the wiki vectors through ``self.input_module``.
        2. Load the file named by ``self.word_net_file_name`` as
           tab-separated data and build the "all" and "split" dictionaries
           with ``SplitSynonymClass``.
        3. Pass both dictionaries and the vectors to
           ``WikiVectorSummaryCython`` and call ``get_similler_word()``.
        4. Write every value of ``get_split_dict()`` and of
           ``get_wiki_average_vector()`` to one file per key. The output
           directories must already exist.

    The test makes no assertions; it fails only if one of the steps raises.
    """
    self.input_module.input_fast_large_file()
    wiki_vector = self.input_module.get_vector()

    # Re-point the input module at the WordNet table.
    self.input_module = InputFile(self.word_net_file_name)
    self.input_module.input_special_format_file("\t")
    test_data = self.input_module.get_file_data()

    self.split_synonym_class = SplitSynonymClass(test_data)
    self.split_synonym_class.make_dict()
    all_dict = self.split_synonym_class.get_all_dict()
    split_dict = self.split_synonym_class.get_split_dict()

    self.wiki_vector_summary = WikiVectorSummaryCython(
        all_dict, split_dict, wiki_vector)
    self.wiki_vector_summary.get_similler_word()

    def write_values(mapping, path_prefix, suffix):
        """Write ``str(value)`` and a newline to ``path_prefix + key + suffix``."""
        for key, value in mapping.items():
            # Writing through the handle, not via a rebound sys.stdout, means
            # the file is always closed and the runner's stdout is preserved.
            with open(path_prefix + key + suffix, 'w') as out_file:
                out_file.write(str(value) + "\n")

    split_dict = self.wiki_vector_summary.get_split_dict()
    write_values(split_dict, APP_ROOT + "/../../Data/wn_summary_all/", ".txt")

    class_average_vector = self.wiki_vector_summary.get_wiki_average_vector()
    write_values(
        class_average_vector,
        APP_ROOT + "/../../Data/wn_summary_all_class_average/",
        ".txt_vector.txt")