def test_word_and_count_to_dict(self):
    """Check main.word_count(SAMPLE) against independently tallied counts.

    The expected mapping is built here from the tokens returned by
    main.file_to_list(SAMPLE), so the assertion no longer compares
    word_count's output with a second call to itself.
    """
    # NOTE(review): assumes word_count returns a {word: occurrences} mapping
    # over exactly the tokens file_to_list yields -- confirm against main.
    word_dict = {}
    for word in main.file_to_list(SAMPLE):
        word_dict[word] = word_dict.get(word, 0) + 1
    self.assertEqual(main.word_count(SAMPLE), word_dict)
def test_file_to_list(self):
    """Compare main.file_to_list(SAMPLE) with lower-cased tokens of self.testdata.

    The expected list is produced by splitting self.testdata on the
    pattern \\w+ with RegexpTokenizer and lower-casing every token.
    """
    # NOTE(review): presumably self.testdata holds the text of SAMPLE -- confirm in setUp.
    expected = []
    for token in RegexpTokenizer(r'\w+').tokenize(self.testdata):
        expected.append(token.lower())
    actual = main.file_to_list(SAMPLE)
    self.assertEqual(actual, expected)