def setUp(self): model = Model(20) model.load('../testdata/lda_model') vocabulary = Vocabulary() vocabulary.load('../testdata/vocabulary.dat') self.sparselda_gibbs_sampler = \ SparseLDAGibbsSampler(model, vocabulary, 10, 5)
class SparseLDAGibbsSamplerTest(unittest.TestCase): def setUp(self): model = Model(20) model.load('../testdata/lda_model') vocabulary = Vocabulary() vocabulary.load('../testdata/vocabulary.dat') self.sparselda_gibbs_sampler = \ SparseLDAGibbsSampler(model, vocabulary, 10, 5) def test_infer_topics(self): doc_tokens = [] doc_topic_dist = self.sparselda_gibbs_sampler.infer_topics(doc_tokens) self.assertEqual(0, len(doc_topic_dist)) doc_tokens = ['apple', 'ipad'] doc_topic_dist = self.sparselda_gibbs_sampler.infer_topics(doc_tokens) self.assertEqual(3, len(doc_topic_dist)) self.assertTrue(1 in doc_topic_dist) doc_tokens = ['apple', 'ipad', 'apple', 'null', 'nokia', 'macbook'] doc_topic_dist = self.sparselda_gibbs_sampler.infer_topics(doc_tokens) self.assertEqual(4, len(doc_topic_dist)) self.assertTrue(0 in doc_topic_dist) self.assertEqual(0.1, doc_topic_dist[0]) self.assertTrue(2 in doc_topic_dist) self.assertEqual(0.3, doc_topic_dist[2])