def setUp(self): self.model = Model(20) self.vocabulary = Vocabulary() self.vocabulary.load('../testdata/vocabulary.dat') self.sparselda_train_gibbs_sampler = \ SparseLDATrainGibbsSampler(self.model, self.vocabulary)
class SparseLDATrainGibbsSamplerTest(unittest.TestCase): def setUp(self): self.model = Model(20) self.vocabulary = Vocabulary() self.vocabulary.load('../testdata/vocabulary.dat') self.sparselda_train_gibbs_sampler = \ SparseLDATrainGibbsSampler(self.model, self.vocabulary) def test_load_corpus(self): self.sparselda_train_gibbs_sampler.load_corpus('../testdata/corpus') self.assertEqual(4, len(self.sparselda_train_gibbs_sampler.documents)) def test_gibbs_sampling(self): self.sparselda_train_gibbs_sampler.load_corpus('../testdata/corpus') rand = random.Random() for i in xrange(100): self.sparselda_train_gibbs_sampler.gibbs_sampling(rand) if (i + 1) % 10 == 0: self.sparselda_train_gibbs_sampler.save_checkpoint( '../testdata/checkpoint', i + 1) self.sparselda_train_gibbs_sampler.save_model( '../testdata/train_model', 100) def test_load_checkpoint(self): cur_iteration = self.sparselda_train_gibbs_sampler.load_checkpoint( '../testdata/checkpoint') rand = random.Random() for i in xrange(cur_iteration, 200): self.sparselda_train_gibbs_sampler.gibbs_sampling(rand) if (i + 1) % 10 == 0: self.sparselda_train_gibbs_sampler.save_checkpoint( '../testdata/checkpoint', i + 1)