예제 #1
0
    def setUp(self):
        """Prepare a trained classifier for the test methods.

        Steps, in order:
          1. create a ``Bayes.NaiveBayes`` instance and keep it on ``self``;
          2. fetch posts and their class labels from ``self.loadDataSet()``;
          3. build the vocabulary with ``composeList`` and store it as
             ``self.vocabList``;
          4. turn each post into a vector via ``binarize`` and collect the
             vectors into a matrix (one row per post);
          5. call ``train`` on the matrix and labels, storing its three
             results as ``self.p0``, ``self.p1`` and ``self.pAbusive``.

        NOTE(review): ``p0``/``p1`` look like per-class word probability
        vectors and ``pAbusive`` like the prior of the abusive class, but
        that depends on ``Bayes.NaiveBayes.train`` -- confirm there.
        """
        self.naiveBayes = Bayes.NaiveBayes()
        documents, labels = self.loadDataSet()

        classifier = self.naiveBayes
        self.vocabList = classifier.composeList(documents)
        logging.log(logging.INFO, "Vocabulary List: " + str(self.vocabList))

        # One vector per post, in the same order as the labels.
        rows = []
        for document in documents:
            row = classifier.binarize(self.vocabList, document)
            rows.append(row)
            logging.log(logging.DEBUG, "Binaried vector: " + str(row))

        trained = classifier.train(rows, labels)
        self.p0, self.p1, self.pAbusive = trained

        logging.log(logging.INFO, "P0: \n" + str(self.p0))
        logging.log(logging.INFO, "P1: \n" + str(self.p1))