예제 #1
0
# training_set = nltk.classify.apply_features(helper.extract_features, helper.filtered_tweet)
# print helper.positive_value
# print helper.negative_value
# classifier = nltk.NaiveBayesClassifier.train(training_set)
# helper.setFilteredTweet('sentiment.dat')
# training_set = nltk.classify.apply_features(helper.extract_features, helper.filtered_tweet)
# classifier2 = nltk.NaiveBayesClassifier.train(training_set)
# helper.save_model('opinion-naivebayes.mdl', classifier)
classifier = helper.load_model('opinion-naivebayes.mdl')
classifier2 = helper.load_model('sentiment-naivebayes.mdl')
# helper.setFilteredTweet('tweets.dat')
classic = helper.extract_features(tweet.split())
corpus_tag = helper.get_tag_from_corpus()
corpus_text = helper.get_text_from_corpus()
test_tag = []
for text in corpus_text:
    result = classifier.classify(helper.extract_features_opinion(text.split()))
    if result == '1':
        result = classifier2.classify(helper.extract_features(text.split()))
    test_tag.append(result)
corpus_tag.reverse()
print corpus_tag
test_tag.reverse()
print test_tag
# print corpus_tag
# print test_tag
cm = nltk.ConfusionMatrix(corpus_tag, test_tag)
print cm.pp(sort_by_count=True, show_percents=True, truncate=9)
print classic
print classifier.classify(classic)