def predict(self, text):
    """Return prediction label(s) for the given input text.

    Args:
        text: a single document (str), a list of documents, or a dict
            mapping keys to documents.

    Returns:
        A single label for a str input, a list of labels (same order) for
        a list input, or an OrderedDict mapping each key to its label for
        a dict input.

    Raises:
        TypeError: if *text* is not a str, list, or dict.
    """
    if isinstance(text, str):
        # Single document: classify directly.
        return self.classifier.classify(self.extract_features(text))
    if isinstance(text, list):
        # Batch of documents: labels returned in input order.
        return [self.classifier.classify(self.extract_features(email))
                for email in text]
    if isinstance(text, dict):
        # Keyed batch: keep the key -> label association (insertion order
        # preserved by OrderedDict).
        return collections.OrderedDict(
            (key, self.classifier.classify(self.extract_features(email)))
            for key, email in text.items())
    # The original fell through here and hit an unbound local (NameError);
    # fail with a clear, conventional error instead.
    raise TypeError(
        "text must be a str, list, or dict, got %s" % type(text).__name__)
# NOTE(review): this span begins mid-function — the enclosing `def` (it ends
# with `return feature_probdist` below) lies outside the visible region.
# Python 2 code using the pre-NLTK-3 `FreqDist.inc` API.
feature_freqdist = defaultdict(FreqDist)
feature_values = defaultdict(set)
# presumably half the samples carry each label — TODO confirm the split
num_samples = len(train_samples) / 2
for token, counts in labeled_features.items():
    for label in ['neg','pos']:
        # Record occurrences of the feature (True) and, as `None`, the
        # samples of this label in which the token did NOT appear.
        feature_freqdist[label, token].inc(True, count=counts[label])
        feature_freqdist[label, token].inc(None, num_samples - counts[label])
        feature_values[token].add(None)
        feature_values[token].add(True)
# Debug dump of every (label, token) frequency distribution (Python 2 print).
for item in feature_freqdist.items():
    print item[0],item[1]
# Convert each frequency distribution into a smoothed (Expected Likelihood
# Estimate) probability distribution keyed by (label, feature name).
feature_probdist = {}
for ((label, fname), freqdist) in feature_freqdist.items():
    probdist = ELEProbDist(freqdist, bins=len(feature_values[fname]))
    feature_probdist[label,fname] = probdist
return feature_probdist

# ---- script driver (top level, after the function above) ----
labeled_features = get_labeled_features(train_samples)
label_probdist = get_label_probdist(labeled_features)
feature_probdist = get_feature_probdist(labeled_features)
classifier = NaiveBayesClassifier(label_probdist, feature_probdist)
for sample in test_samples:
    # Print each test sample next to its predicted label (Python 2 print).
    print "%s | %s" % (sample, classifier.classify(gen_bow(sample)))
classifier.show_most_informative_features()
# NOTE(review): this span starts mid-call — the opening of the join
# (presumably `model_path = os.path.join(`) and the enclosing method header
# lie outside the visible region; the `def`s below are class methods.
        os.path.split(os.path.realpath(__file__))[0],
        ModelConfigReader.getModelFolder(),
        ModelConfigReader.getModelSavedName(model_name))
        print("model path: " + model_path)
        # NOTE(review): pickle.load is unsafe on untrusted files, and the
        # file handle opened here is never closed — consider `with open(...)`.
        self.classifier = pickle.load(open(model_path, "rb"))

    def _mostInformativeFeatures(self, limit=20):
        # Delegate to the underlying classifier's diagnostic helper;
        # shows up to `limit` most informative features.
        return self.classifier.show_most_informative_features(limit)

    def classify(self, sentence):
        '''
        Classify the sentence as positive or negative.
        It returns the classification together with probability values.
        for eg:
        {'prediction': 'pos', 'pos': 0.582766958567508, 'neg': 0.41723304143249396}
        '''
        # bagOfWords is defined elsewhere in this module — presumably it
        # builds a token-presence feature dict; verify against its definition.
        probResult = self.classifier.prob_classify(bagOfWords(sentence))
        return {
            "prediction": probResult.max(),
            "pos": probResult.prob("pos"),
            "neg": probResult.prob("neg")
        }

# ---------- Testing ----------------------
if __name__ == "__main__":
    classifier = NaiveBayesClassifier()
    sentence = "What a fascinating day. I am sure loving the weather."
    sentence2 = "I don't like this at all. Rich people dominating the value of democracy."
    print(classifier.classify(sentence))
    print(classifier.classify(sentence2))
# NOTE(review): this span begins inside nested loops whose headers are
# outside the visible region (iterating training papers, then their tokens);
# Python 2 print statements throughout.
            labelled_features[word.lower()][label] += features[word]
    # Progress report — presumably once per parsed paper; TODO confirm nesting.
    print "Currently at %d distinct tokens and %d papers" % (
        len(labelled_features), samplecount)

# Build the classifier from the accumulated per-token label counts.
label_probdist = get_label_probdist(labelled_features)
feature_probdist = get_feature_probdist(labelled_features)
classifier = NaiveBayesClassifier(label_probdist, feature_probdist)

# Evaluate: parse each held-out paper into a token-presence feature dict
# and compare the predicted label against the directory-derived gold label.
for samplefile in test_samples:
    features = {}
    p = PaperParser()
    p.parsePaper(samplefile)
    for sentence in p.extractRawSentences():
        tokens = nltk.word_tokenize(sentence)
        for word in tokens:
            # Presence-only features: any occurrence maps to True.
            features[word] = True
    # The parent directory name encodes the actual label — TODO confirm
    # against how `labels` is populated.
    dirname = os.path.basename(os.path.dirname(samplefile))
    label = labels[dirname]
    print "file: %s | actual: %s | predicted: %s" % (
        samplefile, label, classifier.classify(features))
classifier.show_most_informative_features()
import json
import re

from nltk import NaiveBayesClassifier


def clean_tweet(tweet):
    """Strip @mentions, URLs, and non-alphanumeric characters from a tweet.

    Surviving tokens are re-joined with single spaces.
    """
    # Raw string avoids invalid-escape warnings; the alternation removes,
    # in order: @mentions, any char not alphanumeric/space/tab, and URLs.
    return ' '.join(
        re.sub(r"(@[A-Za-z0-9]+)|([^0-9A-Za-z \t])|(\w+:\/\/\S+)",
               " ", tweet).split())


def main():
    """Load labelled tweets, train a classifier, classify a sample phrase."""
    mydata = []
    # `with` closes the file deterministically (the original leaked the
    # handle opened for convertcsv.json).
    with open('convertcsv.json', 'r') as json_data:
        data = json.load(json_data)
    for d in data:
        # hate_speech == 0 -> positive example, anything else -> negative.
        if d.get('hate_speech') == 0:
            mydata.append({"text": clean_tweet(d.get('tweet')), "label": "pos"})
        else:
            mydata.append({"text": clean_tweet(d.get('tweet')), "label": "neg"})
    # NOTE(review): the (train_data, format="json") constructor signature is
    # TextBlob's NaiveBayesClassifier API, not nltk's — as imported from
    # nltk this call would fail; confirm which library was intended.
    cl = NaiveBayesClassifier(mydata, format="json")
    cl.classify("This is an amazing library!")


if __name__ == "__main__":
    main()