Python Featuresets Examples

Programming Language: Python

Namespace/Package Name: lib.featuresets

Class/Type: Featuresets

Examples at hotexamples.com: 4

Python Featuresets - 4 examples found. These are the top rated real world Python examples of lib.featuresets.Featuresets extracted from open source projects. You can rate examples to help us improve the quality of examples.

Frequently Used Methods

Show Hide

get(2)

Example #1

Show file

File: runner.py Project: Jewelryland/college-machine_learning

    def __init__(self, verbose=True):
        """Load the word list and reviews, then build train/test feature sets.

        The feature sets returned by ``Featuresets.get`` are split in order:
        the first three quarters become ``self.train_set`` and the remainder
        becomes ``self.test_set``.

        Args:
            verbose: Stored on the instance as ``self.verbose``.
        """
        self.verbose = verbose

        self.log("Loading data...")
        self.words = Data.load_words("most_informative")
        reviews = Data.load_reviews()

        self.log("Feature extraction...")
        data_set = Featuresets.get(reviews, self.words)

        # Floor division keeps the split index an int. With true division
        # (Python 3) ``3 * len(data_set) / 4`` is a float and slicing with it
        # raises TypeError; ``//`` gives the same value under Python 2 as well.
        split_index = 3 * len(data_set) // 4
        self.train_set = data_set[:split_index]
        self.test_set = data_set[split_index:]

Example #2

Show file

    def __init__(self, verbose=True):
        """Prepare the data needed to run classifiers.

        Loads the "most_informative" word list and the reviews through
        ``Data``, converts them to feature sets with ``Featuresets.get``, and
        keeps a 3/4 training slice and a 1/4 test slice on the instance.

        Args:
            verbose: Stored on the instance as ``self.verbose``.
        """
        self.verbose = verbose

        self.log("Loading data...")
        self.words = Data.load_words("most_informative")
        reviews = Data.load_reviews()

        self.log("Feature extraction...")
        data_set = Featuresets.get(reviews, self.words)

        # Slice indices must be integers: ``/`` yields a float on Python 3 and
        # makes the slice raise TypeError, so use floor division instead.
        cutoff = (3 * len(data_set)) // 4
        self.train_set = data_set[:cutoff]
        self.test_set = data_set[cutoff:]

Example #3

Show file

    def run(self, classifier, name=None):
        """Cross-validate, train and test ``classifier``, logging the results.

        Args:
            classifier: Object providing ``cross_validate(folds, data)`` and
                ``train_and_test(train, test)``; the latter must return an
                object with ``accuracy()``, ``precision()``, ``recall()`` and
                ``f1_score()`` methods.
            name: Optional label logged as a banner. Any value other than
                "Naive Bayes" (including ``None``) also triggers the extra
                parameter-selection cross-validation on the training set.

        Returns:
            A ``(accuracy, testAccuracy)`` tuple: the cross-validation accuracy
            over train + test data, and the accuracy reported by the confusion
            matrix from ``train_and_test``.
        """
        banner = "============================"
        if name:
            for line in ("", banner, name, banner):
                self.log(line)

        if name != "Naive Bayes":
            self.log("Cross validating for parameters selection...")
            tuning_accuracy = classifier.cross_validate(5, self.train_set)
            self.log("%.2f (accuracy)" % tuning_accuracy)

        self.log("Cross validating for method evaluation...")
        full_data = self.train_set + self.test_set
        cv_accuracy = classifier.cross_validate(5, full_data)
        self.log("%.4f (accuracy)" % cv_accuracy)

        self.log("Training and testing...")
        matrix = classifier.train_and_test(self.train_set, self.test_set)
        held_out_accuracy = matrix.accuracy()

        samples = [
            ("A wickedly entertaining, sometimes thrilling adventure.",
             "positive"),
            ("Providing a riot of action, big and visually opulent but oddly lumbering and dull.",
             "negative"),
        ]
        # NOTE(review): the classifier is not called in this loop; the value
        # logged is the polarity returned by Featuresets.get for the sample.
        for sample in samples:
            _features, polarity = Featuresets.get([sample], self.words)[0]
            self.log("Classification: \"%s\" => %s" % (sample[0], polarity))

        # Summary metrics, logged in a fixed order.
        self.log("Accuracy: %g" % matrix.accuracy())
        self.log("Precision: %g" % matrix.precision())
        self.log("Recall:    %g" % matrix.recall())
        self.log("F1 score:  %g" % matrix.f1_score())

        return cv_accuracy, held_out_accuracy

Example #4

Show file

File: runner.py Project: Jewelryland/college-machine_learning

    def run(self, classifier, name = None):
        """Evaluate ``classifier`` and log its metrics.

        Steps, in order: optional banner, optional parameter-selection
        cross-validation on the training set (skipped only when ``name`` is
        "Naive Bayes"), cross-validation on train + test data, a single
        train/test run, two example reviews, and the confusion-matrix metrics.

        Args:
            classifier: Object exposing ``cross_validate(folds, data)`` and
                ``train_and_test(train, test)``.
            name: Optional display name for the banner.

        Returns:
            Tuple of (cross-validation accuracy on train + test data,
            accuracy from the train/test confusion matrix).
        """
        if name:
            separator = "============================"
            self.log("")
            self.log(separator)
            self.log(name)
            self.log(separator)

        skip_parameter_selection = (name == "Naive Bayes")
        if not skip_parameter_selection:
            self.log("Cross validating for parameters selection...")
            selection_score = classifier.cross_validate(5, self.train_set)
            self.log("%.2f (accuracy)" % selection_score)

        self.log("Cross validating for method evaluation...")
        evaluation_score = classifier.cross_validate(
            5, self.train_set + self.test_set
        )
        self.log("%.4f (accuracy)" % evaluation_score)

        self.log("Training and testing...")
        results = classifier.train_and_test(self.train_set, self.test_set)
        test_score = results.accuracy()

        positive_example = (
            "A wickedly entertaining, sometimes thrilling adventure.",
            "positive",
        )
        negative_example = (
            "Providing a riot of action, big and visually opulent but oddly lumbering and dull.",
            "negative",
        )
        # NOTE(review): the polarity logged here comes straight from
        # Featuresets.get; the classifier itself is not called in this loop.
        for example in [positive_example, negative_example]:
            featureset = Featuresets.get([example], self.words)[0]
            (_document, polarity) = featureset
            self.log("Classification: \"%s\" => %s" % (example[0], polarity))

        self.log("Accuracy: %g" % results.accuracy())
        self.log("Precision: %g" % results.precision())
        self.log("Recall:    %g" % results.recall())
        self.log("F1 score:  %g" % results.f1_score())

        return evaluation_score, test_score