Пример #1
0
        gammas.append(gamma)
        kernels.append(chi2_kernel(X, X, gamma=1.0 / gamma))
    return kernels, gammas


if __name__ == "__main__":
    total = time.time()
    params = {
        "n_estimators": [10, 50, 100, 200, 400, 750, 800, 1000, 2000],
        "base_estimator__max_depth": [1, 2, 3, 5],
        "base_estimator__random_state": [0],
        "random_state": [0]
    }
    #    params = {"C": [0.00001, 0.0001, 0.001, 0.01, 0.1, 1, 10, 100, 1000, 10000, 100000]}

    datamanager = CaltechManager()
    categories = [
        c for c in os.listdir(datamanager.PATHS["CATEGORIES_DIR"])
        if c != datamanager.BACKGROUND and os.path.splitext(c)[1] != ".py"
    ]

    #kernels, gammas = build_train_kernels(categories, datamanager)
    #print "Finished building kernels"

    #grids = (GridSearch(SVC(kernel="precomputed"), c) for c in categories)
    # grids = (GridSearch(RandomForestClassifier(), c) for c in categories)

    grids = [
        GridSearch(AdaBoostClassifier(), datamanager, c) for c in categories
    ]
Пример #2
0
 def setUp(self):
     self.datamanager = CaltechManager()
     self.datamanager.change_base_path(os.path.join(BASE_PATH, "testdata"))
Пример #3
0
import sys
from sklearn.ensemble import RandomForestClassifier, AdaBoostClassifier
from sklearn.svm import LinearSVC, SVC
from vcd import VisualConceptDetection
import os
import time
from util import svm
from datamanagers.CaltechManager import CaltechManager
import numpy as np
import pylab as pl

from runGridSearch import GridSearch

if __name__ == "__main__":
    category = "airplanes"
    total = time.time()

    clf = RandomForestClassifier(n_estimators=2000)

    # clf = AdaBoostClassifier(n_estimators = 2000)
    # clf.base_estimator.max_depth = 4

    # clf = LinearSVC(C=100)
    # clf = SVC(C=10)

    dm = CaltechManager()
    vcd = VisualConceptDetection(classifier=clf, datamanager=dm)

    vcd.run(category)
    print "Total execution time: %f minutes" % ((time.time() - total) / 60.0)