gammas.append(gamma) kernels.append(chi2_kernel(X, X, gamma=1.0 / gamma)) return kernels, gammas if __name__ == "__main__": total = time.time() params = { "n_estimators": [10, 50, 100, 200, 400, 750, 800, 1000, 2000], "base_estimator__max_depth": [1, 2, 3, 5], "base_estimator__random_state": [0], "random_state": [0] } # params = {"C": [0.00001, 0.0001, 0.001, 0.01, 0.1, 1, 10, 100, 1000, 10000, 100000]} datamanager = CaltechManager() categories = [ c for c in os.listdir(datamanager.PATHS["CATEGORIES_DIR"]) if c != datamanager.BACKGROUND and os.path.splitext(c)[1] != ".py" ] #kernels, gammas = build_train_kernels(categories, datamanager) #print "Finished building kernels" #grids = (GridSearch(SVC(kernel="precomputed"), c) for c in categories) # grids = (GridSearch(RandomForestClassifier(), c) for c in categories) grids = [ GridSearch(AdaBoostClassifier(), datamanager, c) for c in categories ]
def setUp(self): self.datamanager = CaltechManager() self.datamanager.change_base_path(os.path.join(BASE_PATH, "testdata"))
import sys from sklearn.ensemble import RandomForestClassifier, AdaBoostClassifier from sklearn.svm import LinearSVC, SVC from vcd import VisualConceptDetection import os import time from util import svm from datamanagers.CaltechManager import CaltechManager import numpy as np import pylab as pl from runGridSearch import GridSearch if __name__ == "__main__": category = "airplanes" total = time.time() clf = RandomForestClassifier(n_estimators=2000) # clf = AdaBoostClassifier(n_estimators = 2000) # clf.base_estimator.max_depth = 4 # clf = LinearSVC(C=100) # clf = SVC(C=10) dm = CaltechManager() vcd = VisualConceptDetection(classifier=clf, datamanager=dm) vcd.run(category) print "Total execution time: %f minutes" % ((time.time() - total) / 60.0)