def main():
    dirList = list()

    temp = listdir("./data/Asthma/2010/")
    dirList.append(temp)
    temp = listdir("./data/Asthma/2011/")
    dirList.append(temp)
    temp = listdir("./data/Asthma/2012/")
    dirList.append(temp)
    temp = listdir("./data/Asthma/2013/")
    dirList.append(temp)
    temp = listdir("./data/Asthma/2014/")
    dirList.append(temp)

    pre = PreProcessor()
    clf = SVM(kernel=GaussianKernel(5.0), C=1.0)

    X_train, y_train = pre.loadTrainingSet(
        "training_data/Asthma_Sample_Tokenized.csv")
    clf.fit(X_train, y_train)
예제 #2
0
# Author Alvaro Esperanca

from SVM import SVM
from PreProcessor import PreProcessor
from Validator import Validator
from GaussianKernel import GaussianKernel
import numpy as np

if __name__ == "__main__":
    pre = PreProcessor()
    val = Validator()
    clf = SVM(kernel=GaussianKernel(5.0), C=1.0)

    X_train, y_train = pre.loadTrainingSet(
        "training_data/Cancer_Sample_Tokenized.csv")
    X_test = pre.loadTestSet("test_data/Tokenized_Cancer_test.csv")

    clf.fit(X_train, y_train)
    predictions = clf.predict(X_test)

    validFile = open("validation_set/validation_set_labels.txt", "r")

    temp = validFile.readlines()
    validationLabels = [float(num) for num in temp]

    val.validate(validationLabels, predictions)

    val.report()

    # predFile = open("results/gaussian_kernel_s_5000_c_5.txt", "w")
    # statFile = open("results/gaussian_kernel_s_5000_c_5_stats.txt", "w")