Esempio n. 1
0
def testTennis(trainFile, testFile, attrFile):
    tennis_train = pd.read_csv(trainFile, sep=" ", header=None)
    tennis_test = pd.read_csv(testFile, sep=" ", header=None)
    tennis_attr = pd.read_csv(attrFile, sep=" ", header=None)
    
    input, output, input_test, output_test = digitalize(tennis_train, tennis_test, tennis_attr,"tennis")
    input = np.concatenate((input, output), axis=1) 
    test_input = np.concatenate((input_test, output_test), axis=1)
    # p, numOfRulesPerHypo, numofattr, numofoutput, r, m, fit_threshold, stopGeneration, strategy, dataType):
    ga = GA(100, 4, 10, 2, 0.3, 0.1, 1, 1, 30, 'fitness-proportional', 'tennis')
    trainAcc, bestHypo = ga.fit(input)
    print ('Training data accuracy is: ' + str(trainAcc[0])) 
    testAcc = ga.predict(bestHypo, test_input)
    print ('Test data accuracy is: ' + str(testAcc[0]))
    ga.printRules(bestHypo)
Esempio n. 2
0
def testIris(trainfile, testfile, attrfile):
    iris_train = pd.read_csv(trainfile, header=None)
    iris_test = pd.read_csv(testfile, header=None)
    iris_attr = pd.read_csv(attrfile, header=None)
    input, output, input_test, output_test = digitalize(iris_train, iris_test, iris_attr,"iris")
    input = input.astype(np.float)
    input = np.concatenate((input, output), axis=1)
    test_input = np.concatenate((input_test, output_test), axis=1)
    # p, numOfRulesPerHypo, numofattr, numofoutput, r, m, numOfChangeBitsPerRule, fit_threshold, stopGeneration, strategy, dataType): tournament fitness-proportional rank
    # ga = GA(100, 6, 28, 3, 0.4, 0.2, 1, 0.8, 100, 'rank', 'iris')
    # (6*2*4+3)*4  *4
    ga = GA(400, 6, 48, 3, 0.3, 0.1, 1, 1, 50, 'tournament', 'iris')
    correct, bestHypo = ga.fit(input)
    print ('correct rate on traning data' + str(correct))
    ga.printRules(bestHypo)
    cor = ga.predict(bestHypo, test_input)