예제 #1
0
# data4 = pd.read_csv("data/boston.csv")
# data4 = data4.astype({'CHAS':'category'}, copy=False)
# dtg4 = dt.DecisionTreeGenerator(data4)
# dtg4.generate()

# f = open('data/boston.txt', mode='w', encoding='utf-8')
# dtg4.treeRoot.print(file=f)
# f.close()

# =============================================================

# Build a decision tree from the auto-mpg dataset and dump it to a text file.
data5 = pd.read_csv("data/auto-mpg.csv")

# Cast these three columns to the pandas 'category' dtype before handing the
# frame to the generator.
# NOTE(review): presumably DecisionTreeGenerator treats 'category' columns as
# categorical attributes rather than numeric ones -- confirm against dt.
data5 = data5.astype(
    {
        'cylinders': 'category',
        'model year': 'category',
        'origin': 'category',
    },
    copy=False)
dtg5 = dt.DecisionTreeGenerator(data5)
dtg5.generate()

# Optional step, currently disabled.
# dtg5.prune(10)

# Use a context manager so the output file is closed even if print() raises;
# the previous open()/close() pair leaked the handle on error.
with open('data/auto-mpg.txt', mode='w', encoding='utf-8') as f:
    dtg5.treeRoot.print(file=f)

# testData = pd.read_csv("data/auto-mpg-test.csv")
# dtg5.classify(testData)
# testData.to_csv('data/auto-mpg-result.csv', index=False)