def decision_spambase_set():
    """Solution for HW1 prob 1: regression decision tree on Spambase.

    Loads and normalizes the spam data through ``utils``, splits it into
    test and training sets, trains a decision tree on the training set,
    predicts on the test set, and prints the binary error of those
    predictions against the test set's ``'is_spam'`` column.

    Takes no arguments and returns nothing; all results are printed.
    """
    print('Homework 1 problem 1 - Regression Decision tree')
    print('Spambase Dataset')

    spam_data = utils.load_and_normalize_spam_data()
    # NOTE(review): unpack order (test first, then train) is taken to match
    # the helper's name -- confirm against utils.split_test_and_train.
    test, train = utils.split_test_and_train(spam_data)

    # Single-argument print(...) calls behave identically on Python 2 and 3,
    # unlike the bare print statements used previously.
    print(str(len(train)) + " # in training set <--> # in test " + str(len(test)))

    dt = train_decision_tree(train)
    predicted = test_decision_tree(dt, test)

    error = mystats.calculate_binary_error(predicted, test['is_spam'])
    print('Error: ' + str(error))