from classifier import Classifier
import numpy
import pandas as pd

#prepare data
data = numpy.load("data.npz")
train = data['train']
test = data['test']
labels = data['labels']

#create classifier
clf = Classifier()
clf.TreeClassifier()
clf.load_data(training=train, labels=labels, test=test)
results = clf.predict()

df = pd.read_csv("pair&average.csv", sep='\t')


def TF(x):
    if x == 0:
        return False
    else:
        return True


results = [TF(x) for x in results]
TF = pd.Series(results)
df['Need_normalize'] = TF
newdf = df[df['Need_normalize'] == True]