Esempio n. 1
0
from preprocessing import Preprocessing
import regressor as reg
import visualizer as vis
#preprocssing
dataset = pd.read_csv('diamonds.csv')

prepro = Preprocessing()
prepro.handleMissing(dataset)

x = dataset.drop(['price','cut','color','clarity'],axis = 1)
y = dataset['price']

x = prepro.scale(x)

encode_col = dataset[['cut','color','clarity']]
encode_col  = prepro.encode(encode_col)

x = np.concatenate((x,encode_col),axis=1)

X_train, X_test, y_train, y_test = train_test_split(x, y,random_state=0,test_size=0.33)

vis.Visualizer().scatterplot(X_test[:,0],y_test.iloc[:])

# Linear Regression
regressor = reg.Regressor(type=reg.LINEAR_REGRESSION)
regressor.fit(X_train, y_train)
print("******************Linear Regression******************")
print(regressor.score(X_test,y_test))
#vis.Visualizer().scatterplot(X_test[:,0],y_test.iloc[:],regressor)
print("*************************************************")