Python preprocessDataの例

プログラミング言語: Python

名前空間/パッケージ名: mlhelper

メソッド/関数: preprocessData

hotexamples.comのコード掲載数: 4

Python preprocessData - 4件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたPythonのmlhelper.preprocessDataの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

コード例 #1

ファイルを表示

ファイル: fit-predict-persist.py プロジェクト: muko16/Predict-Rent

    plt.subplot(1, 2, 2)
    plt.barh(pos, feature_importance[sorted_idx], align='center')
    plt.yticks(pos, header[sorted_idx])  # boston.feature_names[sorted_idx])
    plt.xlabel('Relative Importance')
    plt.title('Variable Importance')
    plt.show(block=False)

    return header[sorted_idx], feature_importance[sorted_idx]


csvfile = 'rentList_All_final.csv'
# adding attributes did not make a difference
#csvfile = 'rentList_All_withAllAttr_trimmed.csv'
#csvfile = 'rentList_E_EC_N_final.csv'
data = readCsvIntoPandasDataframe(csvfile)
X, y, X_scaler, y_scaler, header = preprocessData(data)

#print "header type:"
#print type(header).__name__
#print header
#X, y = preprocessDataWithoutScale(data)

joblib.dump(X_scaler, 'pickle/X_scaler.pkl')
joblib.dump(y_scaler, 'pickle/y_scaler.pkl')

estimators = []

# K-Nearest Neighbors
estimators.append({
    "name":
    "KNN",

コード例 #2

ファイルを表示

ファイル: fit-predict-persist-house.py プロジェクト: muko16/Predict-Rent

	plt.subplot(1, 2, 2)
	plt.barh(pos, feature_importance[sorted_idx], align='center')
	plt.yticks(pos, header[sorted_idx]) # boston.feature_names[sorted_idx])
	plt.xlabel('Relative Importance')
	plt.title('Variable Importance')
	plt.show(block=False)

	return header[sorted_idx], feature_importance[sorted_idx]


csvfile = 'HousePriceList_All_Train.csv'
# adding attributes did not make a difference
#csvfile = 'rentList_All_withAllAttr_trimmed.csv' 
#csvfile = 'rentList_E_EC_N_final.csv'
data = readCsvIntoPandasDataframe(csvfile)
X, y, X_scaler, y_scaler, header, imp, vec = preprocessData(data)


#print "header type:"
#print type(header).__name__
#print header
#X, y = preprocessDataWithoutScale(data)

joblib.dump(X_scaler, 'pickle-house/X_scaler.pkl') 
joblib.dump(y_scaler, 'pickle-house/y_scaler.pkl') 
joblib.dump(imp, 'pickle-house/Imputer.pkl') 
joblib.dump(vec, 'pickle-house/Vector.pkl') 

estimators = []

# K-Nearest Neighbors

コード例 #3

ファイルを表示

ファイル: fit-predict-persist-final.py プロジェクト: muko16/Predict-Rent

    plt.subplot(1, 2, 2)
    plt.barh(pos, feature_importance[sorted_idx], align='center')
    plt.yticks(pos, header[sorted_idx])  # boston.feature_names[sorted_idx])
    plt.xlabel('Relative Importance')
    plt.title('Variable Importance')
    plt.show(block=False)

    return header[sorted_idx], feature_importance[sorted_idx]


csvfile = 'rentList_All_final.csv'
# adding attributes did not make a difference
#csvfile = 'rentList_All_withAllAttr_trimmed.csv'
#csvfile = 'rentList_E_EC_N_final.csv'
data = readCsvIntoPandasDataframe(csvfile)
X, y, X_scaler, y_scaler, header, imp, vec = preprocessData(data)

#print "header type:"
#print type(header).__name__
#print header
#X, y = preprocessDataWithoutScale(data)

joblib.dump(X_scaler, 'pickle-final/X_scaler.pkl')
joblib.dump(y_scaler, 'pickle-final/y_scaler.pkl')
joblib.dump(imp, 'pickle-final/Imputer.pkl')
joblib.dump(vec, 'pickle-final/Vector.pkl')

estimators = []

# K-Nearest Neighbors
estimators.append({

コード例 #4

ファイルを表示

ファイル: fit-predict-persist.py プロジェクト: muko16/Predict-Rent

	plt.subplot(1, 2, 2)
	plt.barh(pos, feature_importance[sorted_idx], align='center')
	plt.yticks(pos, header[sorted_idx]) # boston.feature_names[sorted_idx])
	plt.xlabel('Relative Importance')
	plt.title('Variable Importance')
	plt.show(block=False)

	return header[sorted_idx], feature_importance[sorted_idx]


csvfile = 'rentList_All_final.csv'
# adding attributes did not make a difference
#csvfile = 'rentList_All_withAllAttr_trimmed.csv' 
#csvfile = 'rentList_E_EC_N_final.csv'
data = readCsvIntoPandasDataframe(csvfile)
X, y, X_scaler, y_scaler, header = preprocessData(data)

#print "header type:"
#print type(header).__name__
#print header
#X, y = preprocessDataWithoutScale(data)

joblib.dump(X_scaler, 'pickle/X_scaler.pkl') 
joblib.dump(y_scaler, 'pickle/y_scaler.pkl') 


estimators = []

# K-Nearest Neighbors
estimators.append( {"name": "KNN", 
				   "model": neighbors.KNeighborsRegressor(