示例#1
0
文件: wine.py 项目: ToxaZ/coursera_ml
def main():
    wine_file = 'data/wine.data'
    url = 'https://archive.ics.uci.edu/ml/machine-learning-databases/wine/wine.data'
    try:
        data = pd.read_csv(wine_file, header=None)
    except IOError:
        print ('No {0} file found, downloading it from {1}'
               .format(wine_file, url))
        wine_reques = requests.get(url).content
        data = pd.read_csv(io.StringIO(wine_reques.decode('utf-8')),
                           header=None)

    X = data.iloc[:, 1:].values
    X_scaled = scale(X)
    y = data.iloc[:, 0].values
    kf = KFold(len(data.index), n_folds=5, shuffle=True, random_state=42)
    neighbors_range = [x for x in range(1, 51)]

    write_submission(
        classifier_choice_cv(
            X, y, KNeighborsClassifier, 'n_neighbors', neighbors_range, kf)[0],
        '31')
    write_submission(
        classifier_choice_cv(
            X, y, KNeighborsClassifier, 'n_neighbors', neighbors_range, kf)[1],
        '32')
    write_submission(
        classifier_choice_cv(
            X_scaled, y, KNeighborsClassifier, 'n_neighbors', neighbors_range, kf)[0],
        '33')
    write_submission(
        classifier_choice_cv(
            X_scaled, y, KNeighborsClassifier, 'n_neighbors', neighbors_range, kf)[1],
        '34')
示例#2
0
def main():
    boston = load_boston()
    X = scale(boston.data)
    y = boston.target
    classifier = KNeighborsRegressor(n_neighbors=5, weights='distance')
    kf = KFold(len(X), n_folds=5, shuffle=True, random_state=42)
    neighbors_range = np.linspace(1.0, 10.0, num=200)

    write_submission(
        int(classifier_choice_cv(
            X, y, classifier, 'p', neighbors_range, kf,
            scoring='mean_squared_error')[0]),
        '41')