Python essays_by_set 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: competition_io

메소드/함수: essays_by_set

hotexamples.com에서의 예제들: 4

Python essays_by_set - 4개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한, Python competition_io.essays_by_set의 평가가 높은 실제 사용 예제들입니다. 예제를 평가해 주시면 예제의 품질을 높이는 데 도움이 됩니다.

예제 #1

파일 보기

파일: length_benchmark.py 프로젝트: xiaolei89tw/ASAP-SAS

def main():
    """Fit a length-based model per essay set and write a submission file.

    For each essay set from ``cio.get_essay_sets()``, a 50-tree
    ``RandomForestRegressor`` is fitted on the features computed by
    ``get_character_count`` and ``get_word_count`` against ``Score1``.
    The model then scores the essays of the same set read from
    ``../Data/public_leaderboard_rel_2.tsv``; the rounded predictions for
    all sets are written to ``../Submissions/length_benchmark.csv``.
    """
    feature_functions = [get_character_count, get_word_count]
    predictions = {}

    for essay_set in cio.get_essay_sets():
        print("Making Predictions for Essay Set %s" % essay_set)
        # NOTE(review): with no path argument this presumably reads the
        # default training file -- confirm against competition_io.
        train = list(cio.essays_by_set(essay_set))
        features = extract_features([x["EssayText"] for x in train],
                                    feature_functions)
        rf = RandomForestRegressor(n_estimators=50)
        rf.fit(features, [float(x["Score1"]) for x in train])

        test = list(
            cio.essays_by_set(essay_set,
                              "../Data/public_leaderboard_rel_2.tsv"))
        features = extract_features([x["EssayText"] for x in test],
                                    feature_functions)
        predicted_scores = rf.predict(features)
        for essay, pred_score in zip(test, predicted_scores):
            predictions[essay["Id"]] = round(pred_score)

    output_file = "../Submissions/length_benchmark.csv"
    print("Writing submission to %s" % output_file)
    # The context manager closes the file even if a write or the "%d"
    # formatting below raises, which the manual open()/close() pair did not.
    with open(output_file, "w") as f:
        f.write("id,essay_score\n")
        # NOTE(review): "%d" assumes the essay ids are numeric -- confirm.
        for key in sorted(predictions):
            f.write("%d,%d\n" % (key, predictions[key]))

예제 #2

파일 보기

def main():
    """Fit a bag-of-words model per essay set and write a submission file.

    For each essay set from ``cio.get_essay_sets()``, a bag is trained with
    ``features.train_bag`` on the concatenated training essay texts (second
    argument 500), each essay is converted with
    ``features.bag_representation``, and a 50-tree
    ``RandomForestRegressor`` is fitted against ``Score1``. Essays of the
    same set from ``../Data/public_leaderboard_rel_2.tsv`` are then scored,
    and the rounded predictions for all sets are written to
    ``../Submissions/bag_of_words_benchmark.csv``.
    """
    predictions = {}

    for essay_set in cio.get_essay_sets():
        print("Making Predictions for Essay Set %s" % essay_set)
        # NOTE(review): with no path argument this presumably reads the
        # default training file -- confirm against competition_io.
        train = list(cio.essays_by_set(essay_set))
        bag = features.train_bag(" ".join(x["EssayText"] for x in train), 500)
        fea = [features.bag_representation(bag, x["EssayText"]) for x in train]
        rf = RandomForestRegressor(n_estimators=50)
        rf.fit(fea, [float(x["Score1"]) for x in train])

        test = list(
            cio.essays_by_set(essay_set,
                              "../Data/public_leaderboard_rel_2.tsv"))
        # Reuse the bag trained on the training essays for the test essays.
        fea = [features.bag_representation(bag, x["EssayText"]) for x in test]
        predicted_scores = rf.predict(fea)
        for essay, pred_score in zip(test, predicted_scores):
            predictions[essay["Id"]] = round(pred_score)

    output_file = "../Submissions/bag_of_words_benchmark.csv"
    print("Writing submission to %s" % output_file)
    # Use a context manager so the handle is released even when a write or
    # the "%d" formatting fails part-way through.
    with open(output_file, "w") as f:
        f.write("id,essay_score\n")
        # NOTE(review): "%d" assumes the essay ids are numeric -- confirm.
        for key in sorted(predictions):
            f.write("%d,%d\n" % (key, predictions[key]))

예제 #3

파일 보기

파일: length_benchmark.py 프로젝트: benhamner/ASAP-SAS

def main():
    """Run the length benchmark and write its leaderboard submission.

    Per essay set (``cio.get_essay_sets()``): extract character-count and
    word-count features from the training essays, fit a
    ``RandomForestRegressor`` with 50 estimators on ``Score1``, and predict
    scores for the essays of that set found in
    ``../Data/public_leaderboard_rel_2.tsv``. Rounded predictions keyed by
    essay ``Id`` are written to ``../Submissions/length_benchmark.csv``.
    """
    feature_functions = [get_character_count, get_word_count]
    predictions = {}

    for essay_set in cio.get_essay_sets():
        print("Making Predictions for Essay Set %s" % essay_set)
        # NOTE(review): the one-argument call presumably loads the default
        # training data -- confirm against competition_io.
        train = list(cio.essays_by_set(essay_set))
        train_texts = [x["EssayText"] for x in train]
        train_scores = [float(x["Score1"]) for x in train]
        features = extract_features(train_texts, feature_functions)
        rf = RandomForestRegressor(n_estimators=50)
        rf.fit(features, train_scores)

        test = list(cio.essays_by_set(essay_set, "../Data/public_leaderboard_rel_2.tsv"))
        features = extract_features([x["EssayText"] for x in test], feature_functions)
        predicted_scores = rf.predict(features)
        for essay, pred_score in zip(test, predicted_scores):
            predictions[essay["Id"]] = round(pred_score)

    output_file = "../Submissions/length_benchmark.csv"
    print("Writing submission to %s" % output_file)
    # `with` guarantees the file is closed if writing raises; the original
    # explicit close() was skipped on any exception.
    with open(output_file, "w") as f:
        f.write("id,essay_score\n")
        # NOTE(review): "%d" assumes the essay ids are numeric -- confirm.
        for key in sorted(predictions):
            f.write("%d,%d\n" % (key, predictions[key]))

예제 #4

파일 보기

파일: bag_of_words_benchmark.py 프로젝트: benhamner/ASAP-SAS

def main():
    """Run the bag-of-words benchmark and write its leaderboard submission.

    Per essay set (``cio.get_essay_sets()``): train a bag via
    ``features.train_bag`` on the joined training texts (second argument
    500), represent every essay with ``features.bag_representation``, fit a
    ``RandomForestRegressor`` with 50 estimators on ``Score1``, and predict
    scores for the essays of that set found in
    ``../Data/public_leaderboard_rel_2.tsv``. Rounded predictions keyed by
    essay ``Id`` are written to
    ``../Submissions/bag_of_words_benchmark.csv``.
    """
    predictions = {}

    for essay_set in cio.get_essay_sets():
        print("Making Predictions for Essay Set %s" % essay_set)
        # NOTE(review): the one-argument call presumably loads the default
        # training data -- confirm against competition_io.
        train = list(cio.essays_by_set(essay_set))
        bag = features.train_bag(" ".join(x["EssayText"] for x in train), 500)
        fea = [features.bag_representation(bag, x["EssayText"]) for x in train]
        train_scores = [float(x["Score1"]) for x in train]
        rf = RandomForestRegressor(n_estimators=50)
        rf.fit(fea, train_scores)

        test = list(cio.essays_by_set(essay_set, "../Data/public_leaderboard_rel_2.tsv"))
        # The test essays are encoded with the bag built from training text.
        fea = [features.bag_representation(bag, x["EssayText"]) for x in test]
        predicted_scores = rf.predict(fea)
        for essay, pred_score in zip(test, predicted_scores):
            predictions[essay["Id"]] = round(pred_score)

    output_file = "../Submissions/bag_of_words_benchmark.csv"
    print("Writing submission to %s" % output_file)
    # `with` guarantees the file is closed if writing raises; the original
    # explicit close() was skipped on any exception.
    with open(output_file, "w") as f:
        f.write("id,essay_score\n")
        # NOTE(review): "%d" assumes the essay ids are numeric -- confirm.
        for key in sorted(predictions):
            f.write("%d,%d\n" % (key, predictions[key]))