Example #1
            batch = []
        job.end()

    seek_confirmation()
    #exit()

    for model_name in ["logistic_regression", "multinomial_nb"]:

        storage = ModelStorage(dirpath=f"nlp_v2/models/best/{model_name}")
        tv = storage.load_vectorizer()
        clf = storage.load_model()

        print(f"DESTROY PREDICTIONS TABLE? ({model_name})")
        seek_confirmation()
        bq_service.nlp_v2_destructively_migrate_predictions_table(model_name)
        predictions_table = bq_service.nlp_v2_get_predictions_table(model_name) # API call. cache it here once.

        job.start()

        for chunk_df in read_csv(CSV_FILEPATH, chunksize=BATCH_SIZE): # FYI: this will include the last chunk even if it is not a full batch
            status_ids = chunk_df["status_id"].tolist()
            status_texts = chunk_df["status_text"].tolist()

            preds = clf.predict(tv.transform(status_texts))

            batch = [{"status_id": status_id, "prediction": pred} for status_id, pred in zip(status_ids, preds)]
            bq_service.insert_records_in_batches(predictions_table, batch)

            job.counter += len(chunk_df)
            job.progress_report()
            batch = []
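
The loop above keeps memory bounded by letting pandas stream the CSV in fixed-size chunks and by sending each chunk's predictions to BigQuery as one batched insert. Below is a minimal, self-contained sketch of that chunked-read / batched-write pattern; the file path, column names, and insert_batch() helper are hypothetical stand-ins, not the project's ModelStorage / BigQueryService API.

from pandas import read_csv

CSV_FILEPATH = "example_tweets.csv"  # hypothetical input file
BATCH_SIZE = 25_000  # rows per chunk, and records per insert call


def insert_batch(records):
    """Stand-in for one batched write (e.g. a single BigQuery insert API call)."""
    print(f"inserting {len(records)} records...")


for chunk_df in read_csv(CSV_FILEPATH, chunksize=BATCH_SIZE):
    # read_csv with chunksize yields DataFrames of up to BATCH_SIZE rows,
    # including a final partial chunk if the row count is not a multiple of BATCH_SIZE
    records = chunk_df[["status_id", "status_text"]].to_dict("records")
    insert_batch(records)  # one write per chunk bounds both memory use and API call volume

Because pandas emits the final partial chunk automatically, the script can simply add len(chunk_df) to job.counter each iteration without special-casing the last batch.
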
Example #2
import os

from pandas import read_csv

from app.bq_service import BigQueryService
from app.retweet_graphs_v2.k_days.generator import DateRangeGenerator
from app.job import Job  # assumed project-internal import path
from app import DATA_DIR, seek_confirmation  # assumed project-internal import path

BATCH_SIZE = int(
    os.getenv("BATCH_SIZE", default=25000)
)  # the max number of prediction records to store in BQ at once (with a single insert API call)

if __name__ == "__main__":

    bq_service = BigQueryService()
    job = Job()

    print(f"DESTROY PREDICTIONS TABLE? (BERT)")
    seek_confirmation()
    bq_service.nlp_v2_destructively_migrate_predictions_table("bert")
    predictions_table = bq_service.nlp_v2_get_predictions_table("bert")

    job.start()

    for dr in DateRangeGenerator(start_date="2019-12-20",
                                 k_days=1,
                                 n_periods=58).date_ranges:
        print(dr.start_date)
        csv_filepath = os.path.join(DATA_DIR,
                                    "daily_active_edge_friend_graphs_v5",
                                    dr.start_date,
                                    "tweets_BERT_Impeachment_800KTweets.csv")

        #df = read_csv(csv_filepath, usecols=["status_id", "text", "logit_0", "logit_1", "opinion_tweet"], nrows=100)
        #print(df.head())
        for chunk_df in read_csv(