def train_and_save_gnosis_ref_arch_s3(training_data_url, fp_min_support_count,
                                      fp_intent_topic_count_threshold,
                                      fp_num_partition):
    """Train the Ref Arch Gnosis and save the Gnosis model in S3.

    The bucket names and the additional path are obtained from
    ``get_path_names``; the actual work is delegated to
    ``train_and_save_gnosis_ref_arch``.

    :param training_data_url: value handed to ``get_path_names`` to obtain
        the input bucket name, the output bucket name and the additional path.
    :param fp_min_support_count: forwarded unchanged to the trainer.
    :param fp_intent_topic_count_threshold: forwarded unchanged to the trainer.
    :param fp_num_partition: forwarded unchanged to the trainer.
    :return: None
    """
    def _open_store(bucket_name):
        # Every store is opened with the credentials held in ``config``.
        return S3DataStore(src_bucket_name=bucket_name,
                           access_key=config.AWS_S3_ACCESS_KEY_ID,
                           secret_key=config.AWS_S3_SECRET_ACCESS_KEY)

    source_bucket, target_bucket, extra_path = get_path_names(
        training_data_url)

    # Keyword arguments are evaluated left to right, so the input store is
    # still created before the output store.
    train_and_save_gnosis_ref_arch(
        input_data_store=_open_store(source_bucket),
        output_data_store=_open_store(target_bucket),
        additional_path=extra_path,
        fp_min_support_count=fp_min_support_count,
        fp_intent_topic_count_threshold=fp_intent_topic_count_threshold,
        fp_num_partition=fp_num_partition)
示例#2
0
def generate_evaluate_test_s3(training_url, result_id):
    """Generate the test via ``generate_test`` and then run ``test_kronos``.

    :param training_url: value handed to ``get_path_names`` to obtain the
        bucket names and the additional path; also forwarded to
        ``test_kronos``.
    :param result_id: forwarded unchanged to ``test_kronos``.
    """
    source_bucket, _target_bucket, extra_path = get_path_names(training_url)

    s3_credentials = {"access_key": AWS_S3_ACCESS_KEY_ID,
                      "secret_key": AWS_S3_SECRET_ACCESS_KEY}
    reader_store = S3DataStore(src_bucket_name=source_bucket, **s3_credentials)
    # NOTE(review): the output store is opened on the *input* bucket and the
    # output bucket name returned by get_path_names is never used -- confirm
    # that this is intentional.
    writer_store = S3DataStore(src_bucket_name=source_bucket, **s3_credentials)

    generate_test(reader_store, writer_store, extra_path)
    test_kronos(training_url, result_id, reader_store, writer_store,
                extra_path)
示例#3
0
def generate_and_save_package_frequency_dict_s3(training_data_url):
    """Create a frequency generator from S3 input and save its dict to S3.

    A ``FrequencyDictGenerator`` is built from the input store, then asked to
    generate and save the frequency dict into the output store.

    :param training_data_url: value handed to ``get_path_names`` to obtain
        the input bucket name, the output bucket name and the additional path.
    """
    source_bucket, target_bucket, extra_path = get_path_names(
        training_data_url)

    # Both stores are opened up front (input first, then output), before the
    # generator itself is created.
    source_store, target_store = [
        S3DataStore(src_bucket_name=bucket_name,
                    access_key=config.AWS_S3_ACCESS_KEY_ID,
                    secret_key=config.AWS_S3_SECRET_ACCESS_KEY)
        for bucket_name in (source_bucket, target_bucket)
    ]

    generator = FrequencyDictGenerator.create_frequency_generator(
        input_data_store=source_store, additional_path=extra_path)
    generator.generate_and_save_frequency_dict(
        output_data_store=target_store, additional_path=extra_path)
def generate_evaluate_test_s3(training_url, result_id):
    """Generate the test, save it, and then call all relevant checkers.

    :param training_url: value handed to ``get_path_names`` to obtain the
        bucket names and the additional path; also forwarded to
        ``perform_kronos_test``.
    :param result_id: forwarded unchanged to ``perform_kronos_test``.
    """
    def _open_store(bucket_name):
        return S3DataStore(src_bucket_name=bucket_name,
                           access_key=AWS_S3_ACCESS_KEY_ID,
                           secret_key=AWS_S3_SECRET_ACCESS_KEY)

    source_bucket, _target_bucket, extra_path = get_path_names(training_url)

    reader_store = _open_store(source_bucket)
    # NOTE(review): the output store is opened on the *input* bucket and the
    # output bucket name returned by get_path_names is never used -- confirm
    # that this is intentional.
    writer_store = _open_store(source_bucket)

    generate_test(reader_store, writer_store, extra_path)
    perform_kronos_test(training_url, result_id, reader_store, writer_store,
                        extra_path)
示例#5
0
def generate_and_save_gnosis_package_topic_model_s3(training_data_url):
    """Generate and save Gnosis package topic model into S3.

    The work is delegated to ``generate_and_save_gnosis_package_topic_model``
    with an input store, an output store and the additional path.

    :param training_data_url: value handed to ``get_path_names`` to obtain
        the input bucket name, the output bucket name and the additional path.
    """
    source_bucket, target_bucket, extra_path = get_path_names(
        training_data_url)

    s3_credentials = {"access_key": config.AWS_S3_ACCESS_KEY_ID,
                      "secret_key": config.AWS_S3_SECRET_ACCESS_KEY}
    source_store = S3DataStore(src_bucket_name=source_bucket, **s3_credentials)
    target_store = S3DataStore(src_bucket_name=target_bucket, **s3_credentials)

    generate_and_save_gnosis_package_topic_model(
        input_data_store=source_store,
        output_data_store=target_store,
        additional_path=extra_path)
def train_and_save_pruned_tag_list_s3(training_data_url):
    """Return the clean package_topic present in the given S3 training URL.

    :param training_data_url: the location where data is read from and
        written to.
    :return: whatever ``TagListPruner.prune_tag_list`` returns.
    """
    def _open_store(bucket_name):
        return S3DataStore(src_bucket_name=bucket_name,
                           access_key=config.AWS_S3_ACCESS_KEY_ID,
                           secret_key=config.AWS_S3_SECRET_ACCESS_KEY)

    source_bucket, target_bucket, extra_path = get_path_names(
        training_data_url)

    package_topic_source = _open_store(source_bucket)
    package_topic_target = _open_store(target_bucket)

    pruned = TagListPruner.prune_tag_list(package_topic_source,
                                          package_topic_target,
                                          extra_path)
    return pruned
示例#7
0
def generate_and_save_kronos_dependency_s3(training_data_url):
    """Open the S3 stores and delegate to ``generate_and_save_kronos_dependency``.

    Two separate stores are opened on the input bucket (one passed as the
    Gnosis input, one as the package-topic input) and one on the output
    bucket.

    :param training_data_url: value handed to ``get_path_names`` to obtain
        the input bucket name, the output bucket name and the additional path.
    """
    def _open_store(bucket_name):
        return S3DataStore(src_bucket_name=bucket_name,
                           access_key=config.AWS_S3_ACCESS_KEY_ID,
                           secret_key=config.AWS_S3_SECRET_ACCESS_KEY)

    source_bucket, target_bucket, extra_path = get_path_names(
        training_data_url)

    gnosis_store = _open_store(source_bucket)
    package_topic_store = _open_store(source_bucket)
    result_store = _open_store(target_bucket)

    generate_and_save_kronos_dependency(
        input_gnosis_data_store=gnosis_store,
        input_package_topic_data_store=package_topic_store,
        output_data_store=result_store,
        additional_path=extra_path)
示例#8
0
def generate_and_save_cooccurrence_matrices_s3(training_data_url):
    """Open the S3 stores and delegate to ``generate_and_save_cooccurrence_matrices``.

    Two separate stores are opened on the input bucket (one passed as the
    Kronos dependency input, one as the manifest input) and one on the
    output bucket.

    :param training_data_url: value handed to ``get_path_names`` to obtain
        the input bucket name, the output bucket name and the additional path.
    """
    source_bucket, target_bucket, extra_path = get_path_names(
        training_data_url)

    s3_credentials = {"access_key": config.AWS_S3_ACCESS_KEY_ID,
                      "secret_key": config.AWS_S3_SECRET_ACCESS_KEY}
    dependency_store = S3DataStore(src_bucket_name=source_bucket,
                                   **s3_credentials)
    manifest_store = S3DataStore(src_bucket_name=source_bucket,
                                 **s3_credentials)
    result_store = S3DataStore(src_bucket_name=target_bucket,
                               **s3_credentials)

    generate_and_save_cooccurrence_matrices(
        input_kronos_dependency_data_store=dependency_store,
        input_manifest_data_store=manifest_store,
        output_data_store=result_store,
        additional_path=extra_path)
def train_and_save_kronos_list_s3(training_data_url):
    """Train the Kronos and save the results into the AWS S3 storage.

    Two separate stores are opened on the input bucket (one passed as the
    Kronos dependency input, one as the co-occurrence input) and one on the
    output bucket; the work is delegated to ``train_and_save_kronos_list``.

    :param training_data_url: value handed to ``get_path_names`` to obtain
        the input bucket name, the output bucket name and the additional path.
    """
    source_bucket, target_bucket, extra_path = get_path_names(
        training_data_url)

    # Stores are opened in the same order as they are named on the left:
    # dependency input, co-occurrence input, then output.
    dependency_store, cooccurrence_store, result_store = [
        S3DataStore(src_bucket_name=bucket_name,
                    access_key=config.AWS_S3_ACCESS_KEY_ID,
                    secret_key=config.AWS_S3_SECRET_ACCESS_KEY)
        for bucket_name in (source_bucket, source_bucket, target_bucket)
    ]

    train_and_save_kronos_list(
        input_kronos_dependency_data_store=dependency_store,
        input_co_occurrence_data_store=cooccurrence_store,
        output_data_store=result_store,
        additional_path=extra_path)