Пример #1
0
            'Usage:', sys.argv[0],
            'in_train_file in_test_file in_test_ans in_user_profile_file in_config out_train_file out_test_file'
        )
        exit()

    # Bind the seven positional command-line arguments to descriptive names:
    # three input data files, the user profile file, the config file, and
    # two output paths.
    train_file = sys.argv[1]
    test_file = sys.argv[2]
    test_ans_file = sys.argv[3]
    user_profile_file = sys.argv[4]
    config_file = sys.argv[5]
    out_train_file = sys.argv[6]
    out_test_file = sys.argv[7]

    # Read the training graph and the configuration from their files.
    train_graph = file_io.read_graph(train_file)
    config = file_io.read_config(config_file)
    # Placeholder only: rebound by the tuple assignment just below.
    user_feature = None

    # Load the user profile features together with their names; the reader
    # is given the parsed config as well.
    # NOTE(review): the helper name suggests one entry per feature column --
    # confirm against file_io.
    (user_feature,
     feature_name) = file_io.read_feature_column_major(user_profile_file,
                                                       config)

    # Preprocess each feature column according to its `type` attribute;
    # columns whose type is neither 'numerical' nor 'categorical' are left
    # untouched. The helpers' return values are ignored, so they presumably
    # modify the column in place -- TODO confirm in cf.
    for column in user_feature:
        if column.type == 'numerical':
            cf.normalize_column(column)
        elif column.type == 'categorical':
            cf.convert_to_dummy_variable(column)

    # Read the test data from the test file.
    test_pair = file_io.read_data(test_file)
Пример #2
0
if __name__ == "__main__":
    # Script entry point: load the training graph, the user profile
    # features and the test data named on the command line, preprocess the
    # features, and prepare the test labels.
    #
    # Exactly seven positional arguments are required (see the usage text
    # below). On a wrong argument count the usage text is written to stderr
    # and the process exits with status 1.
    if len(sys.argv) != 8:
        # sys.exit(<str>) prints the message to stderr and exits with
        # status 1, so shell callers can detect the failure. It also does
        # not rely on the `exit` helper that only the `site` module injects.
        sys.exit(' '.join([
            'Usage:', sys.argv[0],
            'in_train_file in_test_file in_test_ans in_user_profile_file '
            'in_config out_train_file out_test_file',
        ]))

    # The length check above guarantees exactly seven values here, so the
    # unpacking cannot fail.
    (train_file,
     test_file,
     test_ans_file,
     user_profile_file,
     config_file,
     out_train_file,
     out_test_file) = sys.argv[1:]

    # Read the training graph and the configuration.
    train_graph = file_io.read_graph(train_file)
    config = file_io.read_config(config_file)

    # Load the user profile features together with their names.
    # NOTE(review): the helper name suggests one entry per feature column --
    # confirm against file_io.
    user_feature, feature_name = file_io.read_feature_column_major(
        user_profile_file, config)

    # Preprocess each feature column according to its `type` attribute;
    # columns of any other type are left untouched. The helpers' return
    # values are ignored, so they presumably modify the column in place --
    # TODO confirm in cf.
    for column in user_feature:
        if column.type == 'numerical':
            cf.normalize_column(column)
        elif column.type == 'categorical':
            cf.convert_to_dummy_variable(column)

    # Read the test data, rebind the graph to the result of updating it
    # with that data, and build the label mapping from the test data and
    # the answers read from the answer file.
    test_pair = file_io.read_data(test_file)
    train_graph = update_nodes_from_test_data(train_graph, test_pair)
    test_ans = gen_label_mapping(test_pair, file_io.read_ans(test_ans_file))