def make_implicit_graphs(preprocessed_data_folder, simple_undirected_implicit_graph_folder):
    """
    Symmetrize the follow, mention and retweet graphs and write them, alone and combined, as TSV files.

    Inputs:  - preprocessed_data_folder: Folder containing "followedby.tsv", "mentionedby.tsv" and "retweetedby.tsv".
             - simple_undirected_implicit_graph_folder: Folder that receives the seven output files.

    Every input is loaded with read_adjacency_matrix and transposed right away (presumably to turn the
    "...-ed by" relation into its forward direction -- TODO confirm against the preprocessing step).
    An output graph is the sum of each participating view and its transpose, divided by the number of summed terms.

    Files written, in order: follow_graph, mention_graph, retweet_graph, fol_men_graph, men_ret_graph,
    fol_ret_graph, fol_men_ret_graph (all with a ".tsv" extension).
    """
    def load_view(stem):
        # Tab-separated file, read with the "matlab" numbering option, then transposed.
        matrix = read_adjacency_matrix(preprocessed_data_folder + "/" + stem + ".tsv", "\t", "matlab")
        return matrix.transpose()

    def symmetric_mean(views):
        # Accumulate view + view^T strictly left to right, then average over the 2*len(views) terms.
        total = views[0] + views[0].transpose()
        for view in views[1:]:
            total = total + view + view.transpose()
        return total/(2*len(views))

    def export(stem, views):
        # The target path is built before the matrix is computed; the writer gets the same options every time.
        target_path = simple_undirected_implicit_graph_folder + "/" + stem + ".tsv"
        scipy_sparse_to_csv(target_path, symmetric_mean(views), separator="\t", directed=False, numbering="matlab")

    # Read the three views.
    follow = load_view("followedby")
    mention = load_view("mentionedby")
    retweet = load_view("retweetedby")

    # Simple undirected implicit graphs, one per view.
    single_view_jobs = (("follow_graph", (follow,)),
                        ("mention_graph", (mention,)),
                        ("retweet_graph", (retweet,)))
    for stem, views in single_view_jobs:
        export(stem, views)

    gc.collect()

    # Multiview graphs: every pair of views, then all three together.
    multiview_jobs = (("fol_men_graph", (follow, mention)),
                      ("men_ret_graph", (mention, retweet)),
                      ("fol_ret_graph", (follow, retweet)),
                      ("fol_men_ret_graph", (follow, mention, retweet)))
    for stem, views in multiview_jobs:
        export(stem, views)
def read_insight_data(dataset_folder):
    """
    Load the mention/retweet graph and the user label data stored in a dataset folder.

    Input:   - dataset_folder: Folder containing "men_ret_graph.tsv" and "user_label_matrix.tsv".

    Outputs: - adjacency_matrix: Whatever insight_read_data.read_adjacency_matrix returns for the graph file.
             - node_label_matrix, labelled_node_indices, number_of_categories: The three values returned by
               insight_read_data.read_node_label_matrix for the label file, in that order.
    """
    # Both files are tab-separated.
    graph_file = dataset_folder + "/men_ret_graph.tsv"
    adjacency_matrix = insight_read_data.read_adjacency_matrix(file_path=graph_file, separator="\t")

    label_file = dataset_folder + "/user_label_matrix.tsv"
    label_data = insight_read_data.read_node_label_matrix(file_path=label_file, separator="\t")
    node_label_matrix, labelled_node_indices, number_of_categories = label_data

    return (adjacency_matrix,
            node_label_matrix,
            labelled_node_indices,
            number_of_categories)
# Example #3
# 0
def read_insight_data(dataset_folder):
    """
    Read the graph and label files of a dataset folder and return their contents as a 4-tuple.

    Input:   - dataset_folder: Folder expected to hold "men_ret_graph.tsv" and "user_label_matrix.tsv".

    Outputs: - adjacency_matrix: Result of insight_read_data.read_adjacency_matrix on the graph file.
             - node_label_matrix, labelled_node_indices, number_of_categories: Results of
               insight_read_data.read_node_label_matrix on the label file, unpacked in that order.
    """
    tab = "\t"

    # Graph first, labels second.
    adjacency_matrix = insight_read_data.read_adjacency_matrix(file_path=dataset_folder + "/men_ret_graph.tsv",
                                                               separator=tab)
    (node_label_matrix,
     labelled_node_indices,
     number_of_categories) = insight_read_data.read_node_label_matrix(
        file_path=dataset_folder + "/user_label_matrix.tsv",
        separator=tab)

    result = (adjacency_matrix, node_label_matrix, labelled_node_indices, number_of_categories)
    return result