Ejemplo n.º 1
0
def get_haus_distance():

    def pairwise(iterable):
        "s -> (s0,s1), (s1,s2), (s2, s3), ..."
        a, b = itertools.tee(iterable)
        next(b, None)
        return itertools.izip(a, b)

    doc_id_list = request.form.getlist('doc_list')

    distance = {}
    for x, y in pairwise(doc_id_list + [doc_id_list[0]]):
        distance[data_warehouse.get_doc_title_by_id(x) + ", " + data_warehouse.get_doc_title_by_id(y)] = MHD.\
            get_min_of_avg_hausdorff_distance(
                data_warehouse.get_stylometric_features_by_doc_id(x),
                data_warehouse.get_stylometric_features_by_doc_id(y))

    return jsonify(distance)
Ejemplo n.º 2
0
def get_haus_distance():

    def pairwise(iterable):
        "s -> (s0,s1), (s1,s2), (s2, s3), ..."
        a, b = itertools.tee(iterable)
        next(b, None)
        return itertools.izip(a, b)

    doc_id_list = request.form.getlist('doc_list')

    distance = {}
    for x, y in pairwise(doc_id_list + [doc_id_list[0]]):
        distance[data_warehouse.get_doc_title_by_id(x) + ", " + data_warehouse.get_doc_title_by_id(y)] = MHD.\
            get_min_of_avg_hausdorff_distance(
                data_warehouse.get_stylometric_features_by_doc_id(x),
                data_warehouse.get_stylometric_features_by_doc_id(y))

    return jsonify(distance)
Ejemplo n.º 3
0
def get_csv_of_all_features():
    author_list = []
    feature_list = []

    doc_id_list = request.form.getlist('doc_list')

    for idx in range(0, len(doc_id_list)):
        features = data_warehouse.get_stylometric_features_by_doc_id(doc_id_list[idx])
        feature_list.extend(features)
        author_list.extend([idx for x in range(len(features))])

    string_io = StringIO()
    cw = csv.writer(string_io)
    cw.writerows(data_to_csv.get_output_lists_for_csv_after_3d_pca(author_list, feature_list))

    output = make_response(string_io.getvalue())
    output.headers['Content-type'] = 'text/plaintext'
    return output
Ejemplo n.º 4
0
def get_csv_of_all_features():
    author_list = []
    feature_list = []

    doc_id_list = request.form.getlist('doc_list')

    for idx in range(0, len(doc_id_list)):
        features = data_warehouse.get_stylometric_features_by_doc_id(doc_id_list[idx])
        feature_list.extend(features)
        author_list.extend([idx for x in range(len(features))])

    string_io = StringIO()
    cw = csv.writer(string_io)
    cw.writerows(data_to_csv.get_output_lists_for_csv_after_3d_pca(author_list, feature_list))

    output = make_response(string_io.getvalue())
    output.headers['Content-type'] = 'text/plaintext'
    return output