Python printhclust 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: clusters

메소드/함수: printhclust

hotexamples.com에서의 예제들: 5

Python printhclust - 5개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python clusters.printhclust의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 각 예제를 평가하면 예제 품질을 높이는 데 도움이 됩니다.

예제 #1

파일 보기

def main():
    """Load the saved clustering for METRIC, evaluate its pruned nodes, print it.

    Reads ``json/<METRIC>.json``, rebuilds the cluster tree with
    ``clusters.read_json``, prunes it to as many nodes as there are level-1
    entries in the item hierarchy, runs ``evaluate_cluster`` on each pruned
    node, and finally prints the full tree with ``clusters.printhclust``.
    """
    json_path = "json/{}.json".format(METRIC)
    with open(json_path) as handle:
        root = clusters.read_json(json.load(handle))

    item_labels = make_vectors.get_list("data/itemIndex.txt")
    # Only the level-1 set is used below; the level-2 set is unpacked and
    # ignored.
    hierarchy, top_level, _second_level = get_hierarchy(
        "data/itemHierarchy.csv")

    # Prune so that there are len(top_level) nodes, then evaluate which items
    # belong to which of those nodes.
    target_count = len(top_level)
    for pruned in prune(root, target_count):
        evaluate_cluster(pruned, item_labels, hierarchy)

    clusters.printhclust(root, item_labels)

예제 #2

파일 보기

파일: hclusterwords.py 프로젝트: KelvinKim1/clustering_lab

import clusters

# Cluster the columns of the title vectors. The matrix is passed through
# clusters.rotatematrix first and the resulting rows are labelled with
# `words` (presumably a transpose, so each row is one word; confirm against
# clusters.rotatematrix).
docs, words, data = clusters.readfile('titles_vectors.txt')
rdata = clusters.rotatematrix(data)

# One entry per run: (distance function, banner printed before the text tree,
# dendrogram output file).
runs = (
    (clusters.pearson,
     'clusters by pearson correlation',
     'wordsclustpearson.jpg'),
    (clusters.tanimoto,
     'clusters by tanimoto coefficient',
     'wordsclusttanimoto.jpg'),
    (clusters.euclidean,
     'clusters by euclidean distance',
     'wordsclusteuclidean.jpg'),
)

for metric, banner, image in runs:
    clust = clusters.hcluster(rdata, distance=metric)
    print(banner)
    clusters.printhclust(clust, labels=words)
    clusters.drawdendrogram(clust, words, jpeg=image)

예제 #3

파일 보기

import clusters

# Cluster the rows of the title vectors (labelled with `docs`) once per
# distance function. Each run prints a banner and the text tree, then writes
# a dendrogram image.
docs, words, data = clusters.readfile('titles_vectors.txt')

clust = clusters.hcluster(data, distance=clusters.pearson)
print('clusters by pearson correlation')
clusters.printhclust(clust, labels=docs)
clusters.drawdendrogram(clust, docs, jpeg='docsclust_pearson.jpg')

clust = clusters.hcluster(data, distance=clusters.tanimoto)
print('clusters by tanimoto coefficient')
clusters.printhclust(clust, labels=docs)
clusters.drawdendrogram(clust, docs, jpeg='docsclust_tanimoto.jpg')

clust = clusters.hcluster(data, distance=clusters.euclidean)
print('clusters by euclidean distance')
clusters.printhclust(clust, labels=docs)
clusters.drawdendrogram(clust, docs, jpeg='docsclust_euclidean.jpg')

clust = clusters.hcluster(data, distance=clusters.cosine)
# The banner previously said "euclidean distance" (copy-paste slip); this run
# uses clusters.cosine, so the output is labelled accordingly.
print('clusters by cosine distance')
clusters.printhclust(clust, labels=docs)
clusters.drawdendrogram(clust, docs, jpeg='docsclust_cosine.jpg')

예제 #4

파일 보기

파일: hcluster.py 프로젝트: supersglzc/clustering_lab

import clusters

row_names, column_names, data = clusters.readfile('dataset_vectors.txt')


def _show(tree, image):
    """Print the banner and text tree for *tree*, then render it to *image*."""
    # NOTE(review): every run prints this same banner even though the second
    # argument to hcluster differs between runs.
    print('clusters by euclidean distance')
    clusters.printhclust(tree, labels=row_names)
    clusters.drawdendrogram(tree, row_names, jpeg=image)


# NOTE(review): judging by the output file names, the optional second
# positional argument to hcluster selects a centroid / min / max strategy;
# confirm against this project's clusters.hcluster signature.
clust = clusters.hcluster(data)
_show(clust, 'hcluster_euclidean_centroid.jpg')

print()
clust = clusters.hcluster(data, clusters.find_by_min)
_show(clust, 'hcluster_euclidean_min.jpg')

print()
clust = clusters.hcluster(data, clusters.find_by_max)
_show(clust, 'hcluster_euclidean_max.jpg')

예제 #5

파일 보기

파일: hierarchical_cluster.py 프로젝트: jtsen/clustering_lab

import clusters, data_processing
# Import dataset
data = data_processing.open_csv_file('dataset.csv')
# Create a list of countries in the order of the similarity matrix
countries_list = data_processing.get_country_names(data)
# Create numerical attributes matrix
attr_matrix = data_processing.create_attribute_matrix(data)
# The return value is discarded, so this presumably converts attr_matrix in
# place; confirm against data_processing.str_to_float.
data_processing.str_to_float(attr_matrix)

# Hierarchical clustering: euclidean distance
num_cluster = 3  # not referenced in the visible part of this script
resulting_clusters = clusters.hcluster(attr_matrix,
                                       distance=clusters.euclidean)
print('clusters by euclidean distance')
clusters.printhclust(resulting_clusters, labels=countries_list)
clusters.drawdendrogram(resulting_clusters,
                        countries_list,
                        jpeg='Euclidean Cluster.jpg')

# Hierarchical clustering: tanimoto coefficient
resulting_clusters = clusters.hcluster(attr_matrix, distance=clusters.tanimoto)
print('clusters by tanimoto coefficient')
clusters.printhclust(resulting_clusters, labels=countries_list)
clusters.drawdendrogram(resulting_clusters,
                        countries_list,
                        jpeg='Tanimoto Cluster.jpg')
print()

# Hierarchical clustering: pearson similarity
resulting_clusters = clusters.hcluster(attr_matrix, distance=clusters.pearson)
print('clusters by pearson correlation')
clusters.printhclust(resulting_clusters, labels=countries_list)
clusters.drawdendrogram(resulting_clusters,
                        countries_list,