def do_compute(reference_txt, pre_clustering_txt, groundtruth_npy):
    """Build a pairwise "same reference cluster" matrix for hypothesis clusters.

    Loads a reference clustering and a hypothesis (pre-)clustering, decides
    for every hypothesis cluster whether it is *pure* (all its elements share
    one reference cluster), then saves an nPreClusters x nPreClusters integer
    matrix to `groundtruth_npy` via np.save.
    """
    # load reference clusters
    reference = Clustering.load(reference_txt)
    # load hypothesis clusters
    hypothesis = Clustering.load(pre_clustering_txt)
    # number of hypothesis clusters
    nPreClusters = len(hypothesis.clusters)
    # sorted hypothesis cluster labels
    preClusters = sorted(hypothesis.clusters)
    # groundtruth[i, j] contains
    # 1 if all elements in clusters i and j are in the same cluster
    # 0 if elements in clusters i and j are not in the same cluster
    # -1 if either cluster i or j is not pure
    # NOTE(review): allocated with np.empty and then indexed directly by
    # cluster *labels* (ci, cj) below — this assumes the labels are exactly
    # 0 .. nPreClusters-1; otherwise some cells stay uninitialized and
    # indexing may go out of bounds. TODO confirm against Clustering.load.
    groundtruth = np.empty((nPreClusters, nPreClusters), dtype=int)
    # clustersRef[c] contains reference cluster for pure hypothesis cluster c
    # in case c is not pure, clustersRef[c] is None
    clustersRef = {}
    for c in preClusters:
        # set of reference labels covering the elements of hypothesis cluster c
        r = set([reference[i] for i in hypothesis.clusters[c]])
        if len(r) == 1:
            # pure cluster: remember its unique reference label
            clustersRef[c] = r.pop()
        else:
            clustersRef[c] = None
    for k, ci in enumerate(preClusters):
        if clustersRef[ci] is None:
            # impure cluster: invalidate its whole row and column
            groundtruth[ci, :] = -1
            groundtruth[:, ci] = -1
            continue
        # only the upper triangle (cj >= ci) is computed; the symmetric
        # entry is mirrored immediately
        for cj in preClusters[k:]:
            if clustersRef[cj] is not None:
                # 1 when both pure clusters map to the same reference cluster
                groundtruth[ci, cj] = clustersRef[ci] == clustersRef[cj]
                groundtruth[cj, ci] = groundtruth[ci, cj]
    # save groundtruth matrix
    np.save(groundtruth_npy, groundtruth)
def do_it(image_txt, features_npy, clustering_txt, output_npy): # load image list with open(image_txt, 'r') as f: images = [int(line.strip()) for line in f.readlines()] image2index = {image: index for index, image in enumerate(images)} # load hypothesis clusters clustering = Clustering.load(clustering_txt) clusters = sorted(clustering.clusters) # load features features = np.load(features_npy) # L2 normalization (for later dot product) features = (features.T / np.sqrt(np.sum((features**2), axis=1))).T # find centroid image for every cluster centroid = {} for c, cluster in enumerate(clusters): # list of images in current cluster _images = clustering.clusters[cluster] # corresponding indices in features matrix _indices = [image2index[image] for image in _images] # compute distance matrix between # all images of current cluster _features = features[_indices, :] _distance = 1. - np.dot(_features, _features.T) # find centroid image i = np.argmin(np.sum(_distance, axis=0)) centroid[cluster] = _images[i] print 'image %s is centroid of cluster %s' % (centroid[cluster], cluster) # centroid indices in features matrix _indices = [image2index[centroid[cluster]] for cluster in clusters] # compute distance matrix between all centroids _features = features[_indices, :] _distance = 1. - np.dot(_features, _features.T) # save distance matrix with open(output_npy, 'wb') as f: np.save(f, _distance)
def do_it(image_txt, features_npy, clustering_txt, output_npy): # load image list with open(image_txt, 'r') as f: images = [int(line.strip()) for line in f.readlines()] image2index = {image: index for index, image in enumerate(images)} # load hypothesis clusters clustering = Clustering.load(clustering_txt) clusters = sorted(clustering.clusters) # load features features = np.load(features_npy) # L2 normalization (for later dot product) features = (features.T / np.sqrt(np.sum((features ** 2), axis=1))).T # find centroid image for every cluster centroid = {} for c, cluster in enumerate(clusters): # list of images in current cluster _images = clustering.clusters[cluster] # corresponding indices in features matrix _indices = [image2index[image] for image in _images] # compute distance matrix between # all images of current cluster _features = features[_indices, :] _distance = 1. - np.dot(_features, _features.T) # find centroid image i = np.argmin(np.sum(_distance, axis=0)) centroid[cluster] = _images[i] print 'image %s is centroid of cluster %s' % (centroid[cluster], cluster) # centroid indices in features matrix _indices = [image2index[centroid[cluster]] for cluster in clusters] # compute distance matrix between all centroids _features = features[_indices, :] _distance = 1. - np.dot(_features, _features.T) # save distance matrix with open(output_npy, 'wb') as f: np.save(f, _distance)
for k, v in cluster.iteritems(): for photo in v: file.write("%d\t%d\n" % (photo, k)) file.close() print "Loading json into memory..." dictionary = readjson( "/vol/corpora4/mediaeval/2014/SED_2014_Dev_Metadata.json") print "...Done !" clusterU = clusterUser(dictionary, fileID) clusterD = clusterDate(dictionary, fileID, clusterU) print_result_file(clusterD, fileOUT) reference = Clustering.load(fileREF) hypothesis = Clustering.load(fileOUT) images = [] for c in clusterD.values(): for i in range(0, len(c)): images.append(c[i]) h = homogeneity(reference, hypothesis, images) print h c = completeness(reference, hypothesis, images) print c
file = open(filename, "w") for k, v in cluster.iteritems(): for photo in v: file.write("%d\t%d\n" % (photo, k)) file.close() print "Loading json into memory..." dictionary = readjson("/vol/corpora4/mediaeval/2014/SED_2014_Dev_Metadata.json") print "...Done !" clusterU = clusterUser(dictionary, fileID) clusterD = clusterDate(dictionary, fileID, clusterU) print_result_file(clusterD, fileOUT) reference = Clustering.load(fileREF) hypothesis = Clustering.load(fileOUT) images = [] for c in clusterD.values(): for i in range (0, len(c)): images.append(c[i]) h = homogeneity(reference, hypothesis, images) print h c = completeness(reference, hypothesis, images) print c