Python Clustering.k_means 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: clustering

클래스/타입: Clustering

메소드/함수: k_means

hotexamples.com에서의 예제들: 4

Python Clustering.k_means - 4개의 예제를 찾았습니다. 오픈소스 프로젝트에서 추출한 Python clustering.Clustering.k_means의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

Clustering(30)

fit(6)

k_means(4)

createDistanceMatrix(3)

load(3)

buildTree(3)

fill_clusters(3)

run(3)

cluster(3)

createLevelMatrix(3)

lab_to_labels(2)

merge(2)

min_link(2)

mwk_means(2)

imwk_means(2)

ik_means(2)

start(2)

spectral(2)

melhor_da_geracao(1)

inputType(1)

kMeans(1)

thrEstimation(1)

kmeans(1)

kmeans_clustering(1)

kmeans_fit(1)

list_cluster(1)

spectral_decomp(1)

mds_decomp(1)

preProcess(1)

predict(1)

selecao(1)

run_spectral_rotate(1)

run_clustering(1)

mutacao(1)

run_SKMeans_137(1)

mwpam(1)

nn_centers(1)

proclus(1)

plot(1)

print_clusters(1)

pp_distance(1)

pam(1)

get_double_centre(1)

get_label_mapping(1)

dbscan_clustering(1)

MDS_decomp(1)

addnext(1)

agnes_clustering(1)

ahc_fit(1)

avgTree(1)

예제 #1

파일 보기

    def clusterize(self):
        """Prepare the clustering data, then run k-means with 2, 3 and 4.

        Prints a banner line, calls ``self.process_clustering_data()``, builds
        one ``Clustering`` object from ``self.clustering_df`` and invokes its
        ``k_means`` method once per value, in ascending order.
        """
        print("\nclusterize")

        self.process_clustering_data()

        model = Clustering(self.clustering_df)
        # The same Clustering instance is reused for every run.
        for cluster_count in (2, 3, 4):
            model.k_means(cluster_count)

예제 #2

파일 보기

파일: run.py 프로젝트: wenyishengkingkong/k-means

def main(fn, clusters_no):
    """Cluster the locations listed in a CSV file and print the outcome.

    The file ``fn`` is read with ``pd.read_csv``; each row's ``LAT`` and
    ``LON`` values are converted to ``float`` and wrapped in a ``Point``.
    The points and ``clusters_no`` are handed to ``Clustering``, whose
    ``k_means(False)`` result decides what is printed: an error line when
    it equals -1, otherwise the clusters via ``print_clusters``.
    """
    frame = pd.read_csv(fn)
    # One Point(latitude, longitude) per CSV row, in file order.
    points = [
        Point(float(record['LAT']), float(record['LON']))
        for _, record in frame.iterrows()
    ]

    model = Clustering(points, clusters_no)
    if model.k_means(False) == -1:
        print("Error in arguments!")
        return

    # Clustering results is a list of lists where each list represents one
    # cluster.
    print("Clustering results:")
    model.print_clusters(model.clusters)

예제 #3

파일 보기

####################################################################
# Benchmark stanzas: each one prints a label, times a single clustering
# call on `data`, then prints element [0] of
# cl.my_math.compare_categorical_vectors(u, y) as the accuracy.
# NOTE(review): `cl`, `data`, `y` and `time` come from outside this
# excerpt; every stanza rebinds `start`, `u`, `ite` and `dist_tmp`.
print('Minkowski Weighted PAM')
start = time.time()
# NOTE(review): the trailing `False, 10` arguments are dropped in the next
# stanza, which is labelled "Initialized with Minkowski Build" -- presumably
# they disable that initialisation and set a repeat count; confirm against
# mwpam's signature.
[u, medoids, weights, ite, dist_tmp] = cl.mwpam(data, 3, 1.1, False, 10)
print('Time elapsed: ', time.time()-start)
print('Accuracy: ', cl.my_math.compare_categorical_vectors(u, y)[0])
####################################################################
print('Minkowski Weighted PAM (Initialized with Minkowski Build)')
start = time.time()
# Same call as above but relying on mwpam's defaults for the last arguments.
[u, medoids, weights, ite, dist_tmp] = cl.mwpam(data, 3, 1.1)
print('Time elapsed: ', time.time()-start)
print('Accuracy: ', cl.my_math.compare_categorical_vectors(u, y)[0])
####################################################################
print('K-Means')
start = time.time()
# k_means yields four values here (no weights), unlike the weighted variants.
[u, centroids, ite, dist_tmp] = cl.k_means(data, 3, replicates=10)
print('Time elapsed: ', time.time()-start)
print('Accuracy: ', cl.my_math.compare_categorical_vectors(u, y)[0])
####################################################################
print('iK-Means')
start = time.time()
# ik_means additionally yields init_centroids as a fifth value.
[u, centroids, ite, dist_tmp, init_centroids] = cl.ik_means(data, 3)
print('Time elapsed: ', time.time()-start)
print('Accuracy: ', cl.my_math.compare_categorical_vectors(u, y)[0])
####################################################################
print('WK-Means')
start = time.time()
# NOTE(review): 1.1 is passed in the same position as for mwpam above --
# presumably the same exponent parameter; confirm against wk_means.
[u, centroids, weights, ite, dist_tmp] = cl.wk_means(data, 3, 1.1, replicates=10)
print('Time elapsed: ', time.time()-start)
print('Accuracy: ', cl.my_math.compare_categorical_vectors(u, y)[0])
####################################################################

예제 #4

파일 보기

def subspace_cluster(datapath,
                     ypath,
                     algorithm,
                     k,
                     sep=",",
                     preprocess_method="standard",
                     replicates=10,
                     max_ite=100,
                     beta=2,
                     init_weights=None,
                     init_centroids=None,
                     init_weights_method="random",
                     is_sparse=0,
                     threshold=0.9,
                     l=2,
                     minDeviation=0.1,
                     A=30,
                     B=10):
    np.seterr(all='raise')
    cl = Clustering()
    data_ori = np.genfromtxt(datapath, delimiter=sep)
    y = np.genfromtxt(ypath)
    data = data_preprocess(data_ori, preprocess_method)

    if algorithm == 'K-Means':
        print 'using K-Means'
        start = time.time()
        [u, centroids, ite, dist_tmp] = cl.k_means(data, k, replicates)
        time_elapsed = time.time() - start
        acc = cl.my_math.compare_categorical_vectors(u, y)[0]
        print 'Time elapsed: ', time_elapsed
        print 'Accuracy: ', acc
        return [u, centroids, ite, dist_tmp], time_elapsed, acc
    elif algorithm == 'iK-Means':
        print 'using iK-Means'
        start = time.time()
        [u, centroids, ite, dist_tmp, init_centroids] = cl.ik_means(data, k)
        time_elapsed = time.time() - start
        acc = cl.my_math.compare_categorical_vectors(u, y)[0]
        print 'Time elapsed: ', time_elapsed
        print 'Accuracy: ', acc
        return [u, centroids, ite, dist_tmp, init_centroids], time_elapsed, acc
    elif algorithm == 'WK-Means':
        print 'using WK-Means'
        start = time.time()
        [u, centroids, weights, ite,
         dist_tmp] = cl.wk_means(data,
                                 k,
                                 beta,
                                 init_centroids=init_centroids,
                                 init_weights=init_weights,
                                 replicates=replicates,
                                 max_ite=max_ite,
                                 init_weights_method=init_weights_method,
                                 is_sparse=is_sparse,
                                 threshold=threshold)
        time_elapsed = time.time() - start
        acc = cl.my_math.compare_categorical_vectors(u, y)[0]
        print 'Time elapsed: ', time_elapsed
        print 'Accuracy: ', acc
        return [u, centroids, weights, ite, dist_tmp], time_elapsed, acc
    elif algorithm == 'MWK-Means':
        print 'using MWK-Means'
        start = time.time()
        [u, centroids, weights, ite,
         dist_tmp] = cl.mwk_means(data,
                                  k,
                                  beta,
                                  init_centroids=init_centroids,
                                  init_weights=init_weights,
                                  replicates=replicates,
                                  max_ite=max_ite,
                                  init_weights_method=init_weights_method,
                                  is_sparse=is_sparse,
                                  threshold=threshold)
        time_elapsed = time.time() - start
        acc = cl.my_math.compare_categorical_vectors(u, y)[0]
        print 'Time elapsed: ', time_elapsed
        print 'Accuracy: ', acc
        return [u, centroids, weights, ite, dist_tmp], time_elapsed, acc
    elif algorithm == 'iMWK-Means':
        print 'using iMWK-Means'
        start = time.time()
        [u, centroids, weights, ite, dist_tmp] = cl.imwk_means(data, beta, k)
        time_elapsed = time.time() - start
        acc = cl.my_math.compare_categorical_vectors(u, y)[0]
        print 'Time elapsed: ', time_elapsed
        print 'Accuracy: ', acc
        return [u, centroids, weights, ite, dist_tmp], time_elapsed, acc
    elif algorithm == 'proclus':
        print 'using proclus'
        start = time.time()
        M, D, A, acc = cl.proclus(data,
                                  y,
                                  k,
                                  l,
                                  minDeviation=minDeviation,
                                  A=A,
                                  B=B,
                                  niters=max_ite)
        time_elapsed = time.time() - start
        print 'Time elapsed: ', time_elapsed
        print "Accuracy: %.4f" % acc
        return [M, D, A], time_elapsed, acc