Python Clustering.cluster Examples

Programming Language: Python

Namespace/Package Name: clustering

Class/Type: Clustering

Method/Function: cluster

Examples at hotexamples.com: 3

Python Clustering.cluster - 3 examples found. These are the top-rated real-world Python examples of clustering.Clustering.cluster extracted from open-source projects. You can rate the examples to help us improve their quality.

Frequently Used Methods

Show Hide

Clustering(30)

fit(6)

k_means(4)

createDistanceMatrix(3)

load(3)

buildTree(3)

fill_clusters(3)

run(3)

cluster(3)

createLevelMatrix(3)

lab_to_labels(2)

merge(2)

min_link(2)

mwk_means(2)

imwk_means(2)

ik_means(2)

start(2)

spectral(2)

melhor_da_geracao(1)

inputType(1)

kMeans(1)

thrEstimation(1)

kmeans(1)

kmeans_clustering(1)

kmeans_fit(1)

list_cluster(1)

spectral_decomp(1)

mds_decomp(1)

preProcess(1)

predict(1)

selecao(1)

run_spectral_rotate(1)

run_clustering(1)

mutacao(1)

run_SKMeans_137(1)

mwpam(1)

nn_centers(1)

proclus(1)

plot(1)

print_clusters(1)

pp_distance(1)

pam(1)

get_double_centre(1)

get_label_mapping(1)

dbscan_clustering(1)

MDS_decomp(1)

addnext(1)

agnes_clustering(1)

ahc_fit(1)

avgTree(1)

Example #1

Show file

from log_parser import LogParser
from feature_extractor import FeatureExtractor
from clustering import Clustering
from idf import IDF

# Parse the log file; parse() returns the tagged events and the log sequences.
parser = LogParser('../../data/HDFS_2K.log')
tagged_events, log_sequences = parser.parse()

# Run feature extraction over the sequences, passing the keys of
# tagged_events as a list.
event_keys = list(tagged_events.keys())
extractor = FeatureExtractor(log_sequences, event_keys)
log_sequences = extractor.extract()

# Cluster the extracted sequences.
clustering = Clustering(log_sequences, tagged_events)
cluster_ids, cluster_values, silhouette = clustering.cluster()

# Print only the clusters whose 'num_possible_abnormal_events' is non-zero,
# each followed by a blank line.
for cluster_value in cluster_values:
    if cluster_value['num_possible_abnormal_events'] == 0:
        continue
    print(cluster_value)
    print()

# The silhouette coefficient is kept in `silhouette`; printing it is disabled.

Example #2

Show file

File: initial_clustering.py Project: shashankavusali/Naberfeed

    # Fetch at most 10,000 article documents, projecting only the `_id` and
    # `keywords` fields.
    # NOTE(review): `db` looks like a MongoDB (pymongo) database handle --
    # confirm against the enclosing function, which is not visible here.
    articles = list(
        db.articles.find({}, {
            '_id': 1,
            'keywords': 1
        }).limit(10000))
    # Parallel arrays built from the same list in the same order: position k
    # in both refers to the same article.
    article_keywords = np.array([article['keywords'] for article in articles])
    article_object_ids = np.array([article['_id'] for article in articles])

    # A deep copy is handed to ArticleDistance, so `article_keywords` itself
    # is not shared with it.
    a_dist = ArticleDistance(copy.deepcopy(article_keywords))
    dists = a_dist.article_pdist()
    n = dists.shape[0]
    # Force the diagonal (each article's distance to itself) to zero.
    dists[range(n), range(n)] = 0
    # NOTE(review): presumably scipy.spatial.distance.squareform, converting
    # the square matrix to condensed form -- confirm which `distance` module
    # is imported.
    d = distance.squareform(dists)

    cluster = Clustering(d)
    c = cluster.cluster()
    extractor = TopicExtractor()

    # One iteration per distinct value in `c`.
    # NOTE(review): this assumes the labels in `c` are exactly the integers
    # 0..k-1; any other labelling would leave some clusters unprocessed --
    # confirm what Clustering.cluster() returns.
    for i in range(len(np.unique(c))):
        # Rebinds `articles` (previously the fetched documents) to the list
        # of ids that belong to cluster i.
        articles = []
        indices = np.where(c == i)[0]
        articles.extend(article_object_ids[indices])
        whole_keywords = []
        whole_keywords.extend(article_keywords[indices])
        # Set `cluster_id` to i on every document whose `_id` is in this
        # cluster's id list.
        db.articles.update_many({'_id': {
            '$in': articles
        }}, {'$set': {
            'cluster_id': i
        }})
        # Both results are unused within the visible lines; any consumer
        # lies beyond this excerpt.
        topic_words, cluster_word_counts = extractor.extract_topic_keywords(
            whole_keywords)

Example #3

Show file

    # Tail of an earlier branch of the method_identifier if/elif chain; the
    # branch header is not visible in this excerpt.
    from regressor import Regressor

    # Build the regressor from the algorithm name, predict for X_test from
    # the training data, and score the predictions against y_test.
    regressor = Regressor(algorithm_name)
    y_predicted = regressor.predict(X_train, y_train, X_test)
    regressor_score = regressor.get_score(y_test, y_predicted)

    # Visualizing the results
    visualizer = Visualizer()
    visualizer.plot_classifier_regressor(y_test, y_predicted,
                                         method_identifier)

    print('The coefficient of determination is: ' + str(regressor_score))
    print(algorithm_name)

# ---------------------Clustering the data------------------------------------
elif method_identifier == 3:

    # Imported inside the branch, so the module is only loaded when this
    # branch runs.
    from clustering import Clustering

    # tune_parameters() supplies the cluster count and the inertia; the count
    # is then passed on to cluster() together with the train and test data.
    clustering = Clustering(algorithm_name)
    n_clusters, inertia = clustering.tune_parameters(X_train)
    clusters = clustering.cluster(X_train, X_test, n_clusters)

    # Visualizing the results
    visualizer = Visualizer()
    visualizer.plot_clustering(X_test, clusters)

    print("The clustering model's inertia: " + str(inertia))
    print(str(algorithm_name))