Python KMeans.calculate_performanceの例

プログラミング言語: Python

名前空間/パッケージ名: k_means

クラス/型: KMeans

メソッド/関数: calculate_performance

hotexamples.comのコード掲載数: 4

Python KMeans.calculate_performance - 4件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたPythonのk_means.KMeans.calculate_performanceの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示 / 非表示

KMeans(30)

fit(9)

cluster(7)

train(7)

run(6)

calculate_performance(4)

get_centroids(2)

print_results(2)

main_loop(2)

predict(2)

open_dataset(1)

k_means(1)

kmeans(1)

train_model(1)

print_distance(1)

plot_objective_function(1)

step(1)

initCentroids(1)

report(1)

run_k_means(1)

start(1)

init_centers(1)

get_clusters(1)

get_sse_score(1)

classify_centroids(1)

_get_initial_centroids(1)

_is_finish(1)

_squared_euclidian_dist(1)

_update_centroids_and_data(1)

calc_err(1)

calculate_sse(1)

centroids_find_closest(1)

cluster_points(1)

get_msc_avg(1)

compute_sse(1)

evaluate(1)

findClosestCentroids(1)

find_centers(1)

fit_predict(1)

get_cluster(1)

_choose_cluster(1)

update_k(1)

コード例 #1

ファイルを表示

ファイル: genetic_algorithm_feature_selection.py プロジェクト: Max-1892/machine_learning

def evaluate_model(model, model_type, num_of_classes, candidate_feature_set, data_set):
    """Cluster ``data_set`` on a feature subset and return the model's score.

    The original author describes the score as an LDA-like objective
    function; it is whatever ``calculate_performance()`` returns.

    Args:
        model: Fallback clustering object. It is used as-is when
            ``model_type`` is neither "Kmeans" nor "HAC"; otherwise it is
            replaced by a freshly constructed model. It must provide
            ``cluster(data)`` and ``calculate_performance()``.
        model_type: "Kmeans" or "HAC" to build a new model of that kind.
        num_of_classes: Argument passed to the KMeans / HAC constructor.
        candidate_feature_set: Sequence of 0/1 flags, one per column of
            ``data_set`` (for example ``[1, 0, 0, 1, 0]`` selects columns
            0 and 3).
        data_set: Array that supports ``data_set[:, list_of_columns]``.

    Returns:
        The value of ``model.calculate_performance()`` after clustering.
    """
    # Convert the flag vector f_1, ..., f_d into the list of indices whose
    # flag is 1. enumerate() runs on both Python 2 and 3, unlike xrange().
    selected_columns = [
        idx for idx, flag in enumerate(candidate_feature_set) if flag == 1
    ]
    if model_type == "Kmeans":
        model = KMeans(num_of_classes)
    elif model_type == "HAC":
        model = HAC(num_of_classes)
    model.cluster(data_set[:, selected_columns])
    return model.calculate_performance()

コード例 #2

ファイルを表示

ファイル: stepwise_forward_selection.py プロジェクト: Max-1892/machine_learning

def perform_SFS_feature_selection(model, model_type, num_of_classes, data_set):
    """Pick feature columns by greedy stepwise forward selection (SFS).

    Starting from an empty selection, each round tries adding every
    remaining column, clusters the data restricted to that candidate
    subset, and keeps the column with the highest score. Selection stops
    when no remaining column improves on the best score so far, or when
    every column has been chosen.

    Args:
        model: Fallback clustering object. It is used as-is when
            ``model_type`` is neither "Kmeans" nor "HAC"; otherwise a new
            model is constructed for every candidate. It must provide
            ``cluster(data)`` and ``calculate_performance()``.
        model_type: "Kmeans" or "HAC" to build a new model of that kind.
        num_of_classes: Argument passed to the KMeans / HAC constructor.
        data_set: Two-dimensional array; ``data_set.shape[1]`` is the number
            of features, and ``data_set[:, list_of_columns]`` must work.

    Returns:
        A ``(chosen_features, chosen_clusters)`` tuple: the selected column
        indices in the order they were added, and the value returned by
        ``model.cluster`` for the best subset found (``[]`` if none).
    """
    # Column indices that have not been selected yet.
    feature_set = list(range(data_set.shape[1]))
    chosen_features = []
    chosen_clusters = []
    base_performance = float("-inf")
    # While there are still features to choose from...
    while feature_set:
        # Best candidate seen in this round.
        best_performance = float("-inf")
        best_feature = None
        best_clusters = []
        # Try each feature that hasn't been chosen yet.
        for feature in feature_set:
            candidate_features = chosen_features + [feature]
            if model_type == "Kmeans":
                model = KMeans(num_of_classes)
            elif model_type == "HAC":
                model = HAC(num_of_classes)
            # Cluster only on the candidate columns. Clustering on the full
            # data set would give every candidate the same input and make
            # the selection meaningless.
            clusters = model.cluster(data_set[:, candidate_features])
            # Score the clustering (LDA-like objective per the author).
            current_performance = model.calculate_performance()
            if current_performance > best_performance:
                best_performance = current_performance
                best_feature = feature
                best_clusters = clusters
        # Stop as soon as the best candidate of this round does not beat
        # the best score achieved by the already-chosen features.
        if not best_performance > base_performance:
            break
        base_performance = best_performance
        feature_set.remove(best_feature)
        chosen_features.append(best_feature)
        chosen_clusters = best_clusters
    return chosen_features, chosen_clusters

コード例 #3

ファイルを表示

ファイル: test_harness.py プロジェクト: Max-1892/machine_learning

   # Excerpt from a test harness: load one comma-separated data file and
   # print clustering performance on hard-coded feature-column subsets.
   # NOTE(review): `test` and `data_instances` are defined outside this
   # excerpt; here test[0] is used as the file path and test[1] as the
   # KMeans / HAC constructor argument.
   # NOTE(review): data_file is not closed anywhere in this excerpt.
   data_file = open(test[0])
   print "Running with %s" % test[0]
   # Parse every line into a row of floats (Python 2: map returns a list).
   for line in data_file:
       line_split = line.split(',')
       data_instances.append(map(float, line_split))
   data_instances = np.array(data_instances)

   # Build the k-means and HAC models used below
   kmeans_model = KMeans(test[1])
   hac_model = HAC(test[1])

   # Glass dataset (selected when the file path contains "glass")
   if "glass" in test[0]:
      # Columns 1 and 3 -- presumably the subset SFS chose for k-means
      kmeans_sfs_glass = np.array([1,3])
      kmeans_model.cluster(data_instances[:,kmeans_sfs_glass])
      print "Kmeans SFS glass performance = %f" % kmeans_model.calculate_performance()

      # Columns 0-6 -- presumably the subset the GA chose for k-means;
      # a fresh KMeans is built before clustering again.
      kmeans_ga_glass = np.array([0,1,2,3,4,5,6])
      kmeans_model = KMeans(test[1])
      kmeans_model.cluster(data_instances[:,kmeans_ga_glass])
      print "Kmeans GA glass performance = %f" % kmeans_model.calculate_performance()

      # Column 0 only, clustered with the HAC model built above
      hac_sfs_glass = np.array([0])
      hac_model.cluster(data_instances[:,hac_sfs_glass])
      print "HAC SFS glass performance = %f" % hac_model.calculate_performance()

   # Iris dataset (selected when the file path contains "iris")
   elif "iris" in test[0]:
      kmeans_sfs_iris = np.array([1])
      kmeans_model = KMeans(test[1])
      kmeans_model.cluster(data_instances[:,kmeans_sfs_iris])

コード例 #4

ファイルを表示

ファイル: main.py プロジェクト: sungwons/Machine_Learning

    print "Running with %s" % test[0]
    for line in data_file:
        line_split = line.split(',')
        data_instances.append(map(float, line_split))
    data_instances = np.array(data_instances)

    # Run SFS using k-means and HAC
    kmeans_model = KMeans(test[1])
    hac_model = HAC(test[1])

    # Glass dataset
    if "glass" in test[0]:
        kmeans_sfs_glass = np.array([1, 3])
        kmeans_model.cluster(data_instances[:, kmeans_sfs_glass])
        print("K-means SFS glass performance = %f" %
              kmeans_model.calculate_performance())

        kmeans_ga_glass = np.array([0, 1, 2, 3, 4, 5, 6])
        kmeans_model = KMeans(test[1])
        kmeans_model.cluster(data_instances[:, kmeans_ga_glass])
        print("K-means GA glass performance = %f" %
              kmeans_model.calculate_performance())

        hac_sfs_glass = np.array([0])
        hac_model.cluster(data_instances[:, hac_sfs_glass])
        print("HAC SFS glass performance = %f" %
              hac_model.calculate_performance())

    # Iris dataset
    elif "iris" in test[0]:
        kmeans_sfs_iris = np.array([1])