Python BTree.right 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: BTree

클래스/타입: BTree

메소드/함수: right

hotexamples.com에서의 예제들: 2

Python BTree.right - 2개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python BTree.BTree.right의 실제 사용 예제 중 가장 높은 평가를 받은 것들입니다. 예제를 평가해 주시면 예제 품질을 개선하는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

BTree(30)

insert(16)

delete(6)

json(5)

all_clustering_dic(2)

indices(2)

right(2)

__init__(2)

left(2)

where_dominant(2)

print(1)

weight(1)

values(1)

traverse(1)

stop(1)

search(1)

root(1)

bulkload(1)

query(1)

print_order(1)

print_anagrams(1)

printPreOrder(1)

printInOrder(1)

addOccurrence(1)

display(1)

obtener_documentos(1)

ll(1)

bic(1)

key(1)

children(1)

insertar(1)

add(1)

inorder(1)

contains(1)

get_best_index(1)

expand(1)

empty(1)

dump(1)

populate_tree(1)

예제 #1

파일 보기

def Matryoshka(data, merge_cutoff=0.1, max_k=10, max_ndim=2, bic='bic'):
    """Recursively split ``data`` into a binary tree of ``BTree`` nodes.

    A call returns a leaf (key ``('leaf',)``) when ``data`` has 20 rows or
    fewer, or when ``HiScanFeatures`` reports no separable feature.
    Otherwise the feature with the highest score becomes the node key, the
    rows are divided by that feature's bipartition, and both halves are
    processed recursively.

    Args:
        data: pandas DataFrame of observations (rows) by features (columns).
        merge_cutoff: forwarded unchanged to ``HiScanFeatures``.
        max_k: forwarded unchanged to ``HiScanFeatures``.
        max_ndim: forwarded unchanged to ``HiScanFeatures``.
        bic: forwarded unchanged to ``HiScanFeatures``.

    Returns:
        The ``BTree`` node for ``data``. Every node gets ``indices`` (row
        labels of ``data``) and ``all_clustering_dic``; internal nodes also
        get ``where_dominant``, ``left`` and ``right``.
    """
    # Too few rows to attempt a split.
    if data.shape[0] <= 20:
        root = BTree(('leaf', ))
        root.indices = data.index.values.tolist()
        root.all_clustering_dic = _set_small_leaf(data)
        return root

    separable_features, bipartitions, scores, all_clustering_dic = HiScanFeatures(
        data, merge_cutoff, max_k, max_ndim, bic)

    # Nothing separates the rows: stop here with a leaf.
    if len(separable_features) == 0:
        root = BTree(('leaf', ))
        root.indices = data.index.values.tolist()
        root.all_clustering_dic = all_clustering_dic
        return root

    idx_best = np.argmax(scores)
    best_feature = separable_features[idx_best]
    # Assumed to be a boolean row mask over ``data`` (it is negated with ``~``
    # and used as a row selector below) — TODO confirm against HiScanFeatures.
    best_partition = bipartitions[best_feature]

    ## construct current node
    root = BTree(best_feature)
    root.indices = data.index.values.tolist()
    root.all_clustering_dic = all_clustering_dic

    ## branch cells, component with higher mean goes right.
    p1_mean = data.loc[best_partition, best_feature].mean(0)
    p2_mean = data.loc[~best_partition, best_feature].mean(0)

    if len(p1_mean) == 1:
        # Single feature: compare the two means directly.
        p1_is_dominant = bool(p1_mean.values > p2_mean.values)
    else:
        # Several features: compare sum(mean) / ||mean|| of each side.
        p1_cosine = sum(p1_mean) / np.sqrt(sum(p1_mean**2))
        p2_cosine = sum(p2_mean) / np.sqrt(sum(p2_mean**2))
        p1_is_dominant = p1_cosine > p2_cosine

    if p1_is_dominant:
        right_mask, left_mask = best_partition, ~best_partition
        root.where_dominant = 'right'
    else:
        right_mask, left_mask = ~best_partition, best_partition
        root.where_dominant = 'left'

    # Use .loc for the row masks, consistent with the mean computation above:
    # .loc accepts both boolean arrays and aligned boolean Series, whereas
    # .iloc rejects a boolean Series mask.
    child_right = data.loc[right_mask, :]
    child_left = data.loc[left_mask, :]

    ## recursion
    root.left = Matryoshka(child_left, merge_cutoff, max_k, max_ndim, bic)
    root.right = Matryoshka(child_right, merge_cutoff, max_k, max_ndim, bic)

    return root

예제 #2

파일 보기

def ReSplit(data, merge_cutoff=0.1, weight=1, max_k=10, max_ndim=2, bic='bic'):
    """Recursively split ``data`` into a weighted binary tree of ``BTree`` nodes.

    Every node starts as a leaf (key ``('leaf',)``) carrying the row labels
    of ``data`` and its ``weight``. The node stays a leaf, with ``stop``
    recording the reason, when ``data`` has fewer than 2 rows, when
    ``HiScanFeatures`` reports no separable feature, or when the best score
    in ``scores_ll`` is below 0.001. Otherwise the best-scoring feature
    becomes the node key and both halves of its bipartition are processed
    recursively, each with ``weight`` scaled by its share of the rows.

    Args:
        data: pandas DataFrame of observations (rows) by features (columns).
        merge_cutoff: forwarded unchanged to ``HiScanFeatures``.
        weight: weight of this node; the top-level call uses the default 1.
        max_k: forwarded unchanged to ``HiScanFeatures``.
        max_ndim: forwarded unchanged to ``HiScanFeatures``.
        bic: forwarded unchanged to ``HiScanFeatures``.

    Returns:
        The ``BTree`` node for ``data``.
    """
    root = BTree(('leaf', ))
    root.indices = data.index.values.tolist()
    root.weight = weight

    # Fewer than two rows cannot be split.
    if data.shape[0] < 2:
        root.all_clustering_dic = _set_small_leaf(data)
        root.stop = 'small size'
        return root

    # Baseline: one full-covariance Gaussian fitted to all rows of this node.
    unimodal = GaussianMixture(1, covariance_type='full').fit(data)
    root.ll = root.weight * unimodal.lower_bound_
    root.bic = unimodal.bic(data)

    # bic_list is returned by HiScanFeatures but not used in this function.
    (separable_features, bipartitions, scores_ll, bic_list,
     all_clustering_dic) = HiScanFeatures(data, root, merge_cutoff, max_k,
                                          max_ndim, bic)

    if len(separable_features) == 0:
        root.all_clustering_dic = all_clustering_dic
        root.stop = 'no separable features'
        return root

    idx_best = np.argmax(scores_ll)
    if np.max(scores_ll) < 0.001:
        # NOTE(review): unlike the other leaf exits, this path does not
        # assign all_clustering_dic — confirm that is intended.
        root.stop = 'spliting increases bic'
        return root

    best_feature = separable_features[idx_best]
    # Assumed to be a boolean row mask over ``data`` (it is negated with ``~``
    # and used as a row selector below) — TODO confirm against HiScanFeatures.
    best_partition = bipartitions[best_feature]

    ## construct current node
    root.key = best_feature
    root.all_clustering_dic = all_clustering_dic

    ## branch cells, component with higher mean goes right.
    p1_mean = data.loc[best_partition, best_feature].mean(0)
    p2_mean = data.loc[~best_partition, best_feature].mean(0)

    if len(p1_mean) == 1:
        # Single feature: compare the two means directly.
        p1_is_dominant = bool(p1_mean.values > p2_mean.values)
    else:
        # Several features: compare sum(mean) / ||mean|| of each side.
        p1_cosine = sum(p1_mean) / np.sqrt(sum(p1_mean**2))
        p2_cosine = sum(p2_mean) / np.sqrt(sum(p2_mean**2))
        p1_is_dominant = p1_cosine > p2_cosine

    # Fraction of this node's rows that falls on each side of the partition.
    n_rows = len(best_partition)
    p1_fraction = sum(best_partition) / n_rows
    p2_fraction = sum(~best_partition) / n_rows

    if p1_is_dominant:
        right_mask, w_r = best_partition, p1_fraction
        left_mask, w_l = ~best_partition, p2_fraction
        root.where_dominant = 'right'
    else:
        right_mask, w_r = ~best_partition, p2_fraction
        left_mask, w_l = best_partition, p1_fraction
        root.where_dominant = 'left'

    # Use .loc for the row masks, consistent with the mean computation above:
    # .loc accepts both boolean arrays and aligned boolean Series, whereas
    # .iloc rejects a boolean Series mask.
    child_right = data.loc[right_mask, :]
    child_left = data.loc[left_mask, :]

    ## recursion
    root.left = ReSplit(child_left, merge_cutoff, weight * w_l, max_k,
                        max_ndim, bic)
    root.right = ReSplit(child_right, merge_cutoff, weight * w_r, max_k,
                         max_ndim, bic)

    return root