def get_soln_graph_clustering(self, node_features):
    """Cluster per-sample node features into at most ``cfg.gen.n_max_object`` segments.

    For each superpixel segmentation in ``self.init_sp_seg`` a nifty graph is
    built from the (offset-corrected) edge ids, agglomerative clustering is run
    on that sample's node features, and the resulting node labels are projected
    back to pixel space via an elf region adjacency graph.

    Args:
        node_features: stacked per-node features for all samples; sliced per
            sample with ``self.n_offs``.

    Returns:
        Tuple of (stacked pixel label maps, concatenated node labels), both as
        float tensors on ``node_features.device``.
    """
    labels = []
    node_labels = []
    for i, sp_seg in enumerate(self.init_sp_seg):
        single_node_features = node_features[self.n_offs[i]:self.n_offs[i + 1]].detach().cpu().numpy()
        rag = nifty.graph.undirectedGraph(single_node_features.shape[0])
        # edge ids are global over the batch; shift into this sample's local node range
        rag.insertEdges((self.edge_ids[:, self.e_offs[i]:self.e_offs[i + 1]] - self.n_offs[i]).T.detach().cpu().numpy())
        # FIX: np.int / np.float aliases were removed in NumPy >= 1.24;
        # use explicit fixed-width dtypes instead.
        edge_weights = np.ones(rag.numberOfEdges, dtype=np.int64)  # unused since beta=1
        edge_sizes = np.ones(rag.numberOfEdges, dtype=np.int64)
        node_sizes = np.ones(rag.numberOfNodes, dtype=np.int64)
        policy = self.cluster_policy(
            graph=rag,
            edgeIndicators=edge_weights,
            edgeSizes=edge_sizes,
            nodeFeatures=single_node_features,
            nodeSizes=node_sizes,
            numberOfNodesStop=self.cfg.gen.n_max_object,
            beta=1,
            sizeRegularizer=0)
        clustering = nagglo.agglomerativeClustering(policy)
        clustering.run()
        node_labels.append(clustering.result())
        # project the node labels back onto the superpixel segmentation
        rag = elf.segmentation.features.compute_rag(np.expand_dims(sp_seg.cpu(), axis=0))
        labels.append(elf.segmentation.features.project_node_labels_to_pixels(rag, node_labels[-1]).squeeze())
    return torch.from_numpy(np.stack(labels).astype(np.float64)).to(node_features.device), \
        torch.from_numpy(np.concatenate(node_labels).astype(np.float64)).to(node_features.device)
def mala_clustering(graph, edge_features, edge_sizes, threshold, return_object=False):
    """ Compute segmentation with mala-style clustering.

    In "Large Scale Image Segmentation with Structured Loss based Deep Learning for Connectome Reconstruction":
    https://ieeexplore.ieee.org/stamp/stamp.jsp?arnumber=8364622

    Arguments:
        graph [nifty.graph] - graph to cluster
        edge_features [np.ndarray] - features used for clustering
        edge_sizes [np.ndarray] - sizes of edges
        threshold [float] - threshold to stop clustering
        return_object [bool] - return the (unrun) clustering object instead of the result
    """
    # the UCM-enabled policy is only needed when the caller wants the object back
    if return_object:
        make_policy = nagglo.malaClusterPolicyWithUcm
    else:
        make_policy = nagglo.malaClusterPolicy

    cluster_policy = make_policy(
        graph=graph,
        edgeIndicators=edge_features,
        nodeSizes=np.zeros(graph.numberOfNodes, dtype='float'),
        edgeSizes=edge_sizes,
        threshold=threshold,
    )
    agglo = nagglo.agglomerativeClustering(cluster_policy)
    if return_object:
        return agglo
    agglo.run()
    return agglo.result()
def agglomerative_clustering(graph, edge_features, node_sizes, edge_sizes, n_stop, size_regularizer, return_object=False):
    """ Compute segmentation with agglomerative clustering and an optional size regularizer.

    Arguments:
        graph [nifty.graph] - graph to cluster
        edge_features [np.ndarray] - features used for clustering
        node_sizes [np.ndarray] - sizes of nodes
        edge_sizes [np.ndarray] - sizes of edges
        n_stop [int] - target number of clusters
        size_regularizer [float] - strength of size regularizer
        return_object [bool] - return the (unrun) clustering object instead of the result
    """
    # pick the UCM-enabled policy only when the clustering object is requested
    if return_object:
        make_policy = nagglo.edgeWeightedClusterPolicyWithUcm
    else:
        make_policy = nagglo.edgeWeightedClusterPolicy

    cluster_policy = make_policy(
        graph=graph,
        edgeIndicators=edge_features,
        nodeSizes=node_sizes.astype('float'),
        edgeSizes=edge_sizes.astype('float'),
        numberOfNodesStop=n_stop,
        sizeRegularizer=size_regularizer,
    )
    agglo = nagglo.agglomerativeClustering(cluster_policy)
    if return_object:
        return agglo
    agglo.run()
    return agglo.result()
def test_gasp_abs_max(self):
    """GASP with the 'abs_max' (mutex-watershed style) linkage criterion."""
    policy = nagglo.get_GASP_policy(
        graph=self.g,
        signed_edge_weights=self.edgeIndicators,
        linkage_criteria='abs_max')
    agglo = nagglo.agglomerativeClustering(policy)
    agglo.run()
    seg = agglo.result()
    # expected: node 1 is split off while nodes 0, 2 and 3 share a cluster
    self.assertTrue(seg[0] != seg[1] and seg[0] == seg[2] and seg[0] == seg[3])
def mala_clustering(graph, edge_features, edge_sizes, threshold):
    """Run mala-style agglomerative clustering on ``graph`` and return node labels."""
    cluster_policy = nagglo.malaClusterPolicy(
        graph=graph,
        edgeIndicators=edge_features,
        # node sizes are not used by this policy; pass zeros
        nodeSizes=np.zeros(graph.numberOfNodes, dtype='float'),
        edgeSizes=edge_sizes,
        threshold=threshold)
    agglo = nagglo.agglomerativeClustering(cluster_policy)
    agglo.run()
    return agglo.result()
def test_gasp_sum(self):
    """GASP with the 'sum' linkage criterion and no cannot-link constraints."""
    policy = nagglo.get_GASP_policy(
        graph=self.g,
        signed_edge_weights=self.edgeIndicators,
        linkage_criteria='sum',
        add_cannot_link_constraints=False)
    agglo = nagglo.agglomerativeClustering(policy)
    agglo.run()
    seg = agglo.result().tolist()
    # expected: node 1 is separated; nodes 0, 2 and 3 end up together
    self.assertTrue(seg[0] != seg[1] and seg[0] == seg[2] and seg[0] == seg[3])
def agglomerative_clustering(graph, edge_features, node_sizes, edge_sizes, n_stop, size_regularizer):
    """Edge-weighted agglomerative clustering down to ``n_stop`` clusters.

    ``size_regularizer`` controls how strongly small clusters are favored
    for merging; node/edge sizes are cast to float as the policy expects.
    """
    cluster_policy = nagglo.edgeWeightedClusterPolicy(
        graph=graph,
        edgeIndicators=edge_features,
        nodeSizes=node_sizes.astype('float'),
        edgeSizes=edge_sizes.astype('float'),
        numberOfNodesStop=n_stop,
        sizeRegularizer=size_regularizer)
    agglo = nagglo.agglomerativeClustering(cluster_policy)
    agglo.run()
    return agglo.result()
def mala_clustering(graph, edge_features, edge_sizes, threshold):
    """ Compute segmentation with mala-style clustering.

    Arguments:
        graph [nifty.graph] - graph to cluster
        edge_features [np.ndarray] - features used for clustering
        edge_sizes [np.ndarray] - sizes of edges
        threshold [float] - threshold to stop clustering
    """
    # node sizes are unused by the mala policy; zeros satisfy the signature
    zero_node_sizes = np.zeros(graph.numberOfNodes, dtype='float')
    cluster_policy = nagglo.malaClusterPolicy(
        graph=graph,
        edgeIndicators=edge_features,
        nodeSizes=zero_node_sizes,
        edgeSizes=edge_sizes,
        threshold=threshold)
    agglo = nagglo.agglomerativeClustering(cluster_policy)
    agglo.run()
    return agglo.result()
def _segmentation_impl(self, graph, costs, node_sizes=None, edge_sizes=None):
    """Run this object's cluster policy on ``graph`` with edge ``costs``.

    When ``self.use_sizes`` is set, the caller must supply real node/edge
    sizes; otherwise uniform unit sizes are used.
    """
    if self.use_sizes:
        assert node_sizes is not None and edge_sizes is not None
        nsz, esz = node_sizes, edge_sizes
    else:
        # uniform sizes: every node / edge contributes equally
        nsz = np.ones(graph.numberOfNodes)
        esz = np.ones(graph.numberOfEdges)
    policy = self._cluster_policy(graph=graph, edge_features=costs,
                                  edge_sizes=esz, node_sizes=nsz)
    agglo = nagglo.agglomerativeClustering(policy)
    agglo.run()
    return agglo.result()
def graph_cluster(self, features, k, shape):
    """Cluster per-pixel ``features`` on an image grid graph into ``k`` clusters.

    Builds a 2D grid graph of the given ``shape``, runs cosine-distance
    agglomerative clustering on the node features until ``k`` nodes remain,
    and returns a consecutive long label tensor on ``features.device``.

    Args:
        features: per-node feature tensor (moved to CPU for clustering).
        k: target number of clusters.
        shape: spatial shape of the image grid.
    """
    # _centroid, label = kmeans2(mom_embed.cpu(), k, minit='random', iter=20)
    # build image grid graph
    graph = nifty.graph.undirectedGridGraph(shape)
    # FIX: the np.int alias was removed in NumPy >= 1.24; use np.int64 explicitly.
    edge_weights = np.ones(graph.numberOfEdges, dtype=np.int64)  # (beta=1) -> edge weights will not be used
    edge_sizes = np.ones(graph.numberOfEdges, dtype=np.int64)  # won't be used as well
    node_sizes = np.ones(graph.numberOfNodes, dtype=np.int64)  # nodes have equal initial masses
    # define cluster policy that does not use edge stats and that does not have
    # higher merge affinities for small clusters; that policy is only available
    # on this nifty fork https://github.com/paulhfu/nifty
    policy = nagglo.cosineDistNodeAndEdgeWeightedClusterPolicy(
        graph=graph,
        edgeIndicators=edge_weights,
        edgeSizes=edge_sizes,
        nodeFeatures=features.detach().cpu(),
        nodeSizes=node_sizes,
        numberOfNodesStop=k,
        beta=1,
        sizeRegularizer=0)
    clustering = nagglo.agglomerativeClustering(policy)
    clustering.run()
    label = torch.from_numpy(clustering.result().astype(np.int64)).to(features.device).long()
    # using kmeans does not guarantee k clusters (has no effect when using
    # agglomerative clustering); relabel to consecutive labeling
    for new, lbl in enumerate(torch.unique(label)):
        label[label == lbl] = new
    return label
def run_GASP(
        graph,
        signed_edge_weights,
        linkage_criteria='mean',
        add_cannot_link_constraints=False,
        edge_sizes=None,
        is_mergeable_edge=None,
        use_efficient_implementations=True,
        verbose=False,
        linkage_criteria_kwargs=None,
        print_every=100000):
    """
    Run the Generalized Algorithm for Agglomerative Clustering on Signed Graphs (GASP).
    The C++ implementation is currently part of the nifty library (https://github.com/abailoni/nifty).

    Parameters
    ----------
    graph : nifty.graph
        Instance of a graph, e.g. nifty.graph.UndirectedGraph, nifty.graph.undirectedLongRangeGridGraph or
        nifty.graph.rag.gridRag

    signed_edge_weights : numpy.array(float) with shape (nb_graph_edges, )
        Attractive weights are positive; repulsive weights are negative.

    linkage_criteria : str (default 'mean')
        Specifies the linkage criteria / update rule used during agglomeration.
        List of available criteria:
            - 'mean', 'average', 'avg'
            - 'max', 'single_linkage'
            - 'min', 'complete_linkage'
            - 'mutex_watershed', 'abs_max'
            - 'sum'
            - 'quantile', 'rank' keeps statistics in a histogram, with parameters:
                 * q : float (default 0.5 equivalent to the median)
                 * numberOfBins: int (default: 40)
            - 'generalized_mean', 'gmean' with parameters:
                 * p : float (default: 1.0)
                 * https://en.wikipedia.org/wiki/Generalized_mean
            - 'smooth_max', 'smax' with parameters:
                 * p : float (default: 0.0)
                 * https://en.wikipedia.org/wiki/Smooth_maximum

    add_cannot_link_constraints : bool

    edge_sizes : numpy.array(float) with shape (nb_graph_edges, )
        Depending on the linkage criteria, they can be used during the agglomeration to weight differently
        the edges (e.g. with sum or avg linkage criteria). Commonly used with regionAdjGraphs when edges
        represent boundaries of different length between segments / super-pixels. By default, all edges have
        the same weighting.

    is_mergeable_edge : numpy.array(bool) with shape (nb_graph_edges, )
        Specifies if an edge can be merged or not. Sometimes some edges represent direct-neighbor relations
        and others describe long-range connections. If a long-range connection /edge is assigned to
        `is_mergeable_edge = False`, then the two associated nodes are not merged until they become
        direct neighbors and they get connected in the image-plane. By default all edges are mergeable.

    use_efficient_implementations : bool (default: True)
        In the following special cases, alternative efficient implementations are used:
            - 'abs_max' criteria: Mutex Watershed (https://github.com/hci-unihd/mutex-watershed.git)
            - 'max' criteria without cannot-link constraints: maximum spanning tree

    verbose : bool (default: False)

    linkage_criteria_kwargs : dict
        Additional optional parameters passed to the chosen linkage criteria (see previous list)

    print_every : int (default: 100000)
        After how many agglomeration iteration to print in verbose mode

    Returns
    -------
    node_labels : numpy.array(uint) with shape (nb_graph_nodes, )
        Node labels representing the final clustering

    runtime : float
    """
    # Fast path: 'abs_max'/'mutex_watershed', and 'max' without constraints, have
    # specialized implementations in affogato (aff_segm).
    if use_efficient_implementations and \
            (linkage_criteria in ['mutex_watershed', 'abs_max'] or
             (linkage_criteria == 'max' and not add_cannot_link_constraints)):
        if is_mergeable_edge is not None:
            if not is_mergeable_edge.all():
                # The efficient implementations ignore is_mergeable_edge; warn instead of failing.
                print("WARNING: Efficient implementations only works when all edges are mergeable")
        # assert is_mergeable_edge.all(), "Efficient implementations only works when all edges are mergeable"
        # assert is_mergeable_edge is None, "Efficient implementations only works when all edges are mergeable"
        nb_nodes = graph.numberOfNodes
        uv_ids = graph.uvIds()
        # Negative signed weights act as repulsive ("mutex") edges.
        mutex_edges = signed_edge_weights < 0.

        tick = time.time()
        # These implementations use the convention where all edge weights are positive
        assert aff_segm is not None, "For the efficient implementation of GASP, affogato module is needed"
        if linkage_criteria in ['mutex_watershed', 'abs_max']:
            node_labels = aff_segm.compute_mws_clustering(
                nb_nodes,
                uv_ids[np.logical_not(mutex_edges)],
                uv_ids[mutex_edges],
                signed_edge_weights[np.logical_not(mutex_edges)],
                -signed_edge_weights[mutex_edges])
        else:
            node_labels = aff_segm.compute_single_linkage_clustering(
                nb_nodes,
                uv_ids[np.logical_not(mutex_edges)],
                uv_ids[mutex_edges],
                signed_edge_weights[np.logical_not(mutex_edges)],
                -signed_edge_weights[mutex_edges])
        runtime = time.time() - tick
    else:
        # General path: build a GASP cluster policy and run nifty's agglomerative clustering.
        cluster_policy = nifty_agglo.get_GASP_policy(
            graph, signed_edge_weights,
            edge_sizes=edge_sizes,
            linkage_criteria=linkage_criteria,
            linkage_criteria_kwargs=linkage_criteria_kwargs,
            add_cannot_link_constraints=add_cannot_link_constraints,
            is_mergeable_edge=is_mergeable_edge)
        agglomerativeClustering = nifty_agglo.agglomerativeClustering(cluster_policy)

        # Run clustering:
        tick = time.time()
        agglomerativeClustering.run(verbose=verbose, printNth=print_every)
        runtime = time.time() - tick

        # Collect results:
        node_labels = agglomerativeClustering.result()

    return node_labels, runtime
def runGreedyGraphEdgeContraction(graph,
                                  signed_edge_weights,
                                  linkage_criteria='mean',
                                  add_cannot_link_constraints=False,
                                  edge_sizes=None,
                                  node_sizes=None,
                                  is_merge_edge=None,
                                  size_regularizer=0.0,
                                  return_UCM=False,
                                  return_agglomeration_data=False,
                                  ignored_edge_weights=None,
                                  **run_kwargs):
    """
    Deprecated GASP-style greedy edge contraction.

    :param ignored_edge_weights: boolean array, if an edge label is True, than the passed signed weight
        is ignored (neither attractive nor repulsive)

    Returns node_labels and runtime. If return_UCM == True, then also returns the UCM and the merging
    iteration for every edge.
    """
    # NOTE(review): raising (not warning) makes everything below unreachable —
    # callers always get a DeprecationWarning exception. Presumably intentional
    # deprecation-by-exception; confirm before "fixing" to warnings.warn.
    raise DeprecationWarning("use version in GASP repo instead")
    # Legacy:
    if "update_rule" in run_kwargs:
        update_rule = run_kwargs.pop("update_rule")
    else:
        update_rule = linkage_criteria
    # Fast path: mutex-watershed / unconstrained max via affogato.
    if update_rule == 'mutex_watershed' or (update_rule == 'max' and not add_cannot_link_constraints):
        # if False:
        assert not return_UCM
        if is_merge_edge is not None:
            if not is_merge_edge.all():
                print(
                    "WARNING: Efficient implementations only works when all edges are mergeable"
                )
        # In this case we use the efficient MWS clustering implementation in affogato:
        nb_nodes = graph.numberOfNodes
        uv_ids = graph.uvIds()
        # Negative signed weights are treated as repulsive ("mutex") edges.
        mutex_edges = signed_edge_weights < 0.
        # if is_merge_edge is not None:
        #     # If we have edges labelled as lifted, they should all be repulsive in this implementation!
        #     if not is_merge_edge.min():
        #         assert all(is_merge_edge == np.logical_not(mutex_edges)), "Affogato MWS cannot enforce local merges!"

        tick = time.time()
        # This function will sort the edges in ascending order, so we transform all the edges to negative values
        if update_rule == 'mutex_watershed':
            nodeSeg = compute_mws_clustering(
                nb_nodes, uv_ids[np.logical_not(mutex_edges)],
                uv_ids[mutex_edges],
                signed_edge_weights[np.logical_not(mutex_edges)],
                -signed_edge_weights[mutex_edges])
        else:
            nodeSeg = compute_single_linkage_clustering(
                nb_nodes, uv_ids[np.logical_not(mutex_edges)],
                uv_ids[mutex_edges],
                signed_edge_weights[np.logical_not(mutex_edges)],
                -signed_edge_weights[mutex_edges])
        runtime = time.time() - tick
        out_dict = {'runtime': runtime}
        return nodeSeg, out_dict
    else:
        # FIXME: temporary fix for the sum rule
        # if update_rule == 'sum':
        #     signed_edge_weights *= edge_sizes
        cluster_policy = nagglo.get_GASP_policy(
            graph,
            signed_edge_weights,
            edge_sizes=edge_sizes,
            linkage_criteria=update_rule,
            linkage_criteria_kwargs=None,
            add_cannot_link_constraints=add_cannot_link_constraints,
            node_sizes=node_sizes,
            is_mergeable_edge=is_merge_edge,
            size_regularizer=size_regularizer,
        )
        agglomerativeClustering = nagglo.agglomerativeClustering(
            cluster_policy)
        out_dict = {}
        tick = time.time()
        if not return_UCM:
            agglomerativeClustering.run(**run_kwargs)
        else:
            # TODO: add run_kwargs with UCM
            outputs = agglomerativeClustering.runAndGetMergeTimesAndDendrogramHeight(
                verbose=False)
            mergeTimes, UCM = outputs
            out_dict['UCM'] = UCM
            out_dict['mergeTimes'] = mergeTimes
        runtime = time.time() - tick
        nodeSeg = agglomerativeClustering.result()
        out_dict['runtime'] = runtime
        if return_agglomeration_data:
            out_dict['agglomeration_data'], out_dict[
                'edge_data_contracted_graph'] = cluster_policy.exportAgglomerationData(
                )
        return nodeSeg, out_dict