Beispiel #1
0
async def get_vr_homology(data: VietorisRipsHomologyInput):
    points = np.array(data.points)
    N, dim = points.shape
    rips = cm.Rips()
    filt = rips.build(points)
    filt = [(simplex, value / 2) for simplex, value in filt]  # Make the indx to be the radius of circles
    filt_range = [min(filt, key=lambda x: x[1])[1], max(filt, key=lambda x: x[1])[1]]
    diagrams = cm.solver.phat_diagrams(filt, verbose=False)
    diagrams[0] = np.concatenate([diagrams[0], np.array([filt_range])])  # Append first connected component to compare with Cubix
    return {
        "filtration": {
            "range": filt_range,
            "simplices": [
                {
                    "value": value,
                    "points": points[simplex].tolist(),
                    "dimension": len(simplex) - 1,
                } for simplex, value in filt
            ],
        },
        "holes": [
            {
                "birth": birth,
                "death": death,
                "lifetime": death - birth,
                "dimension": dim,
            } for dim, simplices in enumerate(diagrams) for birth, death in simplices
        ],
    }
Beispiel #2
0
import logging
logging.basicConfig(level=logging.CRITICAL)

from ctk_cli import CLIArgumentParser


def main(args):

    feature_list = []


# Initialize a noisy circle
X = tadasets.dsphere(n=100, d=1, r=1, noise=0.2)
# Instantiate and build a rips filtration
rips = cm.Rips(1)  #Go up to 1D homology
rips.build(X)
dgmsrips = rips.diagrams()

plt.subplot(121)
plt.scatter(X[:, 0], X[:, 1])
plt.axis('square')
plt.title("Point Cloud")
plt.subplot(122)
plot_diagrams(dgmsrips)
plt.title("Rips Persistence Diagrams")
plt.tight_layout()
plt.show()

# data_test = np.random.random((100,2))
#data = im_label
Beispiel #3
0
    def build(self, **kwargs):
        '''
        Apply persistent homology using the combination of Cechmate and PHAT.

        On successful run, this function constructs:
            1. A list of dictionaries. Each dictionary corresponds to a 
                birth/death feature containing keys:
                    'pair', 'birth', 'death', 'H_i', 'generator_ptr'
                The ordering here has no significance outside of the internals 
                of the cechmate/PHAT algorithms.

            2. A collection of useful statistics in the same order for 
                visualization/access of top-level information. These are 
                flat numpy arrays for easy slicing/access without having to work 
                with dictionary/list logic. Available attributes:
                    self.births
                    self.deaths
                    self.H_i
                    self.generator_ptrs

            3. A collection of common orderings of the topological features
                based on the above information generated using by numpy.argsort.
                Available orderings:
                    self._persistence_order (death-birth; sorted from largest first)
                    self._birth_order       (sorted from smallest first)
                    self._death_order       (sorted from smallest first)

        Inputs: None; but you must instantiate the class with the data matrix first.

        Optional inputs:
            verbosity: controls amount of print statements. Currently only two levels; 
                0 : no print statements (default)
                1 : reports progress along pipeline.

        Outputs: None; but the above attributes are stored in the object.
        '''

        verbosity = kwargs.get('verbosity', 0)

        # this part loosely follows https://cechmate.scikit-tda.org/notebooks/BasicUsage.html
        rips = cechmate.Rips(maxdim=self.maxdim)

        if verbosity > 0: print('Building complex...')
        compl = rips.build(self.X)  # TODO: this is the second slowest part

        if verbosity > 0: print('ordering simplices...')
        ordered_simplices = sorted(compl, key=lambda x: (x[1], len(x[0])))

        # cast as numpy array for handy array slicing later
        o_s2 = np.array(ordered_simplices)

        #
        # TODO: This is the bottleneck right now in terms of speed!
        # It's written in python; if there's a C++ version sitting around it could
        # be sped up. The python code doesn't look too crazy...
        if verbosity > 0: print('Casting to sparse pivot column form...')
        columns = cechmate.solver._simplices_to_sparse_pivot_column(
            ordered_simplices)

        if verbosity > 0: print('Building boundary matrix...')
        b_m = phat.boundary_matrix(
            columns=columns,
            representation=phat.representations.sparse_pivot_column)

        if verbosity > 0: print('Computing persistence pairs...')
        pairs = b_m.compute_persistence_pairs(
        )  # boundary matrix gets reduced in-place here

        #
        # OK, here's the sketch of what we're doing
        # to get out generators:
        #
        # 1. Use some criterion to identify which birth/death pairs you want
        #    (e.g. lexsort by homological dimension, then lifetime)
        # 2. Identify the "pairs" in the associated table (from b_m.compute_persistence_pairs)
        # 3. Associate "pairs" (boundary matrix columns) with associated simplices
        #    by identifying nonzero entries (b_m.get_column(j)); these are indexes
        #    for ordered_simplices)
        # 4. Visualize/attach information however you like.
        #
        # REVISITED: pass on #1 until visualization/processing stage.
        # otherwise loosely following 2-4, but no visualization in this function.
        #

        pp = np.array(
            list(pairs))  # cast to numpy array just to get array slicing

        # Find homological dimension of each thing; following the lead of
        # cechmate.solver._process_distances().
        Hi = np.array([len(o_s2[ppi[0]][0]) - 1 for ppi in pp])

        # Pull out simplex information from the processed boundary matrix.
        if verbosity > 0: print('Identifying generators...')
        sparse_reduced_b_m = {}

        for j in range(b_m._matrix.get_num_cols()):
            thing = b_m._matrix.get_col(j)
            if len(thing) > 0:
                sparse_reduced_b_m[j] = np.array(thing, dtype=np.int64)
        #

        if verbosity > 0: print('Putting a bow on everything...')
        topo_features = []

        for ii, pair in enumerate(pp):
            idx = pair[1]
            birth = o_s2[pair[0]][1]
            death = o_s2[pair[1]][1]

            # don't bother with trivial features.
            if birth == death:
                continue
            #
            gen_simplices = o_s2[sparse_reduced_b_m[idx]][:, 0]

            # vertex indices in original ordering
            g_v = np.unique(np.concatenate(gen_simplices))

            topo_features.append({
                'pair': pair,
                'birth': birth,
                'death': death,
                'H_i': Hi[ii],
                'generator_ptr': g_v
            })
        #

        # numpy array just for slicing
        self.topo_features = np.array(topo_features)

        # store summary information in flat form for easier sorting/accessing by ptr.
        self.births = np.zeros(len(self.topo_features), dtype=float)
        self.deaths = np.zeros(len(self.topo_features), dtype=float)
        self.H_i = np.zeros(len(self.topo_features), dtype=int)

        generator_ptrs = []

        for j, d in enumerate(self.topo_features):
            self.births[j] = d['birth']
            self.deaths[j] = d['death']
            self.H_i[j] = d['H_i']
            generator_ptrs.append(d['generator_ptr'])
        #
        self.generator_ptrs = np.array(generator_ptrs)

        # create orderings for later use.
        self._persistence_order = np.argsort(self.births -
                                             self.deaths)  # largest first
        self._birth_order = np.argsort(self.births)  # smallest first
        self._death_order = np.argsort(self.deaths)  # smallest first

        if verbosity > 0: print('done.')
        return
        [-1,-1],
        [3,0],
        [0,2]
        ])
    radii = [2.5,1.5,1]
    return np.vstack([
        noisy_circle(n, ci[0], ci[1], eps=eps, r=ri) for ci,ri in zip(centers,radii)
    ])
#


X = noisy_circles(80, 3)
X = np.random.permutation(X)    # shuffle

# this part loosely follows https://cechmate.scikit-tda.org/notebooks/BasicUsage.html
rips = cechmate.Rips(maxdim=1)
compl = rips.build(X)   # this is the second slowest part
ordered_simplices = sorted(compl, key=lambda x: (x[1], len(x[0])))

# cast as numpy array for handy array slicing later
o_s2 = np.array(ordered_simplices)

#
# This is the bottleneck right now in terms of speed!
# It's written in python; if there's a C++ version sitting around it could
# be sped up. The python code doesn't look too crazy...
columns = cechmate.solver._simplices_to_sparse_pivot_column(ordered_simplices)

b_m = phat.boundary_matrix(columns=columns, representation=phat.representations.sparse_pivot_column)
pairs = b_m.compute_persistence_pairs() # boundary matrix gets reduced in-place here