Topological Data Analysis with Gudhi for Dynamical Systems, a tutorial
Author: Théo Lacombe, Université Gustave Eiffel
$\newcommand{\R}{\mathbb{R}}$ $\newcommand{\FF}{\mathcal{F}}$ $\newcommand{\XX}{\mathcal{X}}$ $\newcommand{\Z}{\mathbb{Z}}$ $\newcommand{\dgm}{\mathrm{dgm}}$ $\newcommand{\Cech}{\text{\v Cech}}$
Outline :
- I. Introduction
- II. Topological Data Analysis (TDA)
- A brief overview of mathematical foundations of TDA
- A brief overview of algorithmic foundations of TDA
- Persistent Homology for time series and dynamical systems
- Vectorization of topological descriptors
- Topological Optimization
- III. Gudhi
- Overall presentation of Gudhi
- The SimplexTree interface
- Extracting persistence diagrams
- Topological Optimization with Gudhi
- Contributing to Gudhi
- IV. Your turn: experiment TDA on Time Series
- V. To go further: some questions before the MRC.
I. Introduction¶
This notebook provides an introduction to Topological Data Analysis from the practitioner's side: our ultimate goal is to make you ready to implement the creative ideas you will develop before, during and after the MRC-week.
$\bullet$ Section II. introduces Topological Data Analysis (TDA). It does not pretend to be comprehensive, but hopefully gives you the right tools to address some of the questions that will be asked during the MRC. Participants already knowledgeable about TDA can skip some subsections therein (a priori, they go in increasing order of technicality: Section II.1 is very standard and "well-known" among TDA practitioners, while II.5 relies on very recent research!). Note that it does not pretend to be beyond reproach in terms of mathematical rigor; the goal is essentially to set up your intuition. Understanding all the details requires reading papers/books/lecture notes, which is worth it, but would make this (already long) tutorial way too long!
$\bullet$ Section III. presents the TDA library Gudhi
. Here as well, we do not present all the functionalities provided by this library, but rather insist on the features that should be useful for the program. Of course, feel free to explore the other options provided by the library by yourself!
$\bullet$ Section IV. is an illustration of the use of TDA + Gudhi
in the context of time series and dynamical systems. This is inspired from a presentation of Mathieu Carrière.
$\bullet$ Section V. proposes some open questions that you may start thinking about before the program.
We will work using Python
.
Why? The main reason is that the TDA library we will use (namely, Gudhi
, but this holds for many other TDA libraries) provides a C++
and a Python
interface. While C++
is a nice and efficient language, it is not as "plug-and-play" as Python
is. Furthermore, many (recent) functionalities in Gudhi
have only been implemented in Python
(it is interesting to note that the core machinery is implemented in C++
though). As we plan to make use of them, Python
turns out to be the natural choice for a dynamic and interactive research program!
The second natural question is then: why Gudhi
?
First and foremost, this is the library the author of this notebook is familiar with (being the developer of some tools proposed therein). This is an open-source project mostly led by the Datashape team, but be aware that you can contribute to Gudhi by creating a pull request (PR)--details on how to contribute will be provided at the end of section III. PRs should satisfy some constraints (be well documented, include tests, etc.) and are then reviewed by the editorial board of Gudhi, modified accordingly, and eventually merged (accepted) to be incorporated in the next release. Having contributions to an open-source library is a valuable asset when applying to academic or industrial positions!
Another good reason to use Gudhi
is that, being actively developed by a team of researchers deeply involved in Topological Data Analysis, the library provides some unique modern tools, including tools related to Topological Optimization.
Setup: To make sure that everything works as expected, we suggest that you use the same environment
as the one used to develop this tutorial.
To do so, hopefully you may just need to run
conda env create -f tda_tutorial.yml
from a terminal.
In any case, you should be able to run the following cells without error.
%matplotlib inline
%load_ext autoreload
%autoreload 2
import numpy as np
import matplotlib.pyplot as plt
import gudhi as gd
from gudhi.tensorflow import RipsLayer
import tensorflow as tf
from tqdm.notebook import tqdm
import utils as u
print("Version of Gudhi you are using: (should be at least 3.8.0): %s" %gd.__version__)
print("Version of tensorflow (should be at least 2.4): %s " %tf.__version__)
Version of Gudhi you are using: (should be at least 3.8.0): 3.8.0 Version of tensorflow: 2.13.0
Note also that the figures and some handy functions are implemented in the companion file utils.py
. You do not need to check this file to run the notebook, but this can be instructive in some situations! Beware, it is not very well documented.
A convenient aspect is that, since the figures are generated on the fly, the tutorial remains fairly light.
Some exercises: The tutorial naturally contains a few exercises here and there. If you are unsure about your answer and really want to check if your understanding is correct, you can send an email to theo.lacombe@univ-eiffel.fr
.
Some references: Though the TDA literature is evolving quite fast, if you want to go further and learn more generally about TDA, you may be interested in looking at the following papers/books (and many other):
- An Introduction to Topological Data Analysis: Fundamental and Practical Aspects for Data Scientists, Chazal and Michel.
- A roadmap for the computation of persistent homology, Otter et al.
- Computational Topology: an Introduction, Edelsbrunner and Harer (based on these lecture notes, which can be interesting in themselves.).
From the computational / implementation perspective, the (Python
) documentation of Gudhi
can be found here. Many very nice tutorials for Gudhi are available here. Let us also mention a very nice overview of TDA libraries (and smaller github repositories) here.
II. Topological Data Analysis¶
1. A brief overview of mathematical foundations of TDA¶
We present in this subsection Topological Data Analysis (TDA) under the lens of (one-dimensional parameter) persistent homology from a (mild) theoretical perspective.
Topology: Let us first (very) briefly explain what we mean by topology. In a nutshell, the topology of an object (you can typically think of a submanifold of $\R^d$) is a description of its properties that are preserved by homotopy: loosely speaking, two objects (shapes) $X$ and $Y$ are homotopic if one can go from $X$ to $Y$ without self-intersecting the shape, nor collapsing the shape.
Note: we will often consider the words "space", "object" or "shape" interchangeably.
# Run the following cell to have an illustration
u.showcase_homotopy()
Among the properties preserved by homotopic transformations, there are homology groups. In a nutshell, for a given space $X$,
- The homology group of "dimension 0", denoted by $H_0(X)$ (or $H_0$ if there is no ambiguity), accounts for connected components,
- The homology group $H_1$ of "dimension 1" accounts for loops,
- $H_2$ accounts for cavities,
- and so on for higher dimensional homology groups, even though visualizing them is harder.
To give you a bit more intuition, it is important to note that topological features (connected components, loops, cavities...) are accounted for up to boundaries, that is, we consider that two features (e.g. two loops) are equivalent if they are the boundary of a same face. For instance, the two "loops" that delimit a cylinder $S^1 \times [0,1]$ (where $S^1$ denotes the unit circle in $\R^2$) are the boundary of a same face and are thus equivalent. In particular, loops that are the boundary of some subset of $X$ are "trivial". For instance, the boundary of a disk is trivial. This is how you formalize that, even though you can draw many loops on the surface of a sphere, they are all trivial: there is no "meaningful" loop on a sphere (but there is a cavity! which itself disappears if you consider a ball instead of a sphere).
Without going deep into the details, homology groups often turn out to be encoded as finite dimensional vector spaces over a finite field, that is $H_k = \left(\frac{\Z}{p\Z}\right)^{\beta_k}$, with $p$ prime. The integer $\beta_k$ is called the $k$-th Betti number of $X$, and it simply counts the number of aforementioned topological features of your object $X$.
For instance,
- if $X$ is a circle in $\R^2$, one has $\beta_0 = 1$ (one connected component) and $\beta_1 = 1$ (one loop), higher-order $\beta_k$ equal $0$.
- if $X$ is a cylinder in $\R^3$, one has $\beta_0 = 1,\beta_1 = 1,\beta_{k \geq 2} = 0$.
- if $X$ is a sphere in $\R^3$, one has $\beta_0 = 1$, $\beta_1 =0$, and $\beta_2 = 1$ (one cavity); with higher order $\beta_k$ being $0$.
Exercise: Following your intuition, what should be the Betti numbers of
- A torus,
- A cube (not filled-in, i.e. the boundary of $[0,1]^3$).
- The edge of a cube (the boundary of the previous shape).
In an extremely large number of applications though, we never observe true shapes $X$, but rather points $X_n := x_1,\dots,x_n$ sampled on $X$ (typically as realizations of a stochastic process, or some discretization procedure, etc.). Assuming $n$ is large, $X_n$ "looks like" $X$. However, from a topological perspective, the Betti numbers of $X_n$ are always as simple as $\beta_0 = n, \beta_{k \geq 1} = 0$...
u.showcase_point_cloud_trivial_homology()
Therefore, if we want to estimate the topology of $X$ from a sample $X_n$ on $X$, we must resort to more sophisticated tools...
This is where Topological Data Analysis, by means of Persistent Homology, strikes!
Filtrations: The starting point is to consider a function $$f : \XX \to \R,$$ where $\XX$ is a topological space (typically $\R^d$ or a sub-manifold of $\R^d$). This function is called a filtration, because it can be used to somewhat "investigate" the space $\XX$ at different scales. We do so by looking at the sublevel sets of $f$, defined for $t \in \R$ as: $$\FF_t = \{ x \in \XX, f(x) \leq t\}.$$
It is easy to check that $s \leq t \Rightarrow \FF_s \subset \FF_t$.
# Showcase the sublevelset of $f$. You can play with the value of "parameter".
# (keep it > 0 for plotting purposes)
u.showcase_sublevel_sets(parameter = 0.8)
A very common situation in TDA is to consider the so-called $\text{\v Cech}$ filtration: consider a finite point cloud $(x_1,\dots,x_n) =: X_n \subset \R^d$. One can define a function $f : \R^d \to \R$ as
$$f(x) = \min_{i = 1,\dots,n} \|x - x_i\|,$$that is $f(x)$ indicates the distance from $x$ to the point cloud $X_n$. Note that here, $\XX = \R^d$.
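For concreteness, here is a minimal numpy sketch of this distance-to-the-point-cloud function (the point cloud, the grid and the threshold are made up for illustration):
import numpy as np
# A made-up point cloud X_n in R^2.
X_n = np.array([[0., 0.], [1., 0.], [0., 1.]])
def cech_filtration_value(x, points):
    """f(x) = distance from x to the point cloud (minimum over the sample points)."""
    return np.min(np.linalg.norm(points - x, axis=1))
# Probing the sublevel set F_t = {x : f(x) <= t} on a grid.
t = 0.6
xs = np.linspace(-1., 2., 50)
grid = np.array([[a, b] for a in xs for b in xs])
in_sublevel = np.array([cech_filtration_value(p, X_n) <= t for p in grid])
print("Fraction of grid points in the sublevel set:", in_sublevel.mean())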
Exercise: How to describe (geometrically) the sublevel set of $f$ for the $\Cech$ filtration?
This filtration is very useful in applications because you can prove, loosely speaking, results like
Assume that $x_1,\dots,x_n$ are iid samples on an underlying (typically unknown) shape $X \subset \R^d$ (sampled from some "nice" density, say the uniform one). Then, provided $n$ is large enough, there exists some well-chosen parameter $t$ such that the homology of $\FF_t$ coincides with that of $X$ (with high probability, say).
# Illustration of the Cech sublevel set and the above (informal) theorem.
# Unless you've been very unlucky with your sampling, the homology of the Cech
# sublevelset (lightblue area) should be the same as the one of the underlying shape X
# that is, a circle --> one connected component and one non-trivial loop.
u.showcase_Cech_sublevelset(parameter=0.2)
# You can play with the parameter: if it's too low, you will not see the loop (and you may even have more than one
# connected component); if it's too large, the loop structure will be killed (filled in), and your sublevel set
# will have the homology of a disk (that is, of a point).
The issue with this kind of results is that when $X$ is unknown, choosing a good $t$ is absolutely non-trivial (those interested can read this paper for instance).
The paradigm used in TDA is somewhat simpler: look at all $t \in (-\infty, + \infty)$, and see how the homology groups evolve when $t$ increases!
A core result in TDA, known as the interval decomposition theorem, is that under very soft assumptions on $f$ (typically satisfied for the $\text{\v Cech}$ filtration), there is only a finite number of values of $t$ for which the homology groups change. They correspond either to
- values $t_b$ at which a new topological feature appears in $(\FF_t)_t$, called birth time.
- values $t_d$ at which an existing topological feature disappears (e.g. a loop gets filled in), called death time.
u.showcase_birth_death()
Therefore, the final pipeline reads like this: let $t$ increase from $-\infty$ to $+\infty$ (note: for the $\text{\v Cech}$ filtration, nothing interesting occurs for $t <0$ as $\FF_t = \emptyset$), and record each birth time $t_{b_i}$ at which the $i$-th topological feature (for some homological dimension) appears in $(\FF_t)_t$ and the corresponding death time $t_{d_i} > t_{b_i}$ at which this feature disappears (if this never occurs, we set $t_{d_i} = +\infty$).
The resulting collection of intervals $(t_{b_i}, t_{d_i})_i$ is called the persistence diagram or persistence barcode of $f : \XX \to \R$ (note: in the context of the $\text{\v Cech}$ filtration, we slightly abuse the terminology and call the resulting object "the diagram of $X_n$"). It will be denoted by $\dgm(f)$ (or $\dgm(X_n)$).
They can be visualized either by plotting bars representing the intervals (barcode representation) or simply by representing each interval as a point in $\R^2$ (note: since the death time is larger than the birth time, points are actually supported on the open half-plane $\{(b,d),\ d > b\}$ above the diagonal $\{b=d\}$).
u.showcase_barcode_and_dgm()
# There is a visual artefact which makes the cavity (2-dimensional homological feature) in the Torus hard to see
# in the barcode representation.
# The Persistence Diagram representation should often be preferred.
What is really nice with persistence diagrams/barcodes is that they are quantitative topological descriptors: the longer the bar $(t_{b_i}, t_{d_i})$ (or the further away the point from the diagonal), the longer the topological feature persisted through the different scales ("robust" features), while short bars/points close to the diagonal typically account for "noise", in the sense that slightly perturbing $f$ (or $X_n$) could make them disappear.
From these observations, we can define some sorts of metrics in TDA, often referred to as Wasserstein distances between persistence diagrams, denoted by $W$ in the following. A central type of results in TDA are stability theorems which (here again, very roughly) state that
If $f, g : \XX \to \R$ are close (for, say, the sup-norm), then $$ W(\dgm(f),\dgm(g)) \leq \| f - g\|_\infty. $$
In plain text:
Similar shapes/spaces/objects shall have similar persistence diagrams.
If $f,g$ are distance functions with respect to two point clouds $X$ and $X'$, then $\|f - g\|_\infty$ becomes the so-called Hausdorff distance between $X$ and $X'$ (Exercise: Prove this claim).
In particular, if one adds a small perturbation to a point cloud $X$ (e.g. small Gaussian noise), the corresponding persistence diagrams should be close to each other in terms of $W$, which intuitively means that
- Points far from the diagonal are only slightly moved: robust topological features (those that persist through scales) are stable,
- There may be some change close to the diagonal (noise can easily create or destroy "small" topological features).
u.showcase_tda_stability()
That's it for the theoretical prerequisites!
2. A brief overview of computational foundations of TDA¶
While everything developed in the previous section makes perfect sense from a theoretical perspective, a crucial question for the practitioner is
How do we compute the aforementioned intervals in practice?
For the sake of simplicity, we will focus on the case of the $\Cech$ filtration, though the idea developed in this section can be generalized.
Simplicial complexes: A simplicial complex is a combinatorial object that generalizes graphs. While graphs are made of vertices and edges (that are pairs of vertices), simplicial complexes allow for higher order interactions: given a set of vertices $V = \{v_1,\dots,v_m\}$, a simplicial complex $S$ on $V$ is formally a subset of $2^V$ such that if a simplex $(v_{i_1}, \dots, v_{i_k})$ belongs to $S$, then all its faces $(v_{i_1},\dots, \neg v_{i_j}, \dots, v_{i_k})$ belong to $S$ as well (this notation meaning that the vertex $v_{i_j}$ has been removed).
Concretely, a face $(a,b,c)$ can belong to a simplicial complex only if the edges $(a,b), (b,c), (c,a)$ already belong to the simplicial complex, just as an edge $(a,b)$ can belong to the complex (or to a graph) only if the vertices $a$ and $b$ belong to the complex as well. A simplex $\{v_{i_0},\dots,v_{i_k}\}$ is said to be of dimension $k$ (vertices are of dimension $0$, edges of dimension $1$, triangles of dimension $2$, and so on). The dimension of a complex is the highest dimension of its simplices.
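To make this combinatorial definition concrete, here is a small Python sketch (the complex is made up for illustration; it is the "triangle plus an extra edge" example used again below) that encodes a complex as a set of frozensets and checks the closure-under-faces condition:
from itertools import combinations
# A made-up complex: the filled triangle {a, b, c} plus an extra edge {a, d}.
S = {frozenset(s) for s in [("a",), ("b",), ("c",), ("d",),
                            ("a", "b"), ("a", "c"), ("b", "c"), ("a", "d"),
                            ("a", "b", "c")]}
def is_simplicial_complex(S):
    """Check the closure condition: every proper face of every simplex is in S."""
    return all(frozenset(face) in S
               for sigma in S
               for k in range(1, len(sigma))
               for face in combinations(sigma, k))
print(is_simplicial_complex(S))                              # True
print(is_simplicial_complex(S - {frozenset(("a", "b"))}))    # False: the triangle lost an edge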
# Generate a 2 dimensional simplicial complex. As the vertices are located randomly, the result may not be very beautiful in some instances
# do not hesitate to run it several times.
u.showcase_simplicial_complex()
Because they are combinatorial objects, simplicial complexes can easily be encoded and represented on a computer using a boundary matrix. Namely, let $V = \{v_0,\dots,v_m\}$ denote a set of vertices, and $S \subset 2^V$ be a simplicial complex with $N = \# S$ simplices, labeled as $\sigma_1,\dots,\sigma_N$. Consider the $N \times N$ matrix $M$ defined as $M_{ij} = 1$ if $\sigma_i$ is a codimension-1 face of $\sigma_j$ (that is, $\sigma_i$ appears in the boundary of $\sigma_j$), and $0$ otherwise.
Note that the boundary of a vertex is $0$ (its column is empty), and conversely, top-dimensional simplices of $S$ do not appear in the boundary of any simplex (their rows are empty).
For instance, $S = ( \{a\},\{b\},\{c\}, \{d\}, \{a,b\},\{a,c\},\{b,c\}, \{a,d\}, \{a,b,c\} )$ is a simplicial complex representing a (filled) triangle plus one additional edge, and its boundary matrix is given by
$$ \begin{pmatrix} 0 & 0 & 0 & 0 & 1 & 1 & 0 & 1 & 0 \\ 0 & 0 & 0 & 0 & 1 & 0 & 1 & 0 & 0 \\ 0 & 0 & 0 & 0 & 0 & 1 & 1 & 0 & 0 \\ 0 & 0 & 0 & 0 & 0 & 0 & 0 & 1 & 0 \\ 0 & 0 & 0 & 0 & 0 & 0 & 0 & 0 & 1 \\ 0 & 0 & 0 & 0 & 0 & 0 & 0 & 0 & 1 \\ 0 & 0 & 0 & 0 & 0 & 0 & 0 & 0 & 1 \\ 0 & 0 & 0 & 0 & 0 & 0 & 0 & 0 & 0 \\ 0 & 0 & 0 & 0 & 0 & 0 & 0 & 0 & 0 \end{pmatrix} $$Naturally, this kind of matrix is often very sparse, and is thus represented as such to significantly improve the memory footprint and the running time of any further algorithm.
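As a sanity check, here is a small sketch that rebuilds this boundary matrix from the list of simplices; it uses a dense numpy array for readability, while a real implementation would use a sparse representation as mentioned above.
import numpy as np
# Simplices of S, ordered as in the matrix above: vertices, then edges, then the triangle.
simplices = [("a",), ("b",), ("c",), ("d",),
             ("a", "b"), ("a", "c"), ("b", "c"), ("a", "d"),
             ("a", "b", "c")]
def boundary_matrix(simplices):
    """M[i, j] = 1 if simplex i is a codimension-1 face of simplex j, 0 otherwise."""
    N = len(simplices)
    M = np.zeros((N, N), dtype=int)
    for j, sigma in enumerate(simplices):
        for i, tau in enumerate(simplices):
            if len(tau) == len(sigma) - 1 and set(tau) <= set(sigma):
                M[i, j] = 1
    return M
print(boundary_matrix(simplices))  # should reproduce the matrix displayed above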
Filtration over simplicial complexes: Let us now connect this notion of simplicial complexes to the "theoretical" notion of filtration introduced in the previous section. The idea is simple: given a simplicial complex $S$ and a map $f : S \to \R$, we say that $f$ is a filtration over $S$ if for every $\sigma \in S$ and every face $\sigma' \subseteq \sigma$, we have $f(\sigma) \geq f(\sigma')$.
In plain text, this means that the value $f$ assigns to a $k$-simplex should be at least as large as the values assigned to all its faces (and so on). From this, we obtain an increasing sequence of simplicial complexes defined for $t \in \R$ as $S_t = \{ \sigma \in S,\ f(\sigma) \leq t\}$.
u.showcase_simplicial_filtration()
$\Cech$ complexes: There are many different ways to build simplicial filtrations over a given simplicial complex $S \subset 2^V$. For instance, if we are only given a map $f : V \to \R$ (the map only gives values on vertices), we may define a filtration $\hat{f}$ over $S$ as $\hat{f}(\sigma) = f(\sigma)$ if $\sigma$ is a vertex, and $\hat{f}(\sigma) = \max_{\sigma' \in \sigma} \hat{f}(\sigma')$ otherwise. That is, we insert a simplex $\sigma$ when all its faces have been inserted. This filtration is called the lower-star filtration.
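As a tiny illustration (with made-up vertex values on the toy complex from above), the lower-star rule reads:
# Made-up values on the vertices of the toy complex used above.
f_vertex = {"a": 0.0, "b": 1.0, "c": 2.0, "d": 0.5}
def lower_star_value(sigma, f_vertex):
    """Lower-star filtration: a simplex enters when its last vertex does."""
    return max(f_vertex[v] for v in sigma)
for sigma in [("a",), ("a", "b"), ("a", "b", "c"), ("a", "d")]:
    print(sigma, "->", lower_star_value(sigma, f_vertex))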
Now, let us talk about the $\Cech$ simplicial filtration.
Consider a set of points $x_1,\dots,x_n \in \R^d$. Set $V = \{x_1,\dots,x_n\}$ and let $S = 2^V$ be your complex (yes, we consider all possible simplices in $S$). Now, define the filtration $f$ as $$f(\sigma) = \min \left\{ t,\ \bigcap_{x_i \in \sigma} B(x_i,t) \neq \emptyset \right\}$$ where $B(x_i, t)$ denotes the (Euclidean) ball centered at $x_i$ of radius $t$.
In plain text: a simplex $(x_{i_0},\dots,x_{i_k})$ is inserted at the first time/radius $t$ where all the balls of radius $t$ centered on the $x_{i_j}$ have a common intersection. Note in particular that $f(x_i) = 0$ for $i=1,\dots,n$, and $f(\{x_i, x_j\}) = \frac{1}{2} \|x_i - x_j\|$.
u.showcase_cech_simplicial_filtration()
A very nice result that legitimates this definition is the following, known as the Nerve theorem:
Let $\XX = \R^d$, and $X = \{x_1,\dots,x_n\} \subset \R^d$ be a point cloud. Let $\FF_t$ be the sublevel set of the $\Cech$ filtration as defined in Section II.1 (the lightblue set in the previous figure), and $S_t$ be the (geometric realization of) the $\Cech$ simplicial complex as defined above. Then, the homology of $\FF_t$ and that of $S_t$ coincide. The same result holds for the persistence diagrams of $(\FF_t)_t$ and $(S_t)_t$.
So basically, you can compute the topological features of the union of balls from the corresponding combinatorial object (that can be represented through a boundary matrix) with your computer :-) !
Rips complex: An issue with the $\Cech$ complex in practice is that checking whether $\bigcap_{x_i} B(x_i,t) \neq \emptyset$ becomes computationally expensive in high dimension. A workaround is to consider a slightly modified filtration, called the (Vietoris-)Rips filtration, where we set $f(\sigma) = 0$ if $\sigma$ is a vertex, and otherwise
$$f(\sigma) = \min \left\{t,\ \forall x_i, x_j \in \sigma,\ \frac{1}{2} \|x_i - x_j\| \leq t \right\}.$$So namely, a simplex is inserted as soon as all its vertices are pairwise at distance at most $2t$ (with the $\frac{1}{2}$ convention used here). In particular, there cannot be "empty triangles" in a Rips filtration: when three edges form a triangle, the corresponding face is immediately inserted, instantly killing the newly formed loop.
Checking whether a simplex $\sigma$ belongs to $S_t$ is much simpler than for the $\Cech$ simplicial filtration as it only depends on the pairwise distances between the points. Interestingly, this means that we can use the Rips filtration on much more sophisticated situations, where for instance we may consider other types of geometry than the Euclidean distance, such as the geodesic distance along a shape as done in this paper.
Note: in some cases, the definition of the Rips filtration does not introduce the $\frac{1}{2}$; of course this does not change the concept (it may just rescale the birth time and death time of the topological features).
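To make the rule explicit, here is a minimal numpy sketch (with a made-up triangle) of the Rips filtration value of a simplex, following the $\frac{1}{2}$ convention used above:
import numpy as np
def rips_value(simplex, X):
    """Rips filtration value (with the 1/2 convention): half the diameter of the simplex."""
    pts = X[list(simplex)]
    if len(pts) == 1:
        return 0.0
    return 0.5 * max(np.linalg.norm(p - q) for p in pts for q in pts)
# A made-up triangle: the 2-simplex enters as soon as its longest edge does,
# so the loop formed by the three edges is killed immediately.
X = np.array([[0., 0.], [2., 0.], [1., 2.]])
print(rips_value((0,), X))        # 0.0
print(rips_value((0, 1), X))      # 1.0  (half of the edge length)
print(rips_value((0, 1, 2), X))   # half of the longest edge length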
# A short illustration for the Rips filtration. The top-left Figure shows the difference with the Cech filtration:
# even though the three balls do not intersect all together, the face (triangle) is introduced as soon as they pairwise intersect.
u.showcase_rips_simplicial_filtration()
From an algorithmic perspective, computing the persistence diagram of a simplicial filtration (Rips, $\Cech$, lower-star, or any filtration $(S_t)_t$ of a complex $S$ induced by a function $f$) essentially boils down to reducing the boundary matrix, where it is important to order the simplices with respect to their filtration values: the columns and rows of the matrix correspond to simplices $\sigma_1,\dots,\sigma_N$ (where $N = \# S$) indexed such that $f(\sigma_1) \leq f(\sigma_2) \leq \dots \leq f(\sigma_N)$. Observe that this implies that the boundary matrix of $S$ is upper triangular. Furthermore, the reduction must be performed "from left to right". The matrix reduction gives you, for each topological feature, its birth and death times (the filtration values at which the simplices creating/destroying the feature are introduced) and the corresponding simplices, called the critical pair of the topological feature. For instance, a $1$-dimensional homological feature (loop) detected in the filtration will be represented by a pair $(\sigma_i,\sigma_j)$ where $\sigma_i$ must be an edge (the one creating the loop) and $\sigma_j$ a triangle (the one completely filling the loop), and the persistence diagram (or barcode) will store the interval $(f(\sigma_i),f(\sigma_j))$ during which the feature persisted.
We refer to these lecture notes for details.
Note 1: While matrix reduction has a theoretical (worst-case) complexity of order $\mathcal{O}(N^3)$, the sparsity of the matrix makes the algorithm typically run in $\mathcal{O}(N)$ in practice. Beware that $N$ is the number of simplices in your complex, so this can be quite high!
Note 2: Homology groups of dimension $d$ (e.g. $d=1$, loops) only depend on simplices of dimension up to $d+1$ (e.g. triangles). If you are only interested in low dimensional homology groups, you should simply ignore higher dimensional simplices, that will save you a lot of running time!
Note 3: In practice, the boundary matrix is considered to have coefficients in the field $\frac{\Z}{p\Z}$ for $p$ prime (this is a byproduct of how you define homology groups). However, the choice of $p$ seems to have a limited impact according to this paper.
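To make the reduction concrete, here is a naive, unoptimized sketch of the standard left-to-right column reduction over $\Z/2\Z$, applied to the "triangle plus an extra edge" example above (a real implementation, like the one in Gudhi, works on sparse columns and is much more efficient):
import numpy as np
def reduce_boundary_matrix(M):
    """Naive left-to-right column reduction over Z/2Z.
    Returns the critical pairs (i, j): column j kills the feature created by row i."""
    M = M.copy() % 2
    low_to_col = {}   # lowest non-zero row index -> column that "owns" it
    pairs = []
    for j in range(M.shape[1]):
        while M[:, j].any():
            i = np.nonzero(M[:, j])[0].max()   # lowest non-zero entry of column j
            if i not in low_to_col:
                low_to_col[i] = j
                pairs.append((i, j))
                break
            M[:, j] = (M[:, j] + M[:, low_to_col[i]]) % 2
    return pairs
# Boundary matrix of the "triangle + extra edge" example
# (simplices ordered as a, b, c, d, ab, ac, bc, ad, abc).
M = np.array([[0, 0, 0, 0, 1, 1, 0, 1, 0],
              [0, 0, 0, 0, 1, 0, 1, 0, 0],
              [0, 0, 0, 0, 0, 1, 1, 0, 0],
              [0, 0, 0, 0, 0, 0, 0, 1, 0],
              [0, 0, 0, 0, 0, 0, 0, 0, 1],
              [0, 0, 0, 0, 0, 0, 0, 0, 1],
              [0, 0, 0, 0, 0, 0, 0, 0, 1],
              [0, 0, 0, 0, 0, 0, 0, 0, 0],
              [0, 0, 0, 0, 0, 0, 0, 0, 0]])
print(reduce_boundary_matrix(M))
# [(1, 4), (2, 5), (3, 7), (6, 8)]: e.g. (6, 8) is the loop created by the edge bc
# (index 6) and killed by the triangle abc (index 8); the vertex a (index 0) is never
# paired, which corresponds to the connected component that never dies.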
Summary:
- Simplicial complexes are combinatorial objects that can be thought of as generalizations of graphs.
- They can be used to represent geometric objects embedded in $\R^d$.
- There exists a natural notion of filtration for simplicial complexes.
- The $\Cech$ filtration of topological spaces admits a combinatorial counterpart in the context of simplicial complexes. These two notions coincide in terms of homology groups.
- The $\Cech$ simplicial filtration being quite hard to compute, it is often replaced by the Rips filtration.
- In any case, given $S$ and $f$, computing the persistence diagram of the increasing sequence of simplicial complexes $(S_t)_t$ boils down to performing a matrix reduction algorithm.
3. Persistent Homology for time series and dynamical systems¶
We have spent a significant amount of time explaining how to extract topological information from point clouds, using the $\Cech$ or the (Vietoris-)Rips filtration. What about time series and dynamical systems?
Here, we will consider a function $s : \R \to \R^d$ that we access through a finite sample $s_t,\ t = 0,1, \dots, T$, typically $s_t = s(t * \omega)$ for some $\omega > 0$.
First, let us stress that there could be many different ways to apply TDA and persistent homology to dynamical systems, as long as you find a way to build a filtration from your observations $(s_t)_{t=1,\dots,T}$. We present here a common approach used in TDA that leverages the notions we have just introduced: the sliding window or time delay embedding (tde).
Say for simplicity that $s_t \in \R$ (1D signal). The $k$-tde of $(s_t)_t$ is the $k$-dimensional point cloud made of the points $x_i = (s_i, s_{i+1}, \dots, s_{i+k-1})$ for $i = 0, \dots, T-k+1$.
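A minimal numpy sketch of this embedding (with a made-up noisy periodic signal) could look as follows; the resulting point cloud can then be fed to a Rips filtration as in the previous subsections.
import numpy as np
def time_delay_embedding(s, k):
    """k-dimensional sliding-window embedding of a 1D signal: x_i = (s_i, ..., s_{i+k-1})."""
    s = np.asarray(s)
    return np.stack([s[i:i + k] for i in range(len(s) - k + 1)])
# A made-up (noisy) periodic signal: its embedding traces a cycle in R^k.
t = np.linspace(0, 4 * np.pi, 200)
signal = np.sin(t) + 0.05 * np.random.randn(len(t))
X = time_delay_embedding(signal, k=3)
print(X.shape)  # (198, 3)
# One could then feed X to gd.RipsComplex(points=X) and look for a prominent 1-dimensional feature.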
u.showcase_time_delay_embedding()
What motivates this approach is the following idea: $s$ may exhibit some underlying periodicity up to a time-reparametrization, namely $s(t) = f(\varphi(t))$ with $f$ periodic and $\varphi$ increasing; for instance $t \mapsto \sin(e^t)$. Intuitively, (even local) periodicity translates into cycles in the sliding window embedding; cycles that can be detected as $1$-dimensional topological features in the corresponding persistence diagram! You can look at this paper to learn more if you are interested.
And quite interestingly as well, a small noise in the recordings $s_t$ will be reflected as a small perturbation of the points in the sliding window embedding, hence (by the stability results of Section II.1) as a small perturbation of the resulting persistence diagram.
u.showcase_sw_periodicity(noise_level=1.)
The figure above attempts to summarize these ideas: we plot a signal $s : \R \to \R$ that is somewhat ("locally") periodic in $[0,1]$, while it is (locally) periodic up to a reparametrization in $[1,2]$, and overall we added a (small) Gaussian noise (so that it is actually only "almost" periodic on the two intervals).
The tde exhibits two cycles that are reflected in the persistence diagram on the right (unless you have been quite unlucky with the random noise_level, in which case you can set it to 0). You can also try increasing it, and see that it becomes harder to detect the cycles.
4. Vectorization of topological descriptors¶
Persistence diagrams (PDs) are interesting in themselves as quantitative interpretable topological descriptors. However, incorporating them in downstream tasks is not trivial for one major reason: the space of persistence diagrams $\mathcal{D}$ is not a finite-dimensional vector space, a prerequisite of many machine learning algorithms (think of linear regressions, $k$-means, etc.).
A simple yet useful workaround is simply to vectorize diagrams, that is, to design a map $\varphi$ that takes a diagram as input and returns a vector in $\R^d$. Of course, the vectorization should preserve as much as possible the intrinsic geometry of persistence diagrams, that is, we expect that $$W(\mu,\nu) \simeq \|\varphi(\mu) - \varphi(\nu)\|_2$$ for two persistence diagrams $\mu,\nu$ compared using the Wasserstein distance between persistence diagrams $W$ (see Section II.1). Having a perfect isometry is known to be hopeless, but one can still have Lipschitz relations (with some limitations on the Lipschitz constant). Among popular vectorizations, we may mention
- Persistence images, which (roughly speaking) put a Gaussian distribution on each point in the diagram weighted with respect to its distance to the diagonal, then discretizing it using a grid (hence turning a diagram into an image).
- Persistence landscapes and silhouette, which (roughly speaking as well) put a triangle function on each point in the diagram and then take a sort of average (for the silhouette).
Note that a similar approach is provided by kernel methods; we refer the interested reader to this paper for further information.
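To build intuition before using Gudhi's implementation in Section III.3, here is a naive hand-rolled sketch of the persistence-image idea; the diagram, the weight (simply the persistence $d - b$) and the parameters are made up for illustration and do not reproduce Gudhi's exact conventions.
import numpy as np
def naive_persistence_image(dgm, resolution=20, bandwidth=0.1, bounds=(0., 1.)):
    """Sum of Gaussians, one per diagram point, in (birth, persistence) coordinates,
    each weighted by its persistence d - b."""
    grid = np.linspace(bounds[0], bounds[1], resolution)
    bb, pp = np.meshgrid(grid, grid)                 # birth axis / persistence axis
    img = np.zeros_like(bb)
    for b, d in dgm:
        pers = d - b
        img += pers * np.exp(-((bb - b) ** 2 + (pp - pers) ** 2) / (2 * bandwidth ** 2))
    return img
# A made-up diagram: one prominent point, one point close to the diagonal.
dgm = np.array([[0.1, 0.8], [0.3, 0.35]])
print(naive_persistence_image(dgm).shape)  # (20, 20)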
u.showcase_vectorization()
5. Topological Optimization¶
Last but not least: it is now more and more common to use topological descriptors such as persistence diagrams in optimization tasks, in order to incorporate topological priors in your modeling problem.
For instance, you may be trying to model some 3D dynamical system that depends on a parameter $\theta$; let us denote by $(s_{\theta,t})_{t}$ the (discrete) observations you can generate with your model. Now, assume that you know that the trajectories of your flow should be nearly circular. Then, a natural thing you can try is to optimize $\theta$ so that the (Cech or Rips) persistence diagram of the observations $(s_{\theta,t})_{t=1}^T$ (for $T$ large), in homology dimension $1$, has a single prominent (far from the diagonal) point. Therefore, given a current $\theta$, we want to modify it so that the diagram of $(s_{\theta,t})_{t=1}^T$ satisfies this kind of property as much as possible.
More generally, the question of topological optimization reads like this: given a point cloud $X(\theta) \subset \R^d$ parametrized by a parameter $\theta \in \Theta \subset \R^p$ and a loss function $L : \mathcal{D} \to \R$ (where we recall that $\mathcal{D}$ denote the space of persistence diagrams), how to minimize
$$ F : \theta \mapsto L(\dgm(X(\theta)))\ ,$$where $\dgm$ denotes the Rips (or $\Cech$, but Rips is simpler) diagram of the point cloud $X(\theta)$.
Formally speaking, $F$ goes from $\Theta \subset \R^p$ to $\R$ and, under mild assumptions, is Lipschitz, hence admits a gradient almost everywhere. Therefore, it should be possible to minimize it using a standard gradient descent algorithm. However, how does one compute $\nabla F(\theta)$?
This is by no means a trivial question, because we cannot apply the chain rule faithfully: the intermediate space $\mathcal{D}$ is not a vector space (see the previous section), so defining for instance $\nabla L(\mu)$ at some $\mu \in \mathcal{D}$ is unclear (this can be done by relying on Alexandrov geometry, but this is a story for another time).
Nonetheless, our intuition tells us the following: $\mu \mapsto L(\mu)$ depends on the points $(b_i, d_i)_i$ in the diagram, so trying to locally decrease $L$ should boil down to moving the points of $\mu$ in some prescribed directions. Now, recall that the points of $\mu$ themselves depend on the filtration values of the Rips filtration, which itself only depends on the distances between pairs of points in $X(\theta)$, themselves naturally depending on the point coordinates, which in turn depend on $\theta$. Hopefully, we should be able to backpropagate these dependencies to eventually get the gradient of $L$ with respect to $\theta$. A key contribution of this work is to properly justify that, yes, composing the gradients of all these elementary operations indeed yields a gradient for $F : \theta \mapsto L(\dgm(X(\theta)))$.
Topological optimization is a fairly recent research topic in TDA, with only little code available (but some in Gudhi
, see the next section!) and a lot of progress remains to be done.
Applying it in the context of dynamical systems has never been done and convincing experiments would be highly relevant contributions to the field.
III. Gudhi¶
1. Overall presentation of Gudhi¶
First and foremost, the (Python
) documentation for Gudhi
is available here.
This should be your main reference when trying to use the library.
Gudhi
is a fairly sophisticated library, and it may not be obvious to navigate through the different interfaces, constructors, etc.
It gives you tight control over every object you manipulate, which can be very useful if you want to experiment with new ideas.
On the other hand, you may sometimes feel a bit overloaded with all the possible options.
The goal of this section is to facilitate this task by providing a biased presentation of the library, oriented toward the tools we will probably need.
You are more than encouraged to investigate other options provided by the library.
With Gudhi
you can (non-exhaustive list):
- Create and manipulate combinatorial structures (representing simplicial complexes and filtrations of them) optimized for downstream computation of persistent homology. There are different structures available; we will focus on the SimplexTree structure here.
- Extract topological information (persistence diagrams) from these objects.
- Manipulate persistence diagrams: compare them with the corresponding metrics, vectorize them (see Section II.4), etc.
- Do all these steps in an (automatically!) differentiable way relying on tensorflow. That is, you can have access to gradients (that you do not have to compute by yourself!) and you will be able to minimize objective functions that depend on the parameters of your problem (e.g. the coordinates of the points in your input point cloud).
Note: normally, you should have run the first (code) cell of the notebook without error, hence you have access to Gudhi
with the shortcut gd
.
Dependencies: Some modules in Gudhi
have some dependencies that are not installed by default (so that a user not interested in those does not have to install them). For instance, the persistence representations module (or at least some methods therein) depends on scikit-learn and possibly tensorflow. Therefore, don't be surprised if at some point you try to use a function and get an error message like no module named XXX
when calling a genuine Gudhi
function. Check the dependencies first and install the corresponding packages!
2. The SimplexTree interface¶
The SimplexTree
structure is a way to efficiently store simplicial complexes along with filtration values.
The first step is to instantiate a SimplexTree
. After running the following cell, you will essentially have built an empty simplicial complex.
st = gd.SimplexTree()
We can insert simplices in it. Let us start with a vertex, labeled as [0]
(simplices are always represented as list
of int
in this API).
Note: this method returns a Boolean, saying if the vertex is new (returns True
) or if it was already there in the SimplexTree
(returns False
). So if you run the cell twice, it should return True
the first time, and False
the second time.
st.insert([0])
True
Let us check what is inside my SimplexTree
.
For this, we call .get_filtration()
, which returns a generator (something we can iterate on) made of pairs (simplex, value)
.
As you will see, the default filtration value of a simplex when calling .insert
is 0.
.
for simplex, value in st.get_filtration():
print("Simplex:", simplex, "---> value:", value)
Simplex: [0] ---> value: 0.0
Let us introduce another simplex. An edge this time, and for which we specify that the filtration value is 2.0
.
st.insert([0,1], filtration=2.0)
True
A warning should arise in your mind: here we inserted the edge [0,1]
before inserting the vertex [1]
.
How does Gudhi
behave in that case?
for simplex, value in st.get_filtration():
print("Simplex:", simplex, "---> value:", value)
Simplex: [0] ---> value: 0.0 Simplex: [1] ---> value: 2.0 Simplex: [0, 1] ---> value: 2.0
Nice: when introducing an edge, Gudhi automatically introduces the missing vertices. Furthermore, it assigns the filtration value chosen for the edge to the newly added vertices. Of course, this works with higher dimensional simplices as well (all the missing faces are added with the same filtration value, and so on).
st.insert([0, 1, 2], filtration=3.0)
for simplex, value in st.get_filtration():
print("Simplex:", simplex, "---> value:", value)
Simplex: [0] ---> value: 0.0 Simplex: [1] ---> value: 2.0 Simplex: [0, 1] ---> value: 2.0 Simplex: [2] ---> value: 3.0 Simplex: [0, 2] ---> value: 3.0 Simplex: [1, 2] ---> value: 3.0 Simplex: [0, 1, 2] ---> value: 3.0
Let us manipulate our SimplexTree a bit more
to showcase some behavior.
st.insert([4], filtration = 5.0) # add a new vertex with filtration value 5.0
st.insert([3,4], filtration = 3.0) # add a new edge between vertex 3 and 4 with filtration value 3.0
st.insert([0, 1, 2], filtration=3.0)
for simplex, value in st.get_filtration():
print("Simplex:", simplex, "---> value:", value)
Simplex: [0] ---> value: 0.0 Simplex: [1] ---> value: 2.0 Simplex: [0, 1] ---> value: 2.0 Simplex: [2] ---> value: 3.0 Simplex: [0, 2] ---> value: 3.0 Simplex: [1, 2] ---> value: 3.0 Simplex: [0, 1, 2] ---> value: 3.0 Simplex: [3] ---> value: 3.0 Simplex: [4] ---> value: 3.0 Simplex: [3, 4] ---> value: 3.0
Question: What happened there? What motivates this behavior?
All of this is neat, but of course we do not want to create sophisticated simplicial complexes (like the $\Cech$ or the Rips) by hand.
Naturally, these are implemented in Gudhi
.
It is done in two steps (but one line): we instantiate a RipsComplex
object on a given point cloud X
, and then turn it into a SimplexTree
using the method .create_simplex_tree()
. You must specify the maximal dimension of simplices you want to consider in your SimplexTree
(e.g. max_dimension=2
will include vertices, edges and triangles, but nothing above).
Note: If you want to compute topological features of dimension $k$, you need to consider simplices of dimension up to $k+1$. If you are interested in loops for instance, you should set max_dimension=2
(setting a higher value would work, but would make your simplicial complex much larger, hence increase the memory footprint and running times).
X = np.array([[0,0], [0,1], [0,2], [1,2], [2,2], [2,1], [2,0], [1,0]]) # a 2-dimensional point cloud
fig, ax = plt.subplots()
ax.scatter(X[:,0], X[:,1], color='red', zorder=5)
for i, x in enumerate(X):
ax.annotate('%s' %i, x + (0.03, 0.03))
ax.grid()
rips_complex = gd.RipsComplex(points=X).create_simplex_tree(max_dimension=2)
for simplex, value in rips_complex.get_filtration():
print("Simplex:", simplex, "---> value:", value)
Simplex: [0] ---> value: 0.0 Simplex: [1] ---> value: 0.0 Simplex: [2] ---> value: 0.0 Simplex: [3] ---> value: 0.0 Simplex: [4] ---> value: 0.0 Simplex: [5] ---> value: 0.0 Simplex: [6] ---> value: 0.0 Simplex: [7] ---> value: 0.0 Simplex: [0, 1] ---> value: 1.0 Simplex: [1, 2] ---> value: 1.0 Simplex: [2, 3] ---> value: 1.0 Simplex: [3, 4] ---> value: 1.0 Simplex: [4, 5] ---> value: 1.0 Simplex: [5, 6] ---> value: 1.0 Simplex: [0, 7] ---> value: 1.0 Simplex: [6, 7] ---> value: 1.0 Simplex: [1, 3] ---> value: 1.4142135623730951 Simplex: [1, 2, 3] ---> value: 1.4142135623730951 Simplex: [3, 5] ---> value: 1.4142135623730951 Simplex: [3, 4, 5] ---> value: 1.4142135623730951 Simplex: [1, 7] ---> value: 1.4142135623730951 Simplex: [0, 1, 7] ---> value: 1.4142135623730951 Simplex: [5, 7] ---> value: 1.4142135623730951 Simplex: [5, 6, 7] ---> value: 1.4142135623730951 Simplex: [0, 2] ---> value: 2.0 Simplex: [0, 1, 2] ---> value: 2.0 Simplex: [2, 4] ---> value: 2.0 Simplex: [2, 3, 4] ---> value: 2.0 Simplex: [1, 5] ---> value: 2.0 Simplex: [1, 3, 5] ---> value: 2.0 Simplex: [0, 6] ---> value: 2.0 Simplex: [4, 6] ---> value: 2.0 Simplex: [4, 5, 6] ---> value: 2.0 Simplex: [3, 7] ---> value: 2.0 Simplex: [1, 3, 7] ---> value: 2.0 Simplex: [1, 5, 7] ---> value: 2.0 Simplex: [3, 5, 7] ---> value: 2.0 Simplex: [0, 6, 7] ---> value: 2.0 Simplex: [0, 3] ---> value: 2.23606797749979 Simplex: [0, 1, 3] ---> value: 2.23606797749979 Simplex: [0, 2, 3] ---> value: 2.23606797749979 Simplex: [1, 4] ---> value: 2.23606797749979 Simplex: [1, 2, 4] ---> value: 2.23606797749979 Simplex: [1, 3, 4] ---> value: 2.23606797749979 Simplex: [0, 5] ---> value: 2.23606797749979 Simplex: [0, 1, 5] ---> value: 2.23606797749979 Simplex: [2, 5] ---> value: 2.23606797749979 Simplex: [0, 2, 5] ---> value: 2.23606797749979 Simplex: [1, 2, 5] ---> value: 2.23606797749979 Simplex: [0, 3, 5] ---> value: 2.23606797749979 Simplex: [2, 3, 5] ---> value: 2.23606797749979 Simplex: [1, 4, 5] ---> value: 2.23606797749979 Simplex: [2, 4, 5] ---> value: 2.23606797749979 Simplex: [1, 6] ---> value: 2.23606797749979 Simplex: [0, 1, 6] ---> value: 2.23606797749979 Simplex: [3, 6] ---> value: 2.23606797749979 Simplex: [0, 3, 6] ---> value: 2.23606797749979 Simplex: [1, 3, 6] ---> value: 2.23606797749979 Simplex: [1, 4, 6] ---> value: 2.23606797749979 Simplex: [3, 4, 6] ---> value: 2.23606797749979 Simplex: [0, 5, 6] ---> value: 2.23606797749979 Simplex: [1, 5, 6] ---> value: 2.23606797749979 Simplex: [3, 5, 6] ---> value: 2.23606797749979 Simplex: [2, 7] ---> value: 2.23606797749979 Simplex: [0, 2, 7] ---> value: 2.23606797749979 Simplex: [1, 2, 7] ---> value: 2.23606797749979 Simplex: [0, 3, 7] ---> value: 2.23606797749979 Simplex: [2, 3, 7] ---> value: 2.23606797749979 Simplex: [4, 7] ---> value: 2.23606797749979 Simplex: [1, 4, 7] ---> value: 2.23606797749979 Simplex: [2, 4, 7] ---> value: 2.23606797749979 Simplex: [3, 4, 7] ---> value: 2.23606797749979 Simplex: [0, 5, 7] ---> value: 2.23606797749979 Simplex: [2, 5, 7] ---> value: 2.23606797749979 Simplex: [4, 5, 7] ---> value: 2.23606797749979 Simplex: [1, 6, 7] ---> value: 2.23606797749979 Simplex: [3, 6, 7] ---> value: 2.23606797749979 Simplex: [4, 6, 7] ---> value: 2.23606797749979 Simplex: [0, 4] ---> value: 2.8284271247461903 Simplex: [0, 1, 4] ---> value: 2.8284271247461903 Simplex: [0, 2, 4] ---> value: 2.8284271247461903 Simplex: [0, 3, 4] ---> value: 2.8284271247461903 Simplex: [0, 4, 5] ---> value: 2.8284271247461903 Simplex: [2, 6] ---> value: 2.8284271247461903 Simplex: [0, 2, 
6] ---> value: 2.8284271247461903 Simplex: [1, 2, 6] ---> value: 2.8284271247461903 Simplex: [2, 3, 6] ---> value: 2.8284271247461903 Simplex: [0, 4, 6] ---> value: 2.8284271247461903 Simplex: [2, 4, 6] ---> value: 2.8284271247461903 Simplex: [2, 5, 6] ---> value: 2.8284271247461903 Simplex: [0, 4, 7] ---> value: 2.8284271247461903 Simplex: [2, 6, 7] ---> value: 2.8284271247461903
Recall that the Rips filtration only depends on the pairwise distances between the points in your point cloud.
In particular, you can define it for points that only belong to a metric space $\XX$ that may not be the Euclidean space (e.g. a manifold equipped with its geodesic distance, shortest paths on a graph, etc). For this, the only thing you have to do is to specify distance_matrix = M
instead of points=X
when calling RipsComplex()
.
Note that, formally speaking, M
does not even need to be a proper distance matrix. It can be any square matrix with non-negative entries.
M = np.random.rand(4, 4) # A random 4x4 square matrix with entries in (0,1)
rips_complex = gd.RipsComplex(distance_matrix=M).create_simplex_tree(max_dimension=2)
for simplex, value in rips_complex.get_filtration():
print("Simplex:", simplex, "---> value:", value)
Simplex: [0] ---> value: 0.0 Simplex: [1] ---> value: 0.0 Simplex: [2] ---> value: 0.0 Simplex: [3] ---> value: 0.0 Simplex: [1, 3] ---> value: 0.12628582984808145 Simplex: [2, 3] ---> value: 0.14834324394652643 Simplex: [1, 2] ---> value: 0.3228545589508307 Simplex: [1, 2, 3] ---> value: 0.3228545589508307 Simplex: [0, 2] ---> value: 0.3615988007382981 Simplex: [0, 3] ---> value: 0.415702267407685 Simplex: [0, 2, 3] ---> value: 0.415702267407685 Simplex: [0, 1] ---> value: 0.4678051145898179 Simplex: [0, 1, 2] ---> value: 0.4678051145898179 Simplex: [0, 1, 3] ---> value: 0.4678051145898179
Some additional remarks:
- You can also introduce a parameter max_edge_length in RipsComplex() that stops the insertion of edges (and further triangles, etc.) above a given threshold (theoretically, this is equivalent to setting the filtration value to $+\infty$). This can be convenient if you know that you only need to look at things "locally", and it can significantly reduce the size of your complex (hence improve computational efficiency).
- An equivalent construction to build the $\Cech$ simplicial filtration can be done using the class AlphaComplex() followed by .create_simplex_tree() as well. Beware that, for some technical reasons, the filtration values will be squared distances, so if you really want to get the $\Cech$ filtration, you need to take the square root of the filtration values provided by your AlphaComplex (see the sketch below).
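For instance, a minimal sketch of this square-root correction could look as follows (we iterate over a copy of the filtration, since we modify the SimplexTree while looping):
import numpy as np
import gudhi as gd
X = np.random.randn(30, 2)
ac = gd.AlphaComplex(points=X).create_simplex_tree()
# Alpha filtration values are squared radii: take square roots to recover Cech-like values.
for simplex, value in list(ac.get_filtration()):
    ac.assign_filtration(simplex, np.sqrt(value))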
3. Extracting and manipulating persistence diagrams¶
Now that we can construct simplicial complexes along with filtration values, we should be able to compute persistent homology. The pipeline is simple: consider your SimplexTree
(be it a RipsComplex
, an AlphaComplex
or something else you designed) and call the method .compute_persistence()
. This method returns None
(nothing), but it makes accessible all the important topological information you may want, basically using the method .persistence_intervals_in_dimension(dimension=...)
to get the list of intervals (that is, the persistence diagram or barcode) accounting for a specific homology dimension (e.g. setting dimension=1
will return the list of intervals accounting for births and deaths of loops in your filtration).
Beware: if you call functions like persistence_intervals_in_dimension()
before running compute_persistence()
, you will get an error.
Note: Instead of compute_persistence()
, you can equivalently run persistence()
, which will both compute the persistence and return persistence intervals in all dimensions (that is, the whole persistence diagram).
Note: Diagrams can easily be visualized using plot_persistence_diagram(dgm, axes=ax)
, where dgm
is a persistence diagram (obtained either by calling persistence(), persistence_intervals_in_dimension()
or simply by passing a (n x 2) np.array)
, and ax
is a matplotlib Axes
. You similarly have access to plot_persistence_barcode()
. Note that these plot functions return the ax
, so you can modify the plot afterward.
# Let us give an example with a Rips Filtration on a random point cloud in 2D.
# Build the point cloud
X = np.random.randn(30, 2) # 30 points in dimension 2
# Build the Rips simplicial complex
rc = gd.RipsComplex(points=X).create_simplex_tree(max_dimension=2) # A RipsComplex where we introduce vertices, edges and triangles, but not higher dimensional simplices.
# Compute and read its persistence (in all dimensions)
dgm = rc.persistence() # We compute its persistence diagram
# Plot all of this.
fig, axs = plt.subplots(1, 2, figsize=(12,4))
ax = axs[0]
ax.scatter(X[:,0], X[:,1], color='red')
ax.set_title("Input point cloud")
ax.grid()
ax = axs[1]
ax = gd.plot_persistence_diagram(dgm, axes=ax)
ax.set_title("PD (you can modify the title)")
Text(0.5, 1.0, 'PD (you can modify the title)')
You can also compute the distance between persistence diagrams in a single homological dimension (a priori, the same one for both diagrams). Two kinds of metrics are available in Gudhi
: the Wasserstein and the Bottleneck distances (which are very similar to each other).
They are available in two ways: either in the module gudhi.wasserstein
or in gudhi.representations.metrics
.
The second module is quite useful as it mimics the fit
and transform
API of scikit-learn
, so we will showcase it.
It means that the distance between two diagrams is computed by first instantiating an object W = gudhi.representations.metrics.WassersteinDistance(*args)
.
It can also be directly used to compute the pairwise distance matrix for a given set of diagrams (useful in many situations in statistics and learning).
Note: the Wasserstein distance depends on a parameter $p$ encoded as order
in this API---other parameters are also involved (like the method used for computation), see the documentation for details.
# We generate three random 2D point clouds
X1 = np.random.randn(20, 2)
X2 = np.random.randn(30, 2)
X3 = np.random.randn(50, 2)
# Compute their Rips filtrations
rc1 = gd.RipsComplex(points=X1).create_simplex_tree(max_dimension=2)
rc2 = gd.RipsComplex(points=X2).create_simplex_tree(max_dimension=2)
rc3 = gd.RipsComplex(points=X3).create_simplex_tree(max_dimension=2)
# Compute their persistence
rc1.compute_persistence()
rc2.compute_persistence()
rc3.compute_persistence()
# Get the diagram in dimension 1 (loops)
dgm1 = rc1.persistence_intervals_in_dimension(1)
dgm2 = rc2.persistence_intervals_in_dimension(1)
dgm3 = rc3.persistence_intervals_in_dimension(1)
# Now compute the Wasserstein Distance between the first two diagrams:
Wdist = gd.representations.metrics.WassersteinDistance(order=2.)
dist = Wdist(dgm1, dgm2)
print("Distance between the two diagrams: %.3f" %dist)
# and now the pairwise distances matrix using a sklearn-like API
dgm_set = [dgm1, dgm2, dgm3]
Wdist.fit(dgm_set)
dist_matrix = Wdist.transform(dgm_set) # Note: we could pass another set of diagrams here, to compute pairwise distances between the set used in fit and this second set of diagrams.
print("\nPairwise distance matrix between the three diagrams:")
print(np.round(dist_matrix, 3))
Distance between the two diagrams: 0.078 Pairwise distance matrix between the three diagrams: [[0. 0.078 0.085] [0.078 0. 0.083] [0.085 0.083 0. ]]
Finally, you can use vectorization tools from the module gudhi.representations.vector_methods
. We showcase here how to use the Persistence Image vectorization, and refer to the documentation for the various other possibilities available.
Here as well, you start by instantiating an object from the class gudhi.representations.vector_methods.PersistenceImage(*args)
with a set of *args
to be specified. Recall (see Section II.4) that Persistence Images mostly boils down to put a weighted Gaussian kernel on each point of the diagrams, and then discretizing the resulting density on a grid of prescribed resolution.
We will thus specify (other options are available, see the documentation as always)
- the bandwidth of the Gaussian kernels,
- the resolution (final image size).
Note: in order to be immediately incorporated in machine learning pipelines, the outputs of PersistenceImage.transform(*args)
are (1D) vectors, that is, if you choose a resolution of 30x30
, you will have vectors of size 900
. If you want to plot the persistence images as matrices (using imshow
in matplotlib), you must reshape
them first.
Note: if you want to use these methods for a single diagram dgm
, the easiest way to go is to call them with the list [dgm]
.
# We use the same diagram list as above, so do not forget to run the previous cell first.
# Instantiate the object
reso = 30, 30
PI = gd.representations.vector_methods.PersistenceImage(bandwidth=0.05, resolution=reso)
# fit it to the dataset (so that it adapts a few internal parameters)
PI.fit(dgm_set)
# And now we compute the persistence images of all diagrams in our list.
final_persistence_images = PI.transform(dgm_set)
n = len(dgm_set)
fig, axs = plt.subplots(1, n, figsize=(15,3))
for pim, ax in zip(final_persistence_images, axs):
ax.imshow(pim.reshape(reso))
4. Topological Optimization with Gudhi¶
Finally, let us showcase how to perform topological optimization with Gudhi. This is based on this tutorial (by Mathieu Carrière).
Topological optimization with Gudhi
is performed by manipulating tensorflow
objects. The tensorflow
API may be scary at first sight, but it enables powerful (and eventually rather seamless) optimization tools in general; in particular, everything can be plugged into neural networks using keras
, etc.
Note: of course you must have tensorflow
installed to run this section.
The goal of this experiment is to take a point cloud and maximize the total persistence of its Rips diagram (in homology dimension $1$), that is, we want to minimize $$ L : X \mapsto - \sum_{(b_i, d_i) \in \dgm(X)} \frac{1}{p} |d_i - b_i|^p, $$ for some $p \geq 1$, or in plain text: minus the sum of the ($p$-th powers of the) lengths of all intervals in its diagram. Minimizing this loss will essentially move the points in $X$ in order to favor the appearance of (big) loops.
Note that minimizing this loss alone would simply make the terms $|d_i - b_i|^p$ go to $\infty$ (the point cloud would spread out indefinitely). To make the problem a bit more interesting, we add a regularization term to confine the points of $X$ that would go outside $[-1,1]^2$, so the loss eventually reads
$$L'(X) = L(X) + \sum_{x_i \in X} \mathrm{dist}(x_i, [-1,1]^2).$$
# Generate and visualize the point cloud, along with its persistence diagram
np.random.seed(1)
Xinit = np.array(np.random.uniform(high=1., low=-1., size=(300,2)), dtype=np.float32)
st = gd.RipsComplex(points=Xinit, max_edge_length=1.).create_simplex_tree(max_dimension=2)
dgm = st.persistence()
fig, axs = plt.subplots(1, 2, figsize=(12, 4))
ax = axs[0]
ax.scatter(Xinit[:,0], Xinit[:,1], color='red')
ax.set_title("Initial point cloud")
ax.grid()
ax = axs[1]
plot = gd.plot_persistence_diagram(dgm, axes=ax)
We want to minimize the loss function $X \mapsto L(X)$ (note the $-$ sign in front of the loss).
For this, we must state that $X$ is a tensorflow
Variable
, initialized at Xinit
.
Saying that X
is trainable
means that it will be optimized over when trying to minimize $L$.
X = tf.Variable(initial_value=Xinit, trainable=True)
Now, we will instanciate a RipsLayer
, which is a tensorflow
-compatible way to compute a persistence diagram. It means that applying a RipsLayer
to a tf.Variable
computes its Vietoris-Rips persistence diagram in a differentiable way; i.e. we will have access to gradients!
layer = gd.tensorflow.RipsLayer(maximum_edge_length=1., homology_dimensions=[1])
Now we instantiate some parameters that are useful for the training in tensorflow (parameters of the gradient descent):
lr = tf.keras.optimizers.schedules.InverseTimeDecay(initial_learning_rate=1e-1, decay_steps=10, decay_rate=.01)
optimizer = tf.keras.optimizers.SGD(learning_rate=lr, momentum=0.)
And now we perform our gradient descent!
losses, dgms = [], []
for epoch in tqdm(range(200+1)):
with tf.GradientTape() as tape: # tensorflow syntax
# We compute the diagram of the current X
dgm = layer.call(X)[0][0]
# We compute the loss at X
persistence_loss = -tf.math.reduce_sum(tf.square(.5*(dgm[:,1]-dgm[:,0])))
# Unit square regularization
regularization = tf.reduce_sum(tf.maximum(tf.abs(X)-1, 0))
# Compute the loss
loss = persistence_loss + regularization
# Now, we ask tensorflow "compute the gradient of the loss with respect to the (single) variable X"
gradients = tape.gradient(loss, [X])
# We also apply a small random noise to the gradient to ensure convergence
np.random.seed(epoch)
gradients[0] = gradients[0] + np.random.normal(loc=0., scale=.001, size=gradients[0].shape)
optimizer.apply_gradients(zip(gradients, [X]))
losses.append(loss.numpy())
dgms.append(dgm)
100%|██████████| 201/201 [01:16<00:00, 2.64it/s]
We can now visualize the resulting point cloud, resulting diagram, and evolution of the loss during the gradient descent!
Xnp = X.numpy() # turn X back into a numpy array for plotting purposes
fig, axs = plt.subplots(1, 3, figsize=(20,4))
ax = axs[0]
ax.scatter(Xinit[:,0], Xinit[:,1], color='red', label='init', alpha=0.2)
ax.scatter(Xnp[:,0], Xnp[:,1], color='blue', label='final state')
ax.legend()
ax.grid()
ax.set_title("Initial and final point cloud")
ax = axs[1]
gd.plot_persistence_diagram(dgms[0].numpy(), axes=ax, colormap=[[1,0,0]], alpha=0.5)
gd.plot_persistence_diagram(dgms[-1].numpy(), axes=ax, colormap=[[0,0,1]])
ax.set_title("Initial and final persistence diagrams")
ax = axs[2]
ax.plot(losses)
ax.set_title("Evolution of the loss over iterations")
ax.grid()
5. Contributing to Gudhi¶
IV. Your turn: experiment TDA on Time Series¶
1. The Orbit Dataset¶
The Orbit dataset is a common toy dataset used in TDA to benchmark experiments. Each observation in this dataset is the output of a 2D discrete dynamical system in $[0,1]^2$ described by the equations
$$x_{n+1}=x_n+ry_n(1-y_n) \qquad \text{(mod 1)}$$$$y_{n+1}=y_n+rx_{n+1}(1-x_{n+1}) \qquad \text{(mod 1)}$$where $r$ is a parameter. Depending on the value of $r$, orbits can have quite varying trajectories, with quite different topologies!
You can sample trajectories using the function u.generate_orbit(num_pts, r)
in utils.py
.
r1, r2 = 3.5, 4.1
traj1 = u.generate_orbit(1000, r=r1)
traj2 = u.generate_orbit(1000, r=r2)
fig, axs = plt.subplots(1, 2, figsize=(12,4))
for ax, traj, r in zip(axs, [traj1, traj2], [r1, r2]):
ax.scatter(traj[:,0], traj[:,1])
ax.grid()
ax.set_title("Orbit with r = %s" %r)
Exercise: Explore how TDA can help discriminate orbits with respect to the parameter $r$. For instance, you can sample various orbits with $r=3.5$ and others with $r=4.1$ and design a simple method based on TDA to discriminate between these two models. Another interesting track is to look at the evolution of some quantity of interest (e.g. the total persistence, see Section III.4) with respect to the parameter $r$.
This is an open exercise; there is no specific answer expected! Just play with the tools at your disposal, and you may have fun and creative ideas!
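One possible starting point, sketched below, is to compare the total persistence of the $1$-dimensional Alpha diagrams of orbits generated with the two values of $r$; this is only a rough sketch, by no means the expected answer, and the Alpha complex (rather than Rips) is used simply to keep the computation light for 1000 planar points.
import numpy as np
import gudhi as gd
def total_persistence_h1(traj):
    """Sum of squared interval lengths of the 1-dimensional Alpha diagram of an orbit."""
    st = gd.AlphaComplex(points=traj).create_simplex_tree()
    st.compute_persistence()
    dgm1 = st.persistence_intervals_in_dimension(1)
    if len(dgm1) == 0:
        return 0.
    return np.sum((dgm1[:, 1] - dgm1[:, 0]) ** 2)
# u.generate_orbit was made available at the top of the notebook (import utils as u).
for r in [3.5, 4.1]:
    scores = [total_persistence_h1(u.generate_orbit(1000, r=r)) for _ in range(5)]
    print("r = %.1f: mean total persistence %.4f (std %.4f)" % (r, np.mean(scores), np.std(scores)))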
2. Recognizing motions¶
In the following, we will retrieve time series corresponding to magnetometer data of a person performing four different activities.
The dataset is made of 4 classes: walking
, stepper
, cross
, jumping
.
For each class, we have access to $10$ realizations, each realization being a $3$-dimensional time series of length $1500$.
We give you a convenient loader for the data. It also shows you a sample of each class (with an index between 0 and 9 for each class).
walkers, steppers, runners, jumpers = u.load_data_motions(idx = 9) # change idx (between 0 and 9) to see a different instance for each class.
Exercise: Relying on TDA methods, show that you can distinguish time series belonging to the four different classes using their persistence diagrams.
Here as well, this is an open question with no precise answer expected; just "convince" yourself (and us) that TDA can separate these different kinds of objects!
# Write your code here.
V. To go further: some questions before the MRC.¶
1. Minimal representative cycles¶
See for instance this request on Gudhi
's github page.
2. Filtrations for dynamical systems¶