Module 4: Persistent Homology and Persistence Diagrams¶
Introduction¶
Essential Concepts¶
Topological Data Analysis (TDA) is a framework for extracting meaningful shape information from data. Unlike traditional statistical methods that focus on distances and distributions, TDA reveals the topological structure underlying complex datasets.
Key Ideas:¶
- Topological Data Analysis (TDA): A methodology for analyzing the shape of data using tools from algebraic topology
- Point cloud data: A collection of points in some metric space (e.g., $\mathbb{R}^n$), often obtained from:
- Sensor measurements
- High-dimensional data embeddings
- Sampling from manifolds
- Scientific observations
Central Question: How do we extract topological features (connected components, loops, voids) from discrete point clouds?
Example: Point Cloud Data¶
Let's generate a simple point cloud sampled from a circle with some noise.
# Import necessary libraries
import numpy as np
import matplotlib.pyplot as plt
from matplotlib.patches import Circle
from scipy.spatial.distance import cdist
# Set random seed for reproducibility
np.random.seed(42)
# Generate points sampled from a noisy circle
n_points = 50
theta = np.linspace(0, 2*np.pi, n_points, endpoint=False)
radius = 1.0
noise_level = 0.1
# Add noise to the circle
x = radius * np.cos(theta) + np.random.normal(0, noise_level, n_points)
y = radius * np.sin(theta) + np.random.normal(0, noise_level, n_points)
points = np.column_stack([x, y])
# Visualize the point cloud
plt.figure(figsize=(8, 8))
plt.scatter(x, y, s=50, alpha=0.6)
plt.axis('equal')
plt.title('Point Cloud Sampled from a Noisy Circle', fontsize=14)
plt.xlabel('x')
plt.ylabel('y')
plt.grid(True, alpha=0.3)
plt.show()
print(f"Generated {n_points} points in 2D space")
Generated 50 points in 2D space
1. Filtrations (Core Idea)¶
Definition¶
A filtration is a nested sequence of topological spaces:
$$ \emptyset = X_0 \subseteq X_1 \subseteq X_2 \subseteq \cdots \subseteq X_n $$
Each space $X_i$ is indexed by a scale parameter (often denoted $\epsilon$ or $r$) that controls the granularity at which we examine the shape of the data.
Why Filtrations?¶
- Point clouds themselves have trivial topology (just discrete points)
- We need to "thicken" the points to reveal structure
- Different scales reveal different features
- Filtrations provide a systematic way to explore all scales
Most Common Filtrations¶
1. Vietoris–Rips Filtration¶
Definition: At scale $r$, connect points $p_i$ and $p_j$ with an edge if $d(p_i, p_j) \leq r$. Add higher-dimensional simplices for all cliques.
- Pros: Easy to compute, only requires pairwise distances
- Cons: May include simplices that don't correspond to actual geometric balls
- Most widely used in practice
Mathematical notation: $$ \text{Rips}_r(X) = \{\sigma \subseteq X : d(p_i, p_j) \leq r \text{ for all } p_i, p_j \in \sigma\} $$
# Visualize Vietoris-Rips filtration at different scales
def plot_rips_filtration(points, radii):
    fig, axes = plt.subplots(1, len(radii), figsize=(5*len(radii), 5))
    if len(radii) == 1:
        axes = [axes]
    for idx, r in enumerate(radii):
        ax = axes[idx]
        # Plot points
        ax.scatter(points[:, 0], points[:, 1], s=100, c='red', zorder=3)
        # Plot edges
        distances = cdist(points, points)
        for i in range(len(points)):
            for j in range(i+1, len(points)):
                if distances[i, j] <= r:
                    ax.plot([points[i, 0], points[j, 0]],
                            [points[i, 1], points[j, 1]],
                            'b-', alpha=0.3, linewidth=1)
        ax.set_aspect('equal')
        ax.set_title(f'Rips Filtration at r = {r:.2f}', fontsize=12)
        ax.grid(True, alpha=0.3)
    plt.tight_layout()
    plt.show()

# Use a smaller subset for clearer visualization
sample_points = points[::5]  # Take every 5th point
radii = [0.3, 0.5, 0.8]
plot_rips_filtration(sample_points, radii)
2. Čech Filtration¶
Definition: At scale $r$, a simplex is included if the intersection of balls of radius $r$ centered at its vertices is non-empty.
$$ \text{Čech}_r(X) = \left\{\sigma \subseteq X : \bigcap_{p \in \sigma} B(p, r) \neq \emptyset\right\} $$
- Pros: Theoretically correct (captures true nerve of covering)
- Cons: Computationally expensive (requires checking higher-order intersections)
- Used when theoretical guarantees are essential
Relationship (with the edge convention $d(p_i, p_j) \leq r$ used above): $\text{Rips}_r(X) \subseteq \text{Čech}_r(X) \subseteq \text{Rips}_{2r}(X)$
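The interleaving can be checked numerically (a sketch, not part of the original notebook): for three points in the plane, the triangle enters the Rips complex once $r$ reaches its diameter and the Čech complex once $r$ reaches the radius of its minimum enclosing ball, and the two thresholds satisfy $R \leq \text{diam} \leq 2R$. The helper `meb_radius_3` is mine.

```python
import numpy as np
from itertools import combinations

def meb_radius_3(pts):
    """Radius of the minimum enclosing ball of three points in the plane."""
    d01 = np.linalg.norm(pts[0] - pts[1])
    d12 = np.linalg.norm(pts[1] - pts[2])
    d02 = np.linalg.norm(pts[0] - pts[2])
    s = sorted([d01, d12, d02])
    # Obtuse (or right) triangle: the ball is spanned by the longest side
    if s[2]**2 >= s[0]**2 + s[1]**2:
        return s[2] / 2
    # Acute triangle: circumradius R = abc / (4 * area)
    v1, v2 = pts[1] - pts[0], pts[2] - pts[0]
    area = 0.5 * abs(v1[0] * v2[1] - v1[1] * v2[0])
    return d01 * d12 * d02 / (4 * area)

pts = np.array([[0.0, 0.0], [1.0, 0.0], [0.5, 0.8]])
diam = max(np.linalg.norm(p - q) for p, q in combinations(pts, 2))
R = meb_radius_3(pts)
# Cech threshold R, Rips threshold diam; interleaving gives R <= diam <= 2R
print(R, diam)
assert R <= diam <= 2 * R
```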
# Visualize Čech filtration concept with ball intersections
def plot_cech_concept():
    fig, axes = plt.subplots(1, 2, figsize=(14, 6))
    # Example points
    pts = np.array([[0, 0], [1, 0], [0.5, 0.8]])
    for idx, r in enumerate([0.4, 0.6]):
        ax = axes[idx]
        # Draw circles
        for i, pt in enumerate(pts):
            circle = Circle(pt, r, fill=False, edgecolor='blue', linewidth=2)
            ax.add_patch(circle)
            circle_fill = Circle(pt, r, alpha=0.1, facecolor='blue')
            ax.add_patch(circle_fill)
            ax.scatter(pt[0], pt[1], s=100, c='red', zorder=3)
        # Draw edges if balls intersect
        for i in range(len(pts)):
            for j in range(i+1, len(pts)):
                if np.linalg.norm(pts[i] - pts[j]) <= 2*r:
                    ax.plot([pts[i, 0], pts[j, 0]],
                            [pts[i, 1], pts[j, 1]],
                            'k-', linewidth=2, alpha=0.5)
        ax.set_xlim(-1, 2)
        ax.set_ylim(-1, 2)
        ax.set_aspect('equal')
        ax.set_title(f'Čech Complex at r = {r:.1f}', fontsize=12)
        ax.grid(True, alpha=0.3)
    plt.tight_layout()
    plt.show()

plot_cech_concept()
3. Alpha Filtration¶
Definition: Based on the Delaunay triangulation and Voronoi diagram. A simplex is included at scale $r$ if there exists an empty ball of radius at most $r$ whose boundary passes through its vertices (empty meaning the ball contains no other data points).
- Pros: Efficient in low dimensions (2D, 3D)
- Cons: Scales poorly to high dimensions
- Provides a subset of Čech complex with same homology
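The efficiency claim can be made concrete (an illustrative sketch, not from the original notebook): every alpha-complex simplex is a Delaunay simplex, so in 2D the complex never exceeds the linear-sized Delaunay triangulation, whereas the Rips/Čech scaffold can use all $O(n^2)$ edges.

```python
import numpy as np
from scipy.spatial import Delaunay

rng = np.random.default_rng(0)
pts = rng.uniform(size=(200, 2))
tri = Delaunay(pts)
# Collect the Delaunay edges; every alpha-complex simplex at any scale r
# is one of these simplices, so the complex stays linear-sized in 2D
edges = {tuple(sorted((s[i], s[j])))
         for s in tri.simplices for i in range(3) for j in range(i + 1, 3)}
print(len(tri.simplices), len(edges))
```

Compare `len(edges)` with the $\binom{200}{2} = 19900$ edges a Rips complex may have to consider.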
4. Sublevel-Set Filtration¶
Definition: Given a function $f: X \to \mathbb{R}$, the sublevel set at height $a$ is:
$$ X_a = \{x \in X : f(x) \leq a\} $$
- Use cases: Analyzing scalar fields, images, height functions
- Common in applications involving functions on manifolds
- Example: elevation data, density functions, image pixel intensities
# Visualize sublevel-set filtration on a 2D function
def plot_sublevel_filtration():
    # Create a 2D function (e.g., sum of Gaussians)
    x = np.linspace(-3, 3, 100)
    y = np.linspace(-3, 3, 100)
    X, Y = np.meshgrid(x, y)
    # Function: two Gaussian peaks
    Z = (np.exp(-((X-1)**2 + (Y-1)**2)) +
         np.exp(-((X+1)**2 + (Y+1)**2)))
    fig, axes = plt.subplots(1, 3, figsize=(18, 5))
    # Original function
    im = axes[0].contourf(X, Y, Z, levels=20, cmap='viridis')
    axes[0].set_title('Function f(x,y)', fontsize=12)
    axes[0].set_aspect('equal')
    plt.colorbar(im, ax=axes[0])
    # Sublevel sets at different heights
    for idx, threshold in enumerate([0.3, 0.7]):
        axes[idx+1].contourf(X, Y, Z, levels=[0, threshold], colors=['lightblue'], alpha=0.6)
        axes[idx+1].contour(X, Y, Z, levels=[threshold], colors='blue', linewidths=2)
        axes[idx+1].contourf(X, Y, Z, levels=20, cmap='viridis', alpha=0.3)
        axes[idx+1].set_title(f'Sublevel Set: f(x,y) ≤ {threshold}', fontsize=12)
        axes[idx+1].set_aspect('equal')
    plt.tight_layout()
    plt.show()

plot_sublevel_filtration()
Comparison of Filtrations¶
| Filtration | Computational Cost | Theoretical Accuracy | Typical Use Case |
|---|---|---|---|
| Vietoris–Rips | Low | Approximation | General point clouds |
| Čech | High | Exact (nerve theorem) | Theoretical analysis |
| Alpha | Medium (low dim) | Exact (in low dim) | 2D/3D geometric data |
| Sublevel-set | Depends on domain | Exact | Scalar fields, images |
2. Topological Features Across Scales¶
Birth and Death of Features¶
As we increase the scale parameter in a filtration, topological features appear and disappear:
- Birth: The scale at which a feature first appears
- Death: The scale at which the feature is filled, merged, or destroyed
Types of Features¶
Persistent homology tracks features in different dimensions:
0-Dimensional Features: Connected Components¶
- Birth: A component is born when a point is added
- Death: A component dies when it merges with an older component
- Tracks connectivity of the space
$$H_0 \text{ counts connected components}$$
# Visualize birth and death of connected components
def visualize_components():
    # Create 3 clusters of points
    np.random.seed(123)
    cluster1 = np.random.randn(8, 2) * 0.2 + np.array([0, 0])
    cluster2 = np.random.randn(8, 2) * 0.2 + np.array([2, 0])
    cluster3 = np.random.randn(8, 2) * 0.2 + np.array([1, 2])
    points = np.vstack([cluster1, cluster2, cluster3])
    fig, axes = plt.subplots(1, 4, figsize=(20, 5))
    radii = [0.0, 0.5, 1.6, 2]
    for idx, r in enumerate(radii):
        ax = axes[idx]
        ax.scatter(points[:, 0], points[:, 1], s=100, c='red', zorder=3)
        if r > 0:
            distances = cdist(points, points)
            for i in range(len(points)):
                for j in range(i+1, len(points)):
                    if distances[i, j] <= r:
                        ax.plot([points[i, 0], points[j, 0]],
                                [points[i, 1], points[j, 1]],
                                'b-', alpha=0.3, linewidth=1.5)
        ax.set_aspect('equal')
        ax.set_title(f'r = {r:.1f}', fontsize=14)
        ax.grid(True, alpha=0.3)
        # Component counts hardcoded for these radii
        # (the actual computation requires Union-Find)
        if r == 0.0:
            n_components = len(points)
        elif r == 0.5:
            n_components = 3
        elif r == 1.6:
            n_components = 2
        else:
            n_components = 1
        ax.text(0.05, 0.95, f'Components: {n_components}',
                transform=ax.transAxes, fontsize=12,
                verticalalignment='top',
                bbox=dict(boxstyle='round', facecolor='wheat', alpha=0.5))
    plt.suptitle('Birth and Death of Connected Components (H₀)', fontsize=16, y=1.02)
    plt.tight_layout()
    plt.show()

visualize_components()
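The component counts in the plot above are hardcoded; the real computation runs union-find over the edges of the Rips 1-skeleton. A minimal sketch (the function name `count_components` is mine, not from the notebook):

```python
import numpy as np
from scipy.spatial.distance import cdist

def count_components(points, r):
    """Count connected components of the Rips 1-skeleton at scale r
    using union-find with path halving."""
    parent = list(range(len(points)))
    def find(i):
        while parent[i] != i:
            parent[i] = parent[parent[i]]  # path halving
            i = parent[i]
        return i
    d = cdist(points, points)
    for i in range(len(points)):
        for j in range(i + 1, len(points)):
            if d[i, j] <= r:
                parent[find(i)] = find(j)  # union the two components
    return len({find(i) for i in range(len(points))})

pts = np.array([[0, 0], [0.1, 0], [2, 0], [2.1, 0]])
print(count_components(pts, 0.5))  # 2: two tight pairs, far apart
print(count_components(pts, 3.0))  # 1: everything merges
```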
1-Dimensional Features: Loops and Holes¶
- Birth: A loop is born when a cycle is formed
- Death: A loop dies when it is filled by a 2-dimensional simplex
- Captures circular structure in data
$$H_1 \text{ counts loops/holes}$$
Example: Points sampled from a circle create a 1-dimensional hole
# Visualize birth and death of a loop
def visualize_loop():
    # Generate circle points
    n = 12
    theta = np.linspace(0, 2*np.pi, n, endpoint=False)
    circle_points = np.column_stack([np.cos(theta), np.sin(theta)])
    fig, axes = plt.subplots(1, 4, figsize=(15, 5))
    radii = [0.5, 0.8, 1.8, 2]
    for idx, r in enumerate(radii):
        ax = axes[idx]
        ax.scatter(circle_points[:, 0], circle_points[:, 1], s=100, c='red', zorder=3)
        distances = cdist(circle_points, circle_points)
        for i in range(len(circle_points)):
            for j in range(i+1, len(circle_points)):
                if distances[i, j] <= r:
                    ax.plot([circle_points[i, 0], circle_points[j, 0]],
                            [circle_points[i, 1], circle_points[j, 1]],
                            'b-', alpha=0.3, linewidth=1.5)
        ax.set_xlim(-1.5, 1.5)
        ax.set_ylim(-1.5, 1.5)
        ax.set_aspect('equal')
        ax.grid(True, alpha=0.3)
        if idx == 0:
            title = f'r = {r:.1f}\nNo loop yet'
        elif idx == 1:
            title = f'r = {r:.1f}\nLoop is BORN (H₁)'
        elif idx == 2:  # third panel (the comparison was mistakenly against the radius 1.8)
            title = f'r = {r:.1f}\nLoop is still alive (H₁)'
        else:
            title = f'r = {r:.1f}\nLoop is FILLED (dies)'
        ax.set_title(title, fontsize=12)
    plt.suptitle('Birth and Death of a 1-Dimensional Loop', fontsize=16, y=1.02)
    plt.tight_layout()
    plt.show()

visualize_loop()
2-Dimensional Features: Voids¶
- Birth: A void is born when a hollow 3D cavity is formed
- Death: A void dies when it is filled by a 3-dimensional simplex
- Captures volumetric structure
$$H_2 \text{ counts voids/cavities}$$
Example: Points sampled from the surface of a sphere create a 2-dimensional void
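The notebook has no plot for this case, but generating a test cloud is easy; computing $H_2$ itself requires a TDA library such as `ripser` or `gudhi`, which is outside this sketch.

```python
import numpy as np

rng = np.random.default_rng(0)
# Sample points uniformly on the unit sphere by normalizing Gaussian vectors
pts = rng.normal(size=(200, 3))
pts /= np.linalg.norm(pts, axis=1, keepdims=True)
# All points lie exactly on the sphere surface; a Rips complex built on them
# at a moderate scale would carry one persistent H2 class (the enclosed void)
assert np.allclose(np.linalg.norm(pts, axis=1), 1.0)
```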
Key Insight¶
By tracking when features are born and when they die across the filtration, we obtain a multiscale signature of the topological structure of our data. Features that persist for a long time (long lifespan) are typically considered signal, while short-lived features are often treated as noise.
This leads naturally to the concept of persistence, which we'll explore in the next sections.
Signal vs. Noise Heuristic¶
A fundamental heuristic (widely used in practice):
- Long-lived features (large persistence) → meaningful structure, signal
- Short-lived features (small persistence) → noise, artifacts
Example: Points sampled from a noisy circle create a prominent 1-dimensional loop that persists across many scales (signal), while small noise-induced loops appear and disappear quickly (noise).
# Example: Generate noisy circle data
n_points = 50
theta = np.linspace(0, 2*np.pi, n_points, endpoint=False)
radius = 1.0
noise_level = 0.15
x = radius * np.cos(theta) + np.random.normal(0, noise_level, n_points)
y = radius * np.sin(theta) + np.random.normal(0, noise_level, n_points)
circle_points = np.column_stack([x, y])
# Visualize the evolution of topology
fig, axes = plt.subplots(1, 4, figsize=(20, 5))
radii = [0.2, 0.35, 0.5, 0.8]
for idx, r in enumerate(radii):
    ax = axes[idx]
    ax.scatter(x, y, s=80, c='red', zorder=3, alpha=0.7)
    # Draw edges for Rips complex
    distances = cdist(circle_points, circle_points)
    for i in range(len(circle_points)):
        for j in range(i+1, len(circle_points)):
            if distances[i, j] <= r:
                ax.plot([circle_points[i, 0], circle_points[j, 0]],
                        [circle_points[i, 1], circle_points[j, 1]],
                        'b-', alpha=0.2, linewidth=1)
    ax.set_aspect('equal')
    ax.set_title(f'Scale r = {r:.2f}', fontsize=13)
    ax.grid(True, alpha=0.3)
    ax.set_xlim(-1.5, 1.5)
    ax.set_ylim(-1.5, 1.5)
    # Add annotation
    if idx == 0:
        ax.text(0.5, -1.3, 'Disconnected\ncomponents', ha='center', fontsize=10)
    elif idx == 1:
        ax.text(0.5, -1.3, 'Components\nmerging', ha='center', fontsize=10)
    elif idx == 2:
        ax.text(0.5, -1.3, 'Loop BORN\n(H₁ feature)', ha='center', fontsize=10,
                bbox=dict(boxstyle='round', facecolor='yellow', alpha=0.5))
    else:
        ax.text(0.5, -1.3, 'Loop persists\n(signal)', ha='center', fontsize=10)
plt.suptitle('Persistent Homology: Tracking Features Across Scales', fontsize=16, y=1.02)
plt.tight_layout()
plt.show()
print("Key observation: The main loop (H₁) persists from r≈0.5 to large r → SIGNAL")
print("Small loops appear and disappear quickly → NOISE")
Key observation: The main loop (H₁) persists from r≈0.5 to large r → SIGNAL
Small loops appear and disappear quickly → NOISE
3. Persistent Homology¶
Formal Definition: Persistence Module¶
Given a filtration: $$ \emptyset = X_0 \subseteq X_1 \subseteq X_2 \subseteq \cdots \subseteq X_n $$
The persistence module is a sequence of homology groups with homomorphisms: $$ H_k(X_0) \xrightarrow{f_0} H_k(X_1) \xrightarrow{f_1} H_k(X_2) \xrightarrow{f_2} \cdots \xrightarrow{f_{n-1}} H_k(X_n) $$
where:
- $H_k(X_i)$ is the $k$-th homology group of the space $X_i$ (taken with coefficients in some field, typically $\mathbb{Z}_2$)
- $f_i: H_k(X_i) \to H_k(X_{i+1})$ are homomorphisms induced by inclusion $X_i \subseteq X_{i+1}$
Structure Theorem¶
By the Structure Theorem for persistence modules, any persistence module can be decomposed as: $$ M \cong \bigoplus_i I_{[b_i, d_i)} $$
where $I_{[b, d)}$ is an interval module (non-zero on $[b, d)$, zero outside).
Each interval $[b_i, d_i)$ corresponds to a topological feature born at $b_i$ and dying at $d_i$.
4. Persistence Diagrams & Barcodes¶
The results of persistent homology are visualized using two equivalent representations:
4.1 Barcodes¶
A barcode is a collection of intervals $[birth, death)$ visualized as horizontal bars.
Structure:¶
- Each horizontal bar represents one topological feature
- Left endpoint = birth time
- Right endpoint = death time
- Length of bar = persistence (death - birth)
Interpretation:¶
- Long bars → significant features (signal)
- Short bars → insignificant features (noise)
# Example: Create a barcode visualization
def plot_barcode(ax, intervals, title, dimension):
    # Sort by birth time
    intervals_sorted = sorted(intervals, key=lambda x: x[0])
    for idx, (birth, death) in enumerate(intervals_sorted):
        if death == np.inf:
            # Essential feature - draw arrow
            ax.arrow(birth, idx, 2.5, 0, head_width=0.15, head_length=0.1,
                     fc='red', ec='red', linewidth=2)
            ax.plot([birth, birth + 2.5], [idx, idx], 'r-', linewidth=3)
        else:
            # Regular feature
            persistence = death - birth
            color = 'darkblue' if persistence > 0.3 else 'lightgray'
            linewidth = 3 if persistence > 0.3 else 1.5
            ax.plot([birth, death], [idx, idx], color=color, linewidth=linewidth)
    ax.set_xlabel('Filtration Parameter (scale)', fontsize=12)
    ax.set_ylabel('Features', fontsize=12)
    ax.set_title(f'{title}\n{dimension}', fontsize=14, fontweight='bold')
    ax.grid(True, alpha=0.3, axis='x')
    ax.set_ylim(-1, len(intervals))
    # Add legend
    from matplotlib.lines import Line2D
    legend_elements = [
        Line2D([0], [0], color='darkblue', linewidth=3, label='Signal (long-lived)'),
        Line2D([0], [0], color='lightgray', linewidth=1.5, label='Noise (short-lived)'),
        Line2D([0], [0], color='red', linewidth=3, label='Essential (death = ∞)')
    ]
    ax.legend(handles=legend_elements, loc='upper right')

# Example data: H₀ (connected components)
h0_intervals = [
    (0.0, np.inf),  # Essential: main component
    (0.0, 0.25),    # Components merge
    (0.0, 0.30),
    (0.0, 0.35),
    (0.0, 0.40),
    (0.0, 0.45),
    (0.0, 0.50),
]
# Example data: H₁ (loops)
h1_intervals = [
    (0.48, 1.80),  # Main loop (SIGNAL)
    (0.25, 0.35),  # Noise
    (0.30, 0.38),  # Noise
    (0.52, 0.61),  # Noise
    (0.45, 0.53),  # Noise
    (0.70, 0.82),  # Small loop
]
# Create subplots with two columns
fig, axes = plt.subplots(1, 2, figsize=(12, 6))
# Plot H₀ barcode on the first axis (left)
plot_barcode(axes[0], h0_intervals, 'Barcode', 'H₀ (Connected Components)')
# Plot H₁ barcode on the second axis (right)
plot_barcode(axes[1], h1_intervals, 'Barcode', 'H₁ (Loops/Holes)')
# Adjust layout for better spacing
plt.tight_layout()
plt.show()
4.2 Persistence Diagrams¶
A persistence diagram is a multiset of points $(b, d)$ in the plane.
Structure:¶
- Each point $(b, d)$ represents a feature born at time $b$ and dying at time $d$
- The $x$-axis represents birth times
- The $y$-axis represents death times
- All points lie above or on the diagonal $y = x$ (since death ≥ birth)
The Diagonal: The line $y = x$
- Represents features with zero persistence (birth = death)
- Points near the diagonal → noise
- Distance from diagonal = persistence
Essential Features: Points with $death = \infty$
- Features that never die in the filtration
- Often represent true topological structure
# Create persistence diagram visualization
def plot_persistence_diagram(ax, points, title, dimension):
    # Separate finite and infinite death times
    finite_points = [(b, d) for b, d in points if d != np.inf]
    essential_points = [(b, d) for b, d in points if d == np.inf]
    # Plot diagonal
    max_val = max([d for b, d in finite_points] + [b for b, d in finite_points]) if finite_points else 2.0
    diag_line = np.linspace(0, max_val * 1.1, 100)
    ax.plot(diag_line, diag_line, 'k--', linewidth=2, label='Diagonal (y=x)', alpha=0.5)
    # Plot finite points
    if finite_points:
        births = [b for b, d in finite_points]
        deaths = [d for b, d in finite_points]
        persistences = [d - b for b, d in finite_points]
        # Color by persistence
        colors = ['red' if p > 0.3 else 'lightblue' for p in persistences]
        sizes = [200 if p > 0.3 else 50 for p in persistences]
        for b, d, c, s in zip(births, deaths, colors, sizes):
            ax.scatter(b, d, c=c, s=s, alpha=0.7, edgecolors='black', linewidth=1)
    # Plot essential points (at top of diagram)
    if essential_points:
        essential_births = [b for b, d in essential_points]
        essential_y = [max_val * 1.05] * len(essential_births)  # Place near top
        ax.scatter(essential_births, essential_y, c='darkred', s=300,
                   marker='^', label='Essential (death = ∞)',
                   edgecolors='black', linewidth=2)
    ax.set_xlabel('Birth', fontsize=13)
    ax.set_ylabel('Death', fontsize=13)
    ax.set_title(f'{title}\n{dimension}', fontsize=14, fontweight='bold')
    ax.grid(True, alpha=0.3)
    ax.set_aspect('equal')
    # Add legend
    from matplotlib.lines import Line2D
    legend_elements = [
        Line2D([0], [0], marker='o', color='w', markerfacecolor='red',
               markersize=12, label='Signal (far from diagonal)'),
        Line2D([0], [0], marker='o', color='w', markerfacecolor='lightblue',
               markersize=8, label='Noise (near diagonal)'),
        Line2D([0], [0], color='k', linestyle='--', linewidth=2, label='Diagonal (y=x)')
    ]
    if essential_points:
        legend_elements.append(
            Line2D([0], [0], marker='^', color='w', markerfacecolor='darkred',
                   markersize=12, label='Essential (death = ∞)')
        )
    ax.legend(handles=legend_elements, loc='lower right', fontsize=10)

# Create subplots with two columns
fig, axes = plt.subplots(1, 2, figsize=(12, 6))
# Plot H₀ persistence diagram on the first axis (left)
plot_persistence_diagram(axes[0], h0_intervals, 'Persistence Diagram', 'H₀ (Connected Components)')
# Plot H₁ persistence diagram on the second axis (right)
plot_persistence_diagram(axes[1], h1_intervals, 'Persistence Diagram', 'H₁ (Loops/Holes)')
# Adjust layout for better spacing
plt.tight_layout()
plt.show()
Interpreting Persistence Diagrams¶
Distance from diagonal = persistence = death - birth
For a point $(b, d)$:
- Perpendicular distance to diagonal: $\frac{d - b}{\sqrt{2}}$
- Larger distance → more significant feature
Key observations:
- Points clustered near diagonal → noise
- Points far from diagonal → topological signal
- Essential features (triangles at top) → persistent structure
- Empty regions → no features with those birth/death times
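A quick numerical check of the distance-to-diagonal formula, using the "main loop" point from the example data above:

```python
import numpy as np

b, d = 0.48, 1.80                 # birth/death of the main H1 loop in the example
p = np.array([b, d])
foot = np.array([(b + d) / 2, (b + d) / 2])   # closest point on the line y = x
dist = np.linalg.norm(p - foot)
# Perpendicular distance to the diagonal equals (d - b) / sqrt(2)
assert np.isclose(dist, (d - b) / np.sqrt(2))
print(dist)
```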
Equivalence of Representations¶
Barcodes and persistence diagrams contain the same information:
- Barcode $[b, d)$ ↔ Diagram point $(b, d)$
- Choice depends on application
- Barcodes: Better for visualizing temporal evolution
- Diagrams: Better for computing distances between datasets
# Side-by-side comparison
def compare_representations(intervals, dimension):
    fig = plt.figure(figsize=(18, 6))
    # Barcode (left)
    ax1 = plt.subplot(1, 2, 1)
    intervals_sorted = sorted([i for i in intervals if i[1] != np.inf], key=lambda x: x[0])
    for idx, (birth, death) in enumerate(intervals_sorted):
        persistence = death - birth
        color = 'darkblue' if persistence > 0.3 else 'lightgray'
        linewidth = 3 if persistence > 0.3 else 1.5
        ax1.plot([birth, death], [idx, idx], color=color, linewidth=linewidth)
    ax1.set_xlabel('Filtration Parameter', fontsize=12)
    ax1.set_ylabel('Features', fontsize=12)
    ax1.set_title(f'Barcode - {dimension}', fontsize=13, fontweight='bold')
    ax1.grid(True, alpha=0.3, axis='x')
    # Persistence diagram (right)
    ax2 = plt.subplot(1, 2, 2)
    finite_points = [(b, d) for b, d in intervals if d != np.inf]
    if finite_points:
        births = [b for b, d in finite_points]
        deaths = [d for b, d in finite_points]
        persistences = [d - b for b, d in finite_points]
        max_val = max(deaths + births)
        diag_line = np.linspace(0, max_val * 1.1, 100)
        ax2.plot(diag_line, diag_line, 'k--', linewidth=2, alpha=0.5)
        colors = ['red' if p > 0.3 else 'lightblue' for p in persistences]
        sizes = [200 if p > 0.3 else 50 for p in persistences]
        for b, d, c, s in zip(births, deaths, colors, sizes):
            ax2.scatter(b, d, c=c, s=s, alpha=0.7, edgecolors='black', linewidth=1)
    ax2.set_xlabel('Birth', fontsize=12)
    ax2.set_ylabel('Death', fontsize=12)
    ax2.set_title(f'Persistence Diagram - {dimension}', fontsize=13, fontweight='bold')
    ax2.grid(True, alpha=0.3)
    ax2.set_aspect('equal')
    plt.suptitle('Two Equivalent Representations of the Same Topological Information',
                 fontsize=15, fontweight='bold', y=1.02)
    plt.tight_layout()
    plt.show()

compare_representations(h1_intervals, 'H₁')
5.2 Bottleneck Distance¶
The bottleneck distance is the standard metric for comparing persistence diagrams.
Definition¶
Given two persistence diagrams $D_1$ and $D_2$, the bottleneck distance is:
$$d_B(D_1, D_2) = \inf_{\gamma} \sup_{p \in D_1} \|p - \gamma(p)\|_\infty$$
where:
- $\gamma$ ranges over all bijections between $D_1 \cup \Delta$ and $D_2 \cup \Delta$
- $\Delta$ is the diagonal (points with birth = death)
- $\|\cdot\|_\infty$ is the supremum norm: $\|(b_1, d_1) - (b_2, d_2)\|_\infty = \max\{|b_1 - b_2|, |d_1 - d_2|\}$
Intuition¶
The bottleneck distance finds the best matching between points in two diagrams, where:
- Each point in $D_1$ is matched to exactly one point in $D_2$ or to the diagonal
- The distance is determined by the worst (maximum) matching cost
- Points can be matched to the diagonal, representing creation or destruction of features
Example: Computing Bottleneck Distance¶
Consider two simple persistence diagrams:
- $D_1 = \{(1, 4), (2, 5)\}$
- $D_2 = \{(1.2, 4.1), (2.1, 4.9)\}$
Matching 1: $(1,4) \leftrightarrow (1.2, 4.1)$ and $(2,5) \leftrightarrow (2.1, 4.9)$
$$\text{Cost}_1 = \max\{0.2, 0.1\} = 0.2$$ $$\text{Cost}_2 = \max\{0.1, 0.1\} = 0.1$$ $$d_B = \max\{0.2, 0.1\} = 0.2$$
This matching is optimal here, so $d_B(D_1, D_2) = 0.2$.
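Optimality can be verified by brute force over all partial matchings, which is feasible only for tiny diagrams (the helper name `bottleneck_brute` is mine, not from the notebook):

```python
import numpy as np
from itertools import combinations, permutations

def bottleneck_brute(D1, D2):
    """Exhaustive bottleneck distance for tiny diagrams: each point is
    matched either to a point of the other diagram or to the diagonal."""
    cost = lambda p, q: max(abs(p[0] - q[0]), abs(p[1] - q[1]))
    diag = lambda p: (p[1] - p[0]) / 2   # sup-norm distance to the diagonal
    best = np.inf
    # choose k points of D1 to match into D2; the rest go to the diagonal
    for k in range(min(len(D1), len(D2)) + 1):
        for idx1 in combinations(range(len(D1)), k):
            for idx2 in permutations(range(len(D2)), k):
                c = max([cost(D1[i], D2[j]) for i, j in zip(idx1, idx2)] +
                        [diag(D1[i]) for i in range(len(D1)) if i not in idx1] +
                        [diag(D2[j]) for j in range(len(D2)) if j not in idx2] +
                        [0.0])
                best = min(best, c)
    return best

D1 = [(1, 4), (2, 5)]
D2 = [(1.2, 4.1), (2.1, 4.9)]
print(bottleneck_brute(D1, D2))  # ≈ 0.2, the matching worked out above
```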
import numpy as np
import matplotlib.pyplot as plt
# Visualize two persistence diagrams
D1 = np.array([[1, 4], [2, 5]])
D2 = np.array([[1.2, 4.1], [2.1, 4.9]])
fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(12, 5))
# Plot D1
ax1.scatter(D1[:, 0], D1[:, 1], s=100, c='blue', marker='o', label='D1')
ax1.plot([0, 6], [0, 6], 'k--', alpha=0.3, label='Diagonal')
ax1.set_xlabel('Birth', fontsize=12)
ax1.set_ylabel('Death', fontsize=12)
ax1.set_title('Persistence Diagram D1', fontsize=14)
ax1.legend()
ax1.grid(True, alpha=0.3)
ax1.set_aspect('equal')
# Plot D2
ax2.scatter(D2[:, 0], D2[:, 1], s=100, c='red', marker='s', label='D2')
ax2.plot([0, 6], [0, 6], 'k--', alpha=0.3, label='Diagonal')
ax2.set_xlabel('Birth', fontsize=12)
ax2.set_ylabel('Death', fontsize=12)
ax2.set_title('Persistence Diagram D2', fontsize=14)
ax2.legend()
ax2.grid(True, alpha=0.3)
ax2.set_aspect('equal')
plt.tight_layout()
plt.show()
5.3 Wasserstein Distance¶
The Wasserstein distance (also called Earth Mover's Distance) is a generalization of the bottleneck distance.
Definition¶
The $p$-Wasserstein distance between persistence diagrams $D_1$ and $D_2$ is:
$$W_p(D_1, D_2) = \left(\inf_{\gamma} \sum_{x \in D_1 \cup \Delta} \|x - \gamma(x)\|_\infty^p\right)^{1/p}$$
where $p \geq 1$ and $\gamma$ ranges over all bijections as before.
Special Cases¶
- $p = 1$: Total cost of optimal matching
- $p = 2$: Commonly used in machine learning applications
- $p \to \infty$: Recovers the bottleneck distance
$$d_B(D_1, D_2) = \lim_{p \to \infty} W_p(D_1, D_2)$$
Example: Wasserstein vs Bottleneck¶
Consider:
- $D_1 = \{(1, 3), (2, 4), (3, 5)\}$
- $D_2 = \{(1.1, 3.1), (2.1, 4.1), (3.1, 5.1)\}$
With optimal matching:
Bottleneck: $d_B = 0.1$ (maximum individual cost)
1-Wasserstein: $W_1 = 0.1 + 0.1 + 0.1 = 0.3$ (sum of costs)
2-Wasserstein: $W_2 = \sqrt{0.1^2 + 0.1^2 + 0.1^2} = \sqrt{0.03} \approx 0.173$
# Demonstrate difference between Bottleneck and Wasserstein
def compute_wasserstein_p(D1, D2, p):
    """Simple computation assuming the optimal matching is the identity"""
    if len(D1) != len(D2):
        raise ValueError("Diagrams must have same size for this example")
    costs = np.max(np.abs(D1 - D2), axis=1)  # L-infinity norm per matched pair
    if p == np.inf:
        return np.max(costs)
    else:
        return np.power(np.sum(np.power(costs, p)), 1/p)

# Example diagrams
D1 = np.array([[1, 3], [2, 4], [3, 5]])
D2 = np.array([[1.1, 3.1], [2.1, 4.1], [3.1, 5.1]])
print("Distance comparisons:")
print(f"Bottleneck (p=∞): {compute_wasserstein_p(D1, D2, np.inf):.4f}")
print(f"1-Wasserstein: {compute_wasserstein_p(D1, D2, 1):.4f}")
print(f"2-Wasserstein: {compute_wasserstein_p(D1, D2, 2):.4f}")
print(f"5-Wasserstein: {compute_wasserstein_p(D1, D2, 5):.4f}")
Distance comparisons:
Bottleneck (p=∞): 0.1000
1-Wasserstein: 0.3000
2-Wasserstein: 0.1732
5-Wasserstein: 0.1246
5.4 Stability Theorem¶
The stability theorem is the key theoretical justification for using persistent homology in data analysis.
Statement¶
Let $f, g: X \to \mathbb{R}$ be two continuous functions on a topological space $X$. Let $D_f$ and $D_g$ be their persistence diagrams obtained from sublevel-sets filtrations given by $f$ and $g$. Then:
$$d_B(D_f, D_g) \leq \|f - g\|_\infty$$
where $\|f - g\|_\infty = \sup_{x \in X} |f(x) - g(x)|$ is the uniform distance between functions.
Interpretation¶
This theorem tells us that:
- Small perturbations in the input function lead to small changes in the persistence diagram
- The bottleneck distance between diagrams is bounded by the maximum pointwise difference in functions
- Persistent homology is robust to noise in the data
Practical Implications¶
Noise tolerance: If we add noise $\epsilon$ to our data, features in the persistence diagram can move by at most $\epsilon$.
Feature reliability: Features that persist much longer than the noise level are reliable.
Sampling: When approximating a continuous space with a finite sample, the persistence diagram changes predictably.
Example: Noisy Circle¶
Consider a circle sampled with noise:
- Clean circle: Shows one persistent $H_1$ feature (the loop)
- Noisy circle: The main loop persists, but many small features appear and die quickly
- Stability: The main feature moves slightly, but remains distinguishable
# Demonstrate stability with noisy data
def generate_circle(n_points, radius=1, noise_level=0):
    """Generate points on a circle with optional noise"""
    theta = np.linspace(0, 2*np.pi, n_points, endpoint=False)
    x = radius * np.cos(theta)
    y = radius * np.sin(theta)
    if noise_level > 0:
        x += np.random.normal(0, noise_level, n_points)
        y += np.random.normal(0, noise_level, n_points)
    return np.column_stack([x, y])

# Generate clean and noisy circles
np.random.seed(42)
circle_clean = generate_circle(50, radius=1, noise_level=0)
circle_noisy = generate_circle(50, radius=1, noise_level=0.1)
fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(12, 5))
# Plot clean circle
ax1.scatter(circle_clean[:, 0], circle_clean[:, 1], s=50, c='blue', alpha=0.6)
ax1.set_xlabel('x', fontsize=12)
ax1.set_ylabel('y', fontsize=12)
ax1.set_title('Clean Circle', fontsize=14)
ax1.set_aspect('equal')
ax1.grid(True, alpha=0.3)
# Plot noisy circle
ax2.scatter(circle_noisy[:, 0], circle_noisy[:, 1], s=50, c='red', alpha=0.6)
ax2.set_xlabel('x', fontsize=12)
ax2.set_ylabel('y', fontsize=12)
ax2.set_title('Noisy Circle (noise = 0.1)', fontsize=14)
ax2.set_aspect('equal')
ax2.grid(True, alpha=0.3)
plt.tight_layout()
plt.show()
print("Expected behavior:")
print("- Both should show one persistent H1 feature (the loop)")
print("- Noisy version will have many short-lived features")
print("- Main loop feature persists and is stable (moves by ≤ noise level)")
Expected behavior:
- Both should show one persistent H1 feature (the loop)
- Noisy version will have many short-lived features
- Main loop feature persists and is stable (moves by ≤ noise level)
Extended Stability Results¶
The stability theorem extends to:
- Wasserstein distances: Similar bounds hold for $W_p$ distances
- Different filtrations: Rips, Čech, alpha complexes all satisfy stability
- Distance functions: The distance function $d_A(x) = \inf_{a \in A} d(x, a)$ satisfies stability under Hausdorff perturbations
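The distance-function statement can be checked numerically (a sketch with synthetic sets; the helper name `dist_to_set` is mine): perturbing $A$ within Hausdorff distance $\delta$ changes $d_A$ by at most $\delta$ in the sup norm.

```python
import numpy as np
from scipy.spatial.distance import cdist

def dist_to_set(X, A):
    """Distance function d_A(x) = min_{a in A} d(x, a), evaluated at rows of X."""
    return cdist(X, A).min(axis=1)

A = np.array([[0.0, 0.0], [1.0, 0.0]])
B = A + 0.05                      # small perturbation of A
X = np.random.default_rng(1).uniform(-1, 2, size=(500, 2))
# Hausdorff distance between the two finite sets
hausdorff = max(cdist(A, B).min(axis=1).max(), cdist(B, A).min(axis=1).max())
# Stability of distance functions: ||d_A - d_B||_inf <= d_H(A, B)
assert np.abs(dist_to_set(X, A) - dist_to_set(X, B)).max() <= hausdorff + 1e-12
```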
The Boundary Matrix¶
For a filtered simplicial complex $K_1 \subseteq K_2 \subseteq \cdots \subseteq K_n$, we consider simplices ordered by their filtration time.
The boundary matrix $\partial$ has both rows and columns indexed by the simplices (in filtration order), with entry 1 when the row simplex is a codimension-1 face of the column simplex.
For simplicity, all arithmetic is mod 2 (we take coefficients in $\mathbb{Z}_2$).
Matrix Reduction Algorithm¶
Goal: Reduce the boundary matrix to a form where we can read off birth-death pairs.
Algorithm (Standard Reduction):
- Order simplices by filtration value (ties broken arbitrarily, except that faces must precede cofaces)
- Initialize: $R = \partial$ (boundary matrix)
- For each column $j$ from left to right:
  - While column $j$ is non-zero and has the same lowest 1 as some previous column $i < j$: add column $i$ to column $j$ (mod 2)
  - Record the lowest 1 position of column $j$ (if any remains)
Result: In the reduced matrix $R$, no two non-zero columns have their lowest 1 in the same row.
Reading Birth-Death Pairs¶
After reduction:
- Birth: A simplex $\sigma$ creates a feature if its column in the reduced matrix $R$ is zero
- Death: A simplex $\tau$ kills the feature created by $\sigma$ if $\tau$'s column (after reduction) has its lowest 1 in $\sigma$'s row
Example: Computing $H_0$ and $H_1$ for a Triangle¶
Consider building a triangle with filtration:
- Time 0: vertices $\{a, b, c\}$
- Time 1: edges $\{ab, bc, ca\}$
- Time 2: triangle $\{abc\}$
Step 1: List simplices in filtration order
| Index | Simplex | Dimension | Filtration time |
|---|---|---|---|
| 0 | $a$ | 0 | 0 |
| 1 | $b$ | 0 | 0 |
| 2 | $c$ | 0 | 0 |
| 3 | $ab$ | 1 | 1 |
| 4 | $bc$ | 1 | 1 |
| 5 | $ca$ | 1 | 1 |
| 6 | $abc$ | 2 | 2 |
Step 2: Construct boundary matrix
Columns = simplices, Rows = faces (using mod 2 arithmetic)
$$\partial = \begin{pmatrix} & a & b & c & ab & bc & ca & abc \\ a & 0 & 0 & 0 & 1 & 0 & 1 & 0 \\ b & 0 & 0 & 0 & 1 & 1 & 0 & 0 \\ c & 0 & 0 & 0 & 0 & 1 & 1 & 0 \\ ab & 0 & 0 & 0 & 0 & 0 & 0 & 1 \\ bc & 0 & 0 & 0 & 0 & 0 & 0 & 1 \\ ca & 0 & 0 & 0 & 0 & 0 & 0 & 1 \end{pmatrix}$$
The first three columns (vertices) are empty since vertices have no boundary.
Step 3: Reduce the matrix
Process columns left to right:
- Columns 0,1,2 (vertices): already empty, no action needed
- Column 3 ($ab$): boundary $(1,1,0)$ on rows $(a,b,c)$; lowest 1 at row $b$ (index 1)
- Column 4 ($bc$): boundary $(0,1,1)$; lowest 1 at row $c$ (index 2)
- Column 5 ($ca$): boundary $(1,0,1)$; lowest 1 at row $c$ (index 2), same as column 4: CONFLICT!
  - Add column 4 to column 5: $(1,0,1) + (0,1,1) = (1,1,0)$
  - New lowest 1 at row $b$ (index 1), same as column 3: CONFLICT!
  - Add column 3 to column 5: $(1,1,0) + (1,1,0) = (0,0,0)$
  - Column 5 is now zero: adding the edge $ca$ creates a 1-cycle
After processing the edges, the reduced edge columns are:
$$\begin{pmatrix} & ab & bc & ca \\ a & 1 & 0 & 0 \\ b & 1 & 1 & 0 \\ c & 0 & 1 & 0 \end{pmatrix}$$
- Column 6 ($abc$): boundary $(1,1,1)$ on rows $(ab, bc, ca)$; its lowest 1 is at row $ca$ (index 5), which no earlier column owns, so no reduction is needed
Step 4: Extract persistence pairs
For $H_0$ (connected components):
- Simplex $a$ (index 0): column empty → birth at time 0
- Simplex $b$ (index 1): column empty → birth at time 0
- Simplex $c$ (index 2): column empty → birth at time 0
- Simplex $ab$ (index 3): lowest 1 at row $b$ → kills $b$ at time 1
- Simplex $bc$ (index 4): lowest 1 at row $c$ → kills $c$ at time 1
Persistence pairs for $H_0$:
- $(b, ab)$: birth 0, death 1 → (0, 1)
- $(c, bc)$: birth 0, death 1 → (0, 1)
- $a$ is never killed → (0, ∞) (essential feature)
For $H_1$ (loops):
- Edge $ca$ (index 5): its reduced column is zero, so adding $ca$ creates a 1-cycle (the loop $ab + bc + ca$), born at time 1
- Triangle $abc$ (index 6): its column has lowest 1 at row $ca$, so $abc$ fills the loop created by $ca$ at time 2
- Persistence pair for $H_1$: $(ca, abc)$, i.e. birth 1, death 2 → (1, 2)
Summary of Algorithm¶
- Build boundary matrix from filtered complex
- Reduce matrix using column operations (mod 2)
- Extract pairs:
- Empty columns → birth of feature
- Lowest 1 in row $i$ of column $j$ → simplex $j$ kills feature born at simplex $i$
- Persistence diagram: plot (birth, death) pairs
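The steps above can be sketched in a few lines of NumPy and checked against the triangle example (a minimal illustration of the standard reduction over $\mathbb{Z}_2$, not an optimized implementation):

```python
import numpy as np

def low(col):
    """Row index of the lowest 1 in a column, or -1 if the column is zero."""
    nz = np.flatnonzero(col)
    return int(nz[-1]) if len(nz) else -1

def reduce_and_pair(D, times):
    """Standard column reduction over Z/2 followed by pair extraction.
    D: (n x n) 0/1 boundary matrix, simplices ordered by filtration time.
    Returns (finite (birth, death) pairs, birth times of essential features)."""
    R = D.copy() % 2
    owner = {}                                  # lowest-1 row -> owning column
    for j in range(R.shape[1]):
        while low(R[:, j]) != -1 and low(R[:, j]) in owner:
            R[:, j] = (R[:, j] + R[:, owner[low(R[:, j])]]) % 2
        if low(R[:, j]) != -1:
            owner[low(R[:, j])] = j
    pairs, paired = [], set()
    for j in range(R.shape[1]):
        i = low(R[:, j])
        if i != -1:
            pairs.append((times[i], times[j]))
            paired.update((i, j))
    # zero columns that are never killed correspond to essential features
    essential = [times[j] for j in range(R.shape[1]) if j not in paired]
    return pairs, essential

# Triangle example: simplices a, b, c, ab, bc, ca, abc in filtration order
D = np.zeros((7, 7), dtype=int)
D[[0, 1], 3] = 1      # boundary of ab
D[[1, 2], 4] = 1      # boundary of bc
D[[0, 2], 5] = 1      # boundary of ca
D[[3, 4, 5], 6] = 1   # boundary of abc
pairs, essential = reduce_and_pair(D, times=[0, 0, 0, 1, 1, 1, 2])
print(pairs)      # [(0, 1), (0, 1), (1, 2)]: two H0 pairs and the H1 pair
print(essential)  # [0]: the surviving connected component
```

The output reproduces the worked example: two $H_0$ pairs (0, 1), one essential component born at 0, and the $H_1$ pair (1, 2).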
6.2 Computational Complexity¶
Bottlenecks¶
The complexity of persistent homology computation is dominated by:
- Filtration size: Number of simplices in the complex
- Matrix reduction: Can be $O(n^3)$ in worst case, where $n$ is the number of simplices
Rips Complex Growth¶
For a point cloud with $N$ points, the Vietoris-Rips complex at dimension $d$ can have:
$$\text{Number of simplices up to dimension } d \sim O\left(N^{d+1}\right)$$
This growth, polynomial in $N$ but exponential in $d$, makes computation expensive for:
- Large point clouds ($N > 1000$)
- High dimensions ($d > 3$)
- Dense point clouds
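The bound above is easy to tabulate; a small helper (illustrative only) shows how quickly it grows with $N$:

```python
from math import comb

def rips_simplex_bound(N, d):
    """Upper bound on the number of simplices of dimension <= d in a
    Vietoris-Rips complex on N points: every (k+1)-subset of points
    appears once the scale parameter is large enough."""
    return sum(comb(N, k + 1) for k in range(d + 1))

print(rips_simplex_bound(50, 2))    # 50 + 1225 + 19600 = 20875
print(rips_simplex_bound(1000, 2))  # 166667500: over 166 million simplices
```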
Practical Strategies¶
- Subsample large point clouds
- Limit maximum dimension (usually $d \leq 2$ suffices)
- Bound filtration parameter (maximum edge length)
- Use sparse representations
- Apply cohomology algorithms (dual computation)
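The first strategy, subsampling, is often done greedily so the sample covers the cloud evenly. A minimal farthest-point (maxmin) sketch, assuming only NumPy:

```python
import numpy as np

def maxmin_subsample(points, k, seed=0):
    """Greedy farthest-point subsampling: starting from a random point,
    repeatedly add the point farthest from the current sample. The result
    covers the cloud more evenly than uniform random subsampling."""
    points = np.asarray(points, dtype=float)
    rng = np.random.default_rng(seed)
    chosen = [int(rng.integers(len(points)))]
    dist = np.linalg.norm(points - points[chosen[0]], axis=1)
    for _ in range(k - 1):
        nxt = int(np.argmax(dist))          # farthest point from the sample
        chosen.append(nxt)
        dist = np.minimum(dist, np.linalg.norm(points - points[nxt], axis=1))
    return points[chosen]

# Reduce a 500-point cloud to 20 well-spread landmarks
cloud = np.random.default_rng(1).normal(size=(500, 2))
landmarks = maxmin_subsample(cloud, 20)
print(landmarks.shape)  # (20, 2)
```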
7. Interpretation & Usage¶
Signal vs. Noise Separation¶
Key Principle: Persistent features = signal, short-lived features = noise
Persistence as a Filter:
- Long persistence → topological feature survives across many scales → likely real structure
- Short persistence → feature appears and disappears quickly → likely noise
Quantitative threshold: $$\text{Keep feature } (b, d) \text{ if } |d - b| > \tau$$
where $\tau$ is a chosen persistence threshold.
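Applied to a diagram stored as an array of (birth, death) rows, the thresholding rule is a one-liner (a sketch; the right $\tau$ is data-dependent):

```python
import numpy as np

def filter_diagram(diagram, tau):
    """Keep only the (birth, death) points whose persistence exceeds tau."""
    diagram = np.asarray(diagram, dtype=float)
    return diagram[diagram[:, 1] - diagram[:, 0] > tau]

noisy = [[0.0, 1.0], [0.2, 0.25], [0.5, 0.52]]
print(filter_diagram(noisy, 0.1))  # only the long-lived feature (0, 1) survives
```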
Topological Features for Data Analysis¶
1. Vectorization of Persistence Diagrams
Since machine learning algorithms typically require fixed-dimensional feature vectors, we convert persistence diagrams:
A. Persistence Statistics: $$\text{features} = \{\max(p_i), \text{mean}(p_i), \sum p_i^2, \ldots\}$$ where $p_i = d_i - b_i$ is persistence.
B. Persistence Images: Convert diagram to a 2D grid with Gaussian weighting: $$\rho(x,y) = \sum_{(b_i,d_i) \in D} w(d_i - b_i) \cdot \mathcal{N}((x,y) | (b_i, d_i), \Sigma)$$
where $w(p) = p$ weights by persistence.
C. Persistence Landscapes: Piecewise-linear functions capturing diagram structure: $$\lambda_k(t) = k\text{-th largest value of } \min(t - b_i, d_i - t)_+$$ where $(x)_+ = \max(x, 0)$.
D. Betti Curves: $$\beta_k(t) = \text{rank}(H_k(K_t))$$ counts features alive at scale $t$.
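Of the four vectorizations, the Betti curve is the simplest to implement directly from a diagram (a minimal sketch; real pipelines would typically use a library such as `gudhi`):

```python
import numpy as np

def betti_curve(diagram, ts):
    """Number of (birth, death) intervals alive at each scale t
    (birth <= t < death), evaluated on a grid ts."""
    diagram = np.asarray(diagram, dtype=float)
    return np.array([int(np.sum((diagram[:, 0] <= t) & (t < diagram[:, 1])))
                     for t in ts])

# Two intervals: one born at 0, one at 1; both eventually die
print(betti_curve([[0, 2], [1, 3]], [0.5, 1.5, 2.5]))  # [1 2 1]
```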
2. Feature Extraction Pipeline
Raw Data → Filtration → Persistence Diagram → Vectorization → ML Algorithm
↓ ↓ ↓ ↓ ↓
Points Simplicial Birth-Death Feature Vector Classification/
Complex Pairs (fixed-dim) Regression
Practical Use Cases¶
Example 1: Texture Classification
Given images of different materials:
- Compute sublevel set filtration on pixel intensities
- Extract persistence diagrams for $H_0$ and $H_1$
- Features distinguish:
- $H_0$: blob-like structures (bright regions)
- $H_1$: holes and voids (dark regions)
- Train classifier on persistence features
Result: Topological features capture texture patterns independent of exact pixel positions.
Example 2: Time Series Analysis
For a periodic signal (e.g., heartbeat ECG):
- Takens embedding: Convert time series to point cloud $$\mathbf{x}_i = (s_i, s_{i+\tau}, s_{i+2\tau}, \ldots, s_{i+(d-1)\tau})$$
- Build Rips complex on embedded points
- Compute persistence:
- Periodic signals → prominent $H_1$ feature (closed loop in embedding)
- Noise → many short-lived features
- Detect anomalies: Changes in $H_1$ persistence indicate irregularities
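The Takens embedding itself is a short sliding-window construction; a pure-NumPy sketch (`dim` and `delay` are illustrative parameter names, not from a library):

```python
import numpy as np

def takens_embedding(signal, dim, delay):
    """Delay embedding: x_i = (s_i, s_{i+delay}, ..., s_{i+(dim-1)*delay}).
    A periodic signal traces out a closed loop in the embedded space,
    which shows up as a prominent H1 feature."""
    signal = np.asarray(signal, dtype=float)
    n = len(signal) - (dim - 1) * delay      # number of embedded points
    return np.stack([signal[i:i + n] for i in range(0, dim * delay, delay)],
                    axis=1)

# A sine wave embedded in 2D traces out (roughly) a circle
s = np.sin(np.linspace(0, 4 * np.pi, 100))
cloud = takens_embedding(s, dim=2, delay=12)
print(cloud.shape)  # (88, 2)
```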
Summary: Why Persistent Homology Works¶
Theoretical guarantees:
- Stability theorem: Small data perturbations → small diagram changes
- Completeness: Captures all homological features across all scales
- Well-defined metrics: Bottleneck and Wasserstein distances
Practical advantages:
- Noise filtering: Persistence distinguishes structure from noise
- Feature extraction: Provides interpretable topological descriptors
- Generalization: Works across diverse data types and applications
- Robustness: Inherently stable to small perturbations
The persistence paradigm:
"Features that persist across scales are more likely to represent genuine structure than noise."
This simple principle, backed by rigorous mathematical theory, makes persistent homology a powerful tool for modern data analysis.
Comparison: Traditional vs. Topological Features¶
| Aspect | Traditional Features | Topological Features |
|---|---|---|
| Invariance | Often coordinate-dependent | Coordinate-free |
| Noise | Sensitive to outliers | Stable by design |
| Scale | Single scale or fixed scales | Multi-scale automatically |
| Interpretation | Domain-specific | Geometric/topological |
| Computation | Often fast | Can be expensive |
| Applicability | Dataset-specific | General purpose |
Best practice: Combine both types of features for optimal performance!
Further Reading¶
Foundational papers:
- Edelsbrunner et al. (2002): "Topological Persistence and Simplification"
- Carlsson (2009): "Topology and Data" (survey paper)
- Cohen-Steiner et al. (2007): "Stability of Persistence Diagrams"
Programming tasks¶
Task 1: Persistence Diagrams for Shape Analysis of Point Clouds¶
Write a Python program that uses persistence diagrams to analyze the shape of point clouds in space.
Background:¶
Persistent homology is a method from topological data analysis that tracks topological features (connected components, holes, voids) across multiple scales. A persistence diagram visualizes these features by plotting their birth and death times during a filtration process. Features that persist longer are considered more significant to the underlying shape.
Input:¶
- The first line contains an integer $n$, the number of points.
- The next line contains a single character: `2` for 2D points or `3` for 3D points.
- The last $n$ lines each contain the coordinates of a point (space-separated floats).
Output:¶
- First, print the number of persistent features found in dimension 0 (connected components).
- Then, print the number of persistent features found in dimension 1 (loops/holes).
- For each dimension (0, then 1), print the persistence diagram: each line contains two floats (birth time, death time) for one feature.
- Finally, print a single line with either `CONNECTED`, `CLUSTERED`, or `HAS_HOLES`, based on the analysis of the persistence diagram.
Notes:¶
- Use Rips or Alpha filtration to build the filtered simplicial complex.
- Features with persistence (death - birth) below a threshold can be considered noise.
- You may use libraries such as `gudhi` or `ripser` for computing persistence diagrams.
- For classification: `CONNECTED` if there is one dominant H₀ feature; `CLUSTERED` if there are multiple significant H₀ features; `HAS_HOLES` if there are significant H₁ features.
Task 2: Computing Bottleneck Distance Between Persistence Diagrams¶
Write a Python program that computes the bottleneck distance between two persistence diagrams.
Background:¶
The bottleneck distance between two persistence diagrams is a measure of similarity between topological spaces. It is defined as the infimum over all bijections between the diagrams (including diagonal points) of the maximum distance between matched points. The distance between two points $(b_1, d_1)$ and $(b_2, d_2)$ is typically measured using the $L_\infty$ norm: $\max(|b_1 - b_2|, |d_1 - d_2|)$.
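For very small diagrams, the definition can be checked directly by brute force over all matchings (an illustrative sketch only, since it has factorial complexity; real implementations such as `gudhi`'s built-in routine use efficient matching algorithms):

```python
from itertools import permutations

def _diag(p):
    """Nearest diagonal point to p in the L-infinity metric."""
    m = (p[0] + p[1]) / 2.0
    return (m, m)

def bottleneck_brute(A, B):
    """Bottleneck distance between tiny diagrams A and B, each a list of
    (birth, death) pairs. Each diagram is augmented with the diagonal
    projections of the other's points; matching diagonal to diagonal is free."""
    A_aug = list(A) + [_diag(q) for q in B]
    B_aug = list(B) + [_diag(p) for p in A]
    n = len(A_aug)
    best = float('inf')
    for perm in permutations(range(n)):
        cost = 0.0
        for i, j in enumerate(perm):
            if i >= len(A) and j >= len(B):   # diagonal matched to diagonal
                continue
            p, q = A_aug[i], B_aug[j]
            cost = max(cost, max(abs(p[0] - q[0]), abs(p[1] - q[1])))
        best = min(best, cost)
    return best

# Matching a single feature to the diagonal costs half its persistence
print(bottleneck_brute([(0.0, 1.0)], []))  # 0.5
```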
Input:¶
- The first line contains an integer $k$, the number of points in the first persistence diagram.
- The next $k$ lines each contain two floats: birth time and death time of a feature.
- The next line contains an integer $m$, the number of points in the second persistence diagram.
- The next $m$ lines each contain two floats: birth time and death time of a feature.
Output:¶
- Print a single float: the bottleneck distance between the two persistence diagrams, rounded to 6 decimal places.
Notes:¶
- Points can be matched to the diagonal (birth = death) with cost equal to half the persistence.
- Consider using `scipy.spatial.distance` or similar tools for distance computation.
- Libraries like `gudhi` provide built-in bottleneck distance functions.
Task 3: Topological Analysis of Images Using Persistence Diagrams¶
Write a Python program that performs topological analysis of a grayscale image using persistence diagrams.
Background:¶
Images can be analyzed topologically by treating pixel intensities as a height function. By applying sublevel set filtration (considering pixels below increasing intensity thresholds), we can track how connected components merge and how holes appear and disappear. This reveals the topological structure of the image.
Input:¶
- The first line contains two integers $h$ and $w$: the height and width of the image.
- The next $h$ lines each contain $w$ space-separated integers (0-255): the pixel intensities in row-major order.
Output:¶
- First, print the number of significant features in dimension 0 (connected components).
- Then, print the number of significant features in dimension 1 (holes).
- For each dimension (0, then 1), print the persistence pairs: each line contains two integers (birth intensity, death intensity).
- Finally, print a summary line describing the dominant topological features found.
Notes:¶
- Use sublevel set filtration: consider the cubical complex formed by pixels.
- A feature is "significant" if its persistence exceeds a threshold (e.g., 10% of the intensity range).
- You may use libraries such as `gudhi` (cubical complex) for computing persistence.
- Consider 4-connectivity or 8-connectivity for neighboring pixels.
- The summary should describe features like "SIMPLE" (few features), "COMPLEX" (many features), or "CONTAINS_HOLES" (significant H₁ features).