# !pip install ripser persim scikit-learn scipy matplotlib numpy

import numpy as np
import matplotlib.pyplot as plt
from ripser import ripser
from persim import sliced_wasserstein
from scipy.stats import permutation_test

# Module-level generator with a fixed seed (42). population() below does not
# use it: each cloud there gets its own generator seeded from seed_base.
rng = np.random.default_rng(42)

def population(n_clouds=50, n_points=200, noise=0.05, seed_base=0):
    """Build dimension-1 persistence diagrams for a batch of noisy circles.

    Cloud ``k`` (for ``k`` in ``range(n_clouds)``) is sampled with its own
    generator seeded at ``seed_base + k``: ``n_points`` angles are drawn
    uniformly from [0, 2*pi), mapped to (cos, sin) coordinates, and then
    perturbed by standard-normal noise scaled by ``noise``.

    Returns a list with ``n_clouds`` entries; each entry is the index-1 item
    of the ``'dgms'`` list produced by ``ripser(cloud, maxdim=1)``.
    """
    def h1_diagram(seed):
        gen = np.random.default_rng(seed)
        # Draw order is part of the reproducibility contract:
        # angles first, then the noise field.
        angles = gen.uniform(0, 2*np.pi, n_points)
        cloud = np.stack([np.cos(angles), np.sin(angles)], axis=1)
        cloud += noise * gen.normal(size=cloud.shape)
        result = ripser(cloud, maxdim=1)
        return result['dgms'][1]

    return [h1_diagram(seed_base + k) for k in range(n_clouds)]

# Two samples to compare: A at noise 0.05, B at noise 0.10. The seed bases
# (0 vs 1000) keep the per-cloud seeds of the two populations disjoint.
pop_A = population(seed_base=0, noise=0.05)
pop_B = population(seed_base=1000, noise=0.10)
print('populations built:', *map(len, (pop_A, pop_B)))

# YOUR TURN
# Compute the (100, 100) pairwise distance matrix using persim.sliced_wasserstein.

# YOUR TURN
# Test whether the mean within-A distance differs from the mean between-AB distance.
# Use scipy.stats.permutation_test with n_resamples=1000.

# YOUR TURN
# For noise difference in {0.02, 0.04, 0.06, 0.08, 0.10}, estimate the power
# of the test at alpha=0.05 over 50 replications each.

# Lab 4 — Statistical tests on persistence diagrams

## Setup

## Two populations of 50 noisy circles each

## Exercise 1 — Compute pairwise sliced-Wasserstein distance matrix

## Exercise 2 — Permutation test

## Exercise 3 — Power curve

## Done?