import sys
from pathlib import Path

import numpy as np
import matplotlib.pyplot as plt

# Make the local fmg package importable regardless of the launch directory.
def _find(name):
    """Return the closest directory at or above the CWD that contains *name*.

    Six candidates are examined: the current working directory followed by
    its first five ancestors. When none of them holds an entry called
    *name*, the current working directory itself is returned.
    """
    here = Path.cwd()
    # ``parents`` runs from the immediate parent up to the filesystem root.
    candidates = [here, *here.parents][:6]
    for folder in candidates:
        if (folder / name).exists():
            return folder
    return here

# Resolve the directory that contains an entry named "fmg" (searched upward
# from the current working directory) and put it first on the import path, so
# that the ``import fmg`` below is resolved against that directory first.
PY_DIR = _find("fmg")
sys.path.insert(0, str(PY_DIR))
# Figures are written to ``<parent of PY_DIR>/paper/figures``; the directory
# (and any missing parents) is created here, without error if it exists.
REPO = PY_DIR.parent
FIG_DIR = REPO / "paper" / "figures"
FIG_DIR.mkdir(parents=True, exist_ok=True)

# These imports must stay below the ``sys.path`` insertion above.
import fmg
from fmg import schedules, mixture, ode, ot_semidiscrete, plotting
from fmg.seeding import set_seed

# ``set_seed()`` is called with no arguments; its return value is kept as SEED
# and is reused later as the ``seed=`` argument of the semi-discrete OT fit.
# NOTE(review): presumably it also seeds NumPy's global RNG, which the later
# ``np.random.randn`` draw depends on for reproducibility — confirm in
# fmg.seeding.
SEED = set_seed()
# Rebinds ``plt`` (already imported from matplotlib.pyplot at the top of the
# file) to whatever ``plotting.setup_matplotlib()`` returns.
# NOTE(review): presumably the configured pyplot module — confirm.
plt = plotting.setup_matplotlib()
print("fmg", fmg.__version__, "| seed", SEED, "| figures ->", FIG_DIR)

fmg 0.1.0 | seed 20260617 | figures -> /Users/eserie/galaxies/flow-matching-gaussians/.worktrees/task-20260617-32e5/paper/figures

# Target mixture: three atoms in the plane, one row per atom.
mus = np.array(
    [
        [2.4, 0.0],
        [-1.4, 2.0],
        [-1.4, -2.0],
    ]
)
# Mixture weights, one per atom (they sum to 1).
w = np.array([0.45, 0.30, 0.25])
# The three interpolation schedules compared throughout.
SCHEDULES = [
    schedules.linear(),
    schedules.variance_preserving(),
    schedules.cosine(),
]

# Run each schedule's own boundary check before using it.
for s in SCHEDULES:
    s.check_boundary()
print("atoms\n", mus, "\nweights", w)
print("schedules:", [s.name for s in SCHEDULES], "— boundary conditions OK")

# Base samples x0 ~ N(0, I): N points in 2-D, drawn from NumPy's global RNG.
N = 600
x0 = np.random.standard_normal((N, 2))

atoms
 [[ 2.4  0. ]
 [-1.4  2. ]
 [-1.4 -2. ]] 
weights [0.45 0.3  0.25]
schedules: ['linear', 'variance-preserving', 'cosine'] — boundary conditions OK

# Evaluate the marginal log-density of the linear schedule on a square grid
# and draw exp(log-density) at three times.
sched = schedules.linear()
gx = np.linspace(-5, 5, 240)
GX, GY = np.meshgrid(gx, gx)
# One (x, y) row per grid node.
grid = np.stack((GX.reshape(-1), GY.reshape(-1)), axis=1)

fig, axes = plt.subplots(1, 3, figsize=(12, 3.8))
for ax, t in zip(axes, [0.15, 0.5, 0.9]):
    logrho = mixture.log_density(grid, t, sched, mus, w)
    logrho = logrho.reshape(GX.shape)
    ax.contourf(GX, GY, np.exp(logrho), levels=30, cmap="magma")
    # Mark the atoms on top of the density.
    ax.scatter(*mus.T, c=plotting.ATOM_COLORS, s=60, edgecolor="white", zorder=5)
    ax.set_title(f"$\\rho_t$  (linear, $t={t}$)")
    ax.set_aspect("equal")
    ax.set_xlim(-5, 5)
    ax.set_ylim(-5, 5)
fig.suptitle("Closed-form marginal: a Gaussian blob splitting into three atoms")
plotting.savefig_pdf(fig, FIG_DIR / "mixture_marginal_density.pdf")
plt.show()

# Sanity check: the posterior weights evaluated at the base samples stay
# finite close to t = 1.
print("gamma finite at t=0.999:", np.isfinite(mixture.posterior_gamma(x0, 0.999, sched, mus, w)).all())

gamma finite at t=0.999: True

# Compare the closed-form velocity with the autodiff one on the first 200
# base samples, for every schedule, over a grid of times inside (0, 1).
ts = np.linspace(0.05, 0.97, 40)
fig, ax = plt.subplots(figsize=(7, 4))
for s in SCHEDULES:
    _, err = mixture.velocity_error_curve(x0[:200], ts, s, mus, w)
    # The tiny offset keeps exact zeros strictly positive on the log axis.
    ax.semilogy(ts, err + 1e-18, label=s.name)
ax.set_xlabel("$t$")
ax.set_ylabel(r"$\max_x\,|v_{\rm closed}-v_{\rm autodiff}|$")
ax.set_title("Closed-form vs. autodiff velocity — agreement degrades only near $t=1$")
ax.legend()
plotting.savefig_pdf(fig, FIG_DIR / "mixture_velocity_crosscheck.pdf")
plt.show()

def vel_fn(x, t, s):
    """Forward to ``mixture.velocity`` with the notebook's atoms and weights.

    ``x``, ``t`` and ``s`` are passed through unchanged; the module-level
    ``mus`` and ``w`` are supplied as the remaining two arguments.
    """
    atoms, weights = mus, w
    return mixture.velocity(x, t, s, atoms, weights)

def integrate_and_colour(s):
    """Integrate the base samples under schedule *s* and label each path.

    The module-level samples ``x0`` are pushed through
    ``ode.integrate_samples`` with ``vel_fn`` as the velocity field and
    ``eps=1e-3``. Every trajectory is then labelled with the index of the
    atom in ``mus`` that is closest (Euclidean distance) to its last point.

    Returns the tuple ``(tt, traj, labels)``, where ``tt`` and ``traj`` are
    the two values returned by ``ode.integrate_samples``.
    """
    tt, traj = ode.integrate_samples(x0, s, vel_fn, eps=1e-3)
    endpoints = traj[-1]
    # Pairwise endpoint-to-atom offsets, one row per sample, one column per atom.
    offsets = endpoints[:, np.newaxis, :] - mus[np.newaxis, :, :]
    distances = np.linalg.norm(offsets, axis=-1)
    labels = np.argmin(distances, axis=1)
    return tt, traj, labels

def plot_traj(ax, traj, labels, title):
    """Draw every trajectory in *traj* on *ax*, coloured by its label.

    ``traj`` is indexed as ``traj[step, sample, coordinate]``; sample ``k``
    is drawn as a thin line in ``plotting.ATOM_COLORS[labels[k]]``. The
    starting points are overlaid as small grey dots and the atoms ``mus``
    as large markers. The axes get *title*, an equal aspect ratio and the
    fixed window [-5, 5] x [-5, 5].
    """
    palette = plotting.ATOM_COLORS
    n_paths = traj.shape[1]
    for k in range(n_paths):
        path = traj[:, k]
        ax.plot(
            path[:, 0],
            path[:, 1],
            lw=0.4,
            alpha=0.35,
            color=palette[labels[k]],
        )
    starts = traj[0]
    ax.scatter(starts[:, 0], starts[:, 1], s=3, c="0.4", alpha=0.5)
    ax.scatter(*mus.T, c=palette, s=90, edgecolor="white", zorder=5)
    ax.set_title(title)
    ax.set_aspect("equal")
    ax.set_xlim(-5, 5)
    ax.set_ylim(-5, 5)

# Integrate once per schedule and keep (tt, traj, labels) under its name.
results = {}
for s in SCHEDULES:
    results[s.name] = integrate_and_colour(s)

# Detailed single-panel figure: linear schedule only.
fig, ax = plt.subplots(figsize=(5.5, 5.5))
_, traj, labels = results["linear"]
plot_traj(ax, traj, labels, "Flow-matching trajectories (linear schedule)")
plotting.savefig_pdf(fig, FIG_DIR / "mixture_trajectories_linear.pdf")
plt.show()

# Three panels, one per schedule, in the order of SCHEDULES.
fig, axes = plt.subplots(1, 3, figsize=(13.5, 4.6))
for ax, s in zip(axes, SCHEDULES):
    _, traj, labels = results[s.name]
    plot_traj(ax, traj, labels, s.name)
fig.suptitle("Same endpoints, different paths — the schedule bends the trajectories")
plotting.savefig_pdf(fig, FIG_DIR / "mixture_trajectories_schedules.pdf")
plt.show()

# Share of trajectories assigned to each atom, per schedule, to be compared
# with the target weights.
frac = {}
for n, r in results.items():
    basin = r[2]  # third entry of each result: per-trajectory atom labels
    frac[n] = np.bincount(basin, minlength=3) / len(basin)
print("empirical basin fractions vs. target weights", np.round(w, 3))
for n, f in frac.items():
    print(f"  {n:20s} {np.round(f, 3)}")

empirical basin fractions vs. target weights [0.45 0.3  0.25]
  linear               [0.428 0.317 0.255]
  variance-preserving  [0.428 0.317 0.255]
  cosine               [0.428 0.317 0.255]

# Fit the semi-discrete OT map onto the same atoms and weights, reusing the
# notebook seed, and report the fit diagnostics.
sdot = ot_semidiscrete.SemiDiscreteOT(mus, w)
sdot = sdot.fit(n_samples=60000, seed=SEED)
print("semi-discrete OT fit residual (max |mass_k - w_k|):", f"{sdot.fit_residual:.2e}")
print("Laguerre potentials psi:", np.round(sdot.psi, 4))

# Cell index of every grid node, reshaped back onto the plotting grid.
cells = sdot.assign(grid)
cells = cells.reshape(GX.shape)
# OT trajectories of the base samples on 60 times in [0, 1], and the cell
# each base sample is assigned to.
ts_ot = np.linspace(0, 1, 60)
ot_traj = sdot.trajectory(x0, ts_ot)          # (T, N, 2) straight lines
ot_labels = sdot.assign(x0)

fig, axes = plt.subplots(1, 2, figsize=(12, 5.6))

# Left panel: shaded Laguerre cells with the OT trajectories on top.
ax = axes[0]
ax.contourf(
    GX,
    GY,
    cells,
    levels=[-0.5, 0.5, 1.5, 2.5],
    colors=[plotting.ATOM_COLORS[k] for k in range(3)],
    alpha=0.18,
)
# Only every second sample is drawn.
for i in range(0, N, 2):
    ax.plot(
        ot_traj[:, i, 0],
        ot_traj[:, i, 1],
        lw=0.4,
        alpha=0.35,
        color=plotting.ATOM_COLORS[ot_labels[i]],
    )
ax.scatter(*mus.T, c=plotting.ATOM_COLORS, s=90, edgecolor="white", zorder=5)
ax.set_title("Optimal transport: straight lines into Laguerre cells")
ax.set_aspect("equal")
ax.set_xlim(-5, 5)
ax.set_ylim(-5, 5)

# Right panel: the linear-schedule flow-matching trajectories, for comparison.
_, traj, labels = results["linear"]
plot_traj(axes[1], traj, labels, "Flow matching (linear): curved, independent coupling")

fig.suptitle("Flow matching $\\neq$ optimal transport (same marginals, different coupling)")
plotting.savefig_pdf(fig, FIG_DIR / "mixture_ot_contrast.pdf")
plt.show()

semi-discrete OT fit residual (max |mass_k - w_k|): 3.72e-03
Laguerre potentials psi: [ 0.     -0.8065 -1.2405]

schedule	$a(t)$	$b(t)$	character
linear	$1-t$	$t$	straight sample paths (rectified flow)
variance-preserving	$\cos\frac{\pi t}{2}$	$\sin\frac{\pi t}{2}$	unit $a^2+b^2$, no mid-path pinch
cosine	$\tfrac12(1+\cos\pi t)$	$\tfrac12(1-\cos\pi t)$	slow start/end, fast middle

Notebook A — Flow Matching to a Three-Dirac Mixture

1. The target, the schedules, and the base samples

2. Closed-form marginal and velocity

3. Cross-check: closed form vs. autodiff of $\log\rho_t$

4. Integrating the flow — trajectories coloured by their atom

5. Contrast with optimal transport (semi-discrete / Laguerre)

6. Takeaways