"""Generate a self-contained interactive 'Robot Learning Landscape' page.

Pulls the researched paradigm data straight out of robot_paradigms_app.py so the
visualization stays in sync, then injects it into a static HTML template that
provides: a constellation map, Keynote-style Magic-Move detail panels (View
Transitions API), and a small looping SMIL animation per paradigm.

Run:  .venv_robot_paradigms/bin/python gen_landscape.py
Out:  robot_landscape.html
"""
import json
import html as html_lib
import robot_paradigms_app as app
import my_papers

# ---------------------------------------------------------------------------
# 1. Family display labels (nice names for the 10 hubs)
#    Keys are the family keys iterated from app.FAMILY in build_data(); a
#    family with no entry here is shown under its raw key (FAMILY_LABEL.get(k, k)).
# ---------------------------------------------------------------------------
FAMILY_LABEL = {
    "BC":                "Imitation Learning",
    "Reinforcement":     "Reinforcement Learning",
    "Offline RL":        "Offline RL",
    "Inverse RL":        "Inverse RL (Imitation)",
    "Model-Based":       "World Models",
    "Sequence":          "Sequence Models",
    "Goal-Cond.":        "Goal-Conditioned",
    "Hierarchical":      "Hierarchical",
    "Meta-Learning":     "Meta-Learning",
    "LLM-Orchestration": "LLM / VLM",
}

# ---------------------------------------------------------------------------
# 2. Per-paradigm enrichment authored for a beginner audience:
#    short  = label shown on the map
#    simple = plain-English "what the robot is doing" (high-school level)
#    anim   = which mini-animation archetype to play
#
#    Keyed by paradigm id (matched against p["id"] for p in app.PARADIGMS in
#    build_data()).  A paradigm with no entry here falls back to its own
#    name for `short`, its "intuition" text for `simple`, and the "denoise"
#    animation for `anim`.
# ---------------------------------------------------------------------------
ENRICH = {
    "flow-matching-policy": dict(short="Flow Matching", anim="flow", simple=(
        "Imagine smoothly steering a dot from a random scribble to the exact move an "
        "expert made, following the straightest possible path. The robot learns that "
        "“steering field,” so it can turn noise into a precise action in just a "
        "few steps.")),
    "diffusion-policy": dict(short="Diffusion", anim="denoise", simple=(
        "Start with pure static (random noise) and clean it up step by step until a "
        "smooth, sensible action appears — like sharpening a blurry photo. Because it "
        "imagines many possibilities, it can pick left OR right around an obstacle instead "
        "of averaging into a crash.")),
    "tokenized-bc": dict(short="Tokenized BC", anim="tokens", simple=(
        "Chop each action into little pieces and predict them one-by-one, exactly like a "
        "chatbot predicts the next word. This lets a robot reuse all the machinery of a "
        "language model to act.")),
    "energy-based-bc": dict(short="Energy / Implicit", anim="energy", simple=(
        "Give every possible action a “score,” then roll downhill to the "
        "best-scoring one — like a marble settling into the lowest dip of a hilly "
        "landscape.")),
    "value-based-rl": dict(short="Q-Learning", anim="qlearn", simple=(
        "Try things, keep a running estimate of how good each move turns out, and always "
        "pick the move with the best expected payoff. It learns purely from rewards and "
        "mistakes — no teacher needed.")),
    "policy-gradient-rl": dict(short="Policy Gradient", anim="pgrad", simple=(
        "Do the task many times; nudge the behavior a little toward whatever earned more "
        "reward and away from what earned less. Slowly the robot’s habits get "
        "better.")),
    "off-policy-ac": dict(short="Actor-Critic", anim="actorcritic", simple=(
        "Two parts team up: an “actor” that acts and a “critic” that "
        "grades each action. The critic’s grades teach the actor to act better — "
        "and it can re-use old replayed experience.")),
    "offline-rl": dict(short="Offline RL", anim="offline", simple=(
        "Learn only from a fixed recording of past behavior — no live robot, no new "
        "tries. The trick is to stay close to what’s in the recording so the robot "
        "doesn’t bet on moves it never saw work.")),
    "maxent-irl": dict(short="MaxEnt IRL", anim="rewardmap", simple=(
        "Watch an expert and figure out the hidden “reward” that would explain "
        "why they did what they did — reverse-engineering their goal from their "
        "behavior.")),
    "gail": dict(short="GAIL", anim="adversarial", simple=(
        "Two networks play a game: one tries to act like the expert, the other tries to "
        "spot the fake. As the spotter gets sharper, the imitator is forced to become "
        "indistinguishable from the real expert.")),
    "forward-dynamics-mpc": dict(short="MPC", anim="plan", simple=(
        "Learn a “what happens if…” simulator, imagine several action plans "
        "a few steps ahead, and execute the one that looks best — then re-plan at the "
        "next moment.")),
    "latent-imagination": dict(short="Dreamer", anim="dream", simple=(
        "Build a compact “mental world,” then practice thousands of times inside "
        "that daydream instead of the real world — fast and safe — and carry the "
        "learned skill back to reality.")),
    "generative-video-wm": dict(short="Video WM", anim="videopred", simple=(
        "Predict the future as a short video: given what it sees now, the robot pictures "
        "what will happen next, frame by frame.")),
    "action-conditioned-wm": dict(short="Action-Cond WM", anim="videoaction", simple=(
        "Ask “if I move like this, what will I see?” The robot predicts the "
        "future video that each candidate action would cause, then picks the best one.")),
    "world-action-model": dict(short="World-Action", anim="worldaction", simple=(
        "Imagine the future video of the task AND read off the actions needed to make that "
        "future happen — dreaming the plan and the moves together.")),
    "occupancy-latent-wm": dict(short="Occupancy WM", anim="occupancy", simple=(
        "Instead of a full video, predict a simple map of where stuff will be (occupied vs "
        "free space) so the robot can plan safe motions.")),
    "decision-transformer": dict(short="Decision Transf.", anim="returncond", simple=(
        "Tell the robot the score you want (“get 100 points”) and it writes out "
        "the sequence of actions likely to hit that score — like autocompleting a "
        "winning playthrough.")),
    # Reuses the "denoise" animation archetype also used by diffusion-policy.
    "trajectory-diffusion": dict(short="Traj. Diffusion", anim="denoise", simple=(
        "Sketch a whole path out of noise and clean it up all at once into a smooth plan, "
        "then gently steer that plan toward a goal.")),
    "goal-conditioned": dict(short="Goal + HER", anim="goalrelabel", simple=(
        "Tell the robot where to end up and it aims for that goal. When it misses, it "
        "pretends “wherever I landed” was the goal all along — so even "
        "failures become useful lessons.")),
    "hrl": dict(short="Hierarchical", anim="hierarchy", simple=(
        "A “manager” sets mini-goals (go here, then there) and a “worker” "
        "figures out the small moves to reach each one — splitting a big task into "
        "easy chunks.")),
    "meta-learning": dict(short="Meta-Learning", anim="meta", simple=(
        "Practice on many different tasks so the robot learns HOW to learn — then it "
        "can pick up a brand-new task after just a few tries.")),
    "llm-planner": dict(short="LLM Planner", anim="llmplan", simple=(
        "A language model reads the instruction, breaks it into a step-by-step plan (or "
        "even writes code), and calls ready-made skills to carry it out — no "
        "trial-and-error training.")),
    "vlm-affordance": dict(short="VLM Affordance", anim="affordance", simple=(
        "A vision-language model looks at the scene and marks WHERE and HOW to act (grab "
        "here, push there), turning a picture into a usable plan.")),
}

# ---------------------------------------------------------------------------
# 3. Interconnections between paradigms (the bridges).
#    Each entry is a 4-tuple (a, b, why, kind):
#      a, b = paradigm ids (learned or classical)
#      why  = short human-readable reason for the link
#      kind = "v" or "b" (see below)
# ---------------------------------------------------------------------------
# kind:
#   "v" = variant — same core idea, different flavor (dashed, undirected)
#   "b" = builds-on — arrow a → b means "b builds on / uses a" (a underlies b)
#
# build_data() silently drops any edge whose endpoints are not both known
# paradigm ids, so a typo in an id makes the edge disappear rather than fail.
# The section banners below are only a rough grouping: the per-tuple `kind`
# is what the page uses (a few "b" edges sit under the variants banner and
# one "v" edge sits under the builds-on banner).
EDGES = [
    # ---- mostly variants (same core idea, different flavor) ----
    ("diffusion-policy", "trajectory-diffusion", "same denoising idea (action vs. whole path)", "v"),
    ("diffusion-policy", "flow-matching-policy", "generative action heads", "v"),
    ("flow-matching-policy", "tokenized-bc", "the three VLA action heads", "v"),
    ("diffusion-policy", "tokenized-bc", "the three VLA action heads", "v"),
    ("tokenized-bc", "llm-planner", "reuse the language-model / token stack", "v"),
    ("offline-rl", "decision-transformer", "return-conditioned offline RL (sequence modeling)", "b"),
    ("decision-transformer", "goal-conditioned", "condition on a target", "v"),
    ("decision-transformer", "tokenized-bc", "sequence models of actions", "v"),
    ("offline-rl", "diffusion-policy", "stay close to the data = imitate it", "v"),
    ("gail", "maxent-irl", "recover / use a reward signal", "v"),
    ("latent-imagination", "forward-dynamics-mpc", "plan inside a learned model", "v"),
    ("forward-dynamics-mpc", "occupancy-latent-wm", "a model used for planning", "v"),
    ("generative-video-wm", "action-conditioned-wm", "adds action-controllable prediction", "b"),
    ("action-conditioned-wm", "world-action-model", "actions + video together", "v"),
    ("vlm-affordance", "llm-planner", "language / vision planning, no policy gradient", "v"),
    ("hrl", "goal-conditioned", "sub-goals are just goals", "v"),
    ("hrl", "llm-planner", "high-level decomposition", "v"),
    ("classical-mpc", "forward-dynamics-mpc", "same optimizer — known vs. learned model", "v"),
    # ---- mostly builds-on / enables (arrow a → b: "b builds on a") ----
    ("off-policy-ac", "offline-rl", "many offline methods extend off-policy AC (+ conservatism)", "b"),
    ("policy-gradient-rl", "gail", "GAIL trains its imitator with RL", "b"),
    ("maxent-irl", "value-based-rl", "infer the reward, then run RL on it", "b"),
    ("policy-gradient-rl", "latent-imagination", "trains the policy inside the imagined model", "b"),
    ("diffusion-policy", "world-action-model", "share diffusion/flow generative machinery", "v"),
    ("policy-gradient-rl", "meta-learning", "adapts with a few gradient steps", "b"),
    ("off-policy-ac", "goal-conditioned", "HER rides on off-policy RL", "b"),
    # ---- classical control underlies the learning methods ----
    ("lqr", "value-based-rl", "classical optimal-control precursor to RL", "b"),
    ("pid-control", "off-policy-ac", "residual RL learns on top of a controller", "b"),
    ("motion-planning", "llm-planner", "the LLM calls a classical planner", "b"),
    ("classical-mpc", "vlm-affordance", "VLM cost + a classical trajectory optimizer", "b"),
]

# ---------------------------------------------------------------------------
# 4. Classical / traditional control — NOT in the learning app, added here so
#    the map shows the full robot-control landscape (the non-learning bedrock).
#
#    CLASSICAL_FAMILY carries the same key/label/color/desc fields that
#    build_data() derives for the app's families; build_data() copies it and
#    adds empty "equation" and "relations" fields before appending it.
# ---------------------------------------------------------------------------
CLASSICAL_FAMILY = dict(
    key="Classical", label="Classical Control", color="#64748b",
    desc=("Model-based control & planning with no learning — the engineering "
          "bedrock robots still run on, and what most learned methods sit on top of."),
)
# Hand-authored paradigm records for the "Classical" family.  Every record
# supplies all of the fields build_data() reads with p[...] (id, name, short,
# family, anim, tagline, simple, mapping, math, when, pros, cons, papers), so
# a missing field raises KeyError there.  `math` values are raw strings holding
# LaTeX source.  The ids are the ones referenced from EDGES and LEARN.
CLASSICAL_PARADIGMS = [
    dict(
        id="pid-control", name="PID / Feedback Control", short="PID", family="Classical",
        anim="pid", tagline="Push proportionally to the error — the workhorse of control.",
        simple=("Measure how far you are from the target, and correct in proportion to that "
                "error — plus a bit for accumulated error (I) and how fast it’s changing (D). "
                "No model, no learning, just feedback. It’s the inner loop under almost everything."),
        mapping="error e(t) → control u(t)",
        math=r"u(t)=K_p\,e(t)+K_i\!\int_0^t\! e(\tau)\,d\tau+K_d\,\dot e(t)",
        when="Low-level motor/joint control, and the inner loop beneath higher-level planners.",
        pros=["Dead simple, needs no model", "Ubiquitous and robust", "Easy to tune"],
        cons=["No foresight or constraints", "Struggles with nonlinear / coupled / delayed systems",
              "Gains are hand-tuned"],
        papers=["Ziegler–Nichols tuning (1942)", "classical control theory"],
    ),
    dict(
        id="lqr", name="LQR / Optimal Control", short="LQR", family="Classical",
        anim="lqr", tagline="The provably optimal linear feedback gain.",
        simple=("If your system is roughly linear, you can solve for the single best feedback "
                "gain that minimizes a cost trading off staying on target vs. control effort. "
                "It’s the optimal-control ancestor of value-based RL."),
        mapping="state x → control u = −Kx",
        math=r"u=-Kx,\quad K=R^{-1}B^\top P,\quad A^\top P+PA-PBR^{-1}B^\top P+Q=0",
        when="Stabilization/tracking for systems you can linearize; a baseline and building block (iLQR, LQG).",
        pros=["Provably optimal for linear-quadratic problems", "Closed-form and fast",
              "Foundation for iLQR / LQG / MPC"],
        cons=["Assumes linear dynamics + quadratic cost", "No hard constraints", "Needs a model"],
        papers=["Kalman (1960), optimal control / LQG"],
    ),
    dict(
        id="classical-mpc", name="Model-Predictive Control / Trajectory Optimization",
        short="MPC / TrajOpt", family="Classical", anim="trajopt",
        tagline="Optimize controls over a horizon with a known model; re-plan each step.",
        simple=("Using known physics, optimize a short sequence of future controls to minimize "
                "cost while respecting constraints (limits, obstacles), execute the first one, then "
                "re-optimize at the next step. This is the same machinery learned-model MPC uses — "
                "here the model is hand-derived physics."),
        mapping="model f + cost ℓ → optimal u_{0:H}",
        math=r"\min_{u_{0:H}}\sum_{t=0}^{H}\ell(x_t,u_t)\quad\text{s.t.}\quad x_{t+1}=f(x_t,u_t),\;\;g(x_t,u_t)\le 0",
        when="When you have a decent model and need constraint handling + foresight (legged locomotion, driving, arms).",
        pros=["Handles constraints and foresight", "Uses known physics", "Re-planning adds robustness"],
        cons=["Needs an accurate model", "Online optimization is expensive",
              "Hard for contact-rich / uncertain dynamics"],
        papers=["iLQR (Todorov 2005)", "CHOMP / TrajOpt", "MPC literature"],
    ),
    dict(
        id="motion-planning", name="Motion Planning (Sampling / Search)",
        short="Motion Planning", family="Classical", anim="planning",
        tagline="Search the free space for a collision-free path.",
        simple=("Find a collision-free path from start to goal by sampling random configurations "
                "and connecting them (RRT/PRM) or searching a grid/graph (A*). It’s about geometry "
                "and feasibility, not learning — and it’s often the executor under an LLM planner."),
        mapping="start, goal, obstacles → collision-free path τ",
        math=r"\text{find }\tau: q_{\text{start}}\to q_{\text{goal}}\;\;\text{s.t.}\;\;\tau(s)\in\mathcal{C}_{\text{free}}\;\;\forall s",
        when="Navigation and arm motion through known obstacle fields.",
        pros=["Completeness / optimality guarantees (A*, RRT*)", "No training data needed",
              "Mature and reliable"],
        cons=["Needs a known map / geometry", "Struggles with high-dim contact + dynamics",
              "Replanning cost in clutter"],
        papers=["RRT (LaValle 1998)", "PRM (Kavraki 1996)", "A* (Hart 1968)"],
    ),
]


# ---------------------------------------------------------------------------
# 5. Best "learn more" explainer per branch (verified reachable June 2026).
#    (title, url) — canonical project pages / respected blogs / standard texts.
#
#    Keyed by paradigm id, covering both the app's paradigms and the classical
#    ones.  build_data() turns each pair into {"title": ..., "url": ...} and
#    emits learn=None for any paradigm id that has no entry here.
# ---------------------------------------------------------------------------
LEARN = {
    "flow-matching-policy":  ("π₀ flow-matching VLA — HuggingFace", "https://huggingface.co/blog/pi0"),
    "diffusion-policy":      ("Diffusion Policy — project page", "https://diffusion-policy.cs.columbia.edu/"),
    "tokenized-bc":          ("OpenVLA — project page", "https://openvla.github.io/"),
    "energy-based-bc":       ("Implicit BC — project page", "https://implicitbc.github.io/"),
    "decision-transformer":  ("Decision Transformer — project page", "https://sites.google.com/berkeley.edu/decision-transformer"),
    "trajectory-diffusion":  ("Diffuser: Planning with Diffusion", "https://diffusion-planning.github.io/"),
    "value-based-rl":        ("Deep Q-Learning — HF Deep RL Course", "https://huggingface.co/learn/deep-rl-course/unit3/introduction"),
    "policy-gradient-rl":    ("Policy Gradients & PPO — Arxiv Insights (video)", "https://www.youtube.com/watch?v=5P7I-xPq8u8"),
    "off-policy-ac":         ("DDPG & SAC — Pieter Abbeel (video)", "https://www.youtube.com/watch?v=pg-lKy7JIRk"),
    "offline-rl":            ("Offline RL — BAIR blog", "https://bair.berkeley.edu/blog/2020/12/07/offline/"),
    "maxent-irl":            ("What Is Inverse RL? — The Gradient", "https://thegradient.pub/learning-from-humans-what-is-inverse-reinforcement-learning/"),
    "gail":                  ("GAIL Imitation Learning (video)", "https://www.youtube.com/watch?v=E-lfhLiXiBc"),
    "forward-dynamics-mpc":  ("Model-Based RL + MPC — BAIR", "https://bair.berkeley.edu/blog/2017/11/30/model-based-rl/"),
    "latent-imagination":    ("Dreamer — Danijar Hafner", "https://danijar.com/project/dreamer/"),
    "generative-video-wm":   ("World Models — interactive", "https://worldmodels.github.io/"),
    "action-conditioned-wm": ("V-JEPA 2 World Model — Meta", "https://ai.meta.com/blog/v-jepa-2-world-model-benchmarks/"),
    "world-action-model":    ("Unified Video Action Model", "https://unified-video-action-model.github.io/"),
    "occupancy-latent-wm":   ("Drive-OccWorld — occupancy WM", "https://drive-occworld.github.io/"),
    "goal-conditioned":      ("Hindsight Experience Replay — Two Minute Papers (video)", "https://www.youtube.com/watch?v=Dvd1jQe3pq0"),
    "hrl":                   ("Hierarchical RL — The Gradient", "https://thegradient.pub/the-promise-of-hierarchical-reinforcement-learning/"),
    "meta-learning":         ("Interactive Intro to MAML", "https://interactive-maml.github.io/maml.html"),
    "llm-planner":           ("Code as Policies — project page", "https://code-as-policies.github.io/"),
    "vlm-affordance":        ("VoxPoser — project page", "https://voxposer.github.io/"),
    # ---- classical-control paradigms (ids from CLASSICAL_PARADIGMS) ----
    "pid-control":           ("PID Control — Brian Douglas (video)", "https://www.youtube.com/watch?v=wkfEZmsQqiA"),
    "lqr":                   ("LQR Optimal Control — Brian Douglas (video)", "https://www.youtube.com/watch?v=E_RDCFOlJx4"),
    "classical-mpc":         ("Model Predictive Control — MATLAB (video)", "https://www.youtube.com/watch?v=cEWnixjNdzs"),
    "motion-planning":       ("A* Pathfinding — Red Blob Games (interactive)", "https://www.redblobgames.com/pathfinding/a-star/introduction.html"),
}


def _learn_link(paradigm_id):
    """Return the LEARN entry for ``paradigm_id`` as a title/url dict, or None.

    Shared by the app-derived and classical paradigm records so the lookup is
    done once per paradigm and the fallback lives in one place.
    """
    entry = LEARN.get(paradigm_id)
    if entry is None:
        return None
    return {"title": entry[0], "url": entry[1]}


def build_data():
    """Assemble the data payload that gets injected into the HTML template.

    Merges four sources into one structure:

    * families and paradigms read from ``robot_paradigms_app`` (``app``),
      enriched with FAMILY_LABEL, ENRICH and LEARN;
    * the hand-authored CLASSICAL_FAMILY / CLASSICAL_PARADIGMS;
    * EXTRA_FAMILIES / EXTRA_PARADIGMS / EXTRA_EDGES, module-level names
      defined elsewhere in this module;
    * ``my_papers.MY_PAPERS``.

    Returns:
        dict with four keys:
          ``families``  - list of dicts (key, label, color, desc, equation,
                          relations), in app order, then Classical, then extras;
          ``paradigms`` - list of per-paradigm dicts, in the same source order;
          ``edges``     - list of ``[a, b, why, kind]`` lists, restricted to
                          edges whose two endpoints are known paradigm ids;
          ``mypapers``  - the MY_PAPERS entries whose ``"node"`` is a known
                          paradigm id or family key.

    Raises:
        KeyError: if a paradigm record lacks a required field (for app
            paradigms: id, name, family, tagline, plus "intuition" when ENRICH
            has no "simple" text for it).
    """
    # --- families -----------------------------------------------------------
    families = [
        dict(
            key=k,
            label=FAMILY_LABEL.get(k, k),  # fall back to the raw key
            color=app.FAMILY[k][0],
            desc=app.FAMILY[k][1],
            equation=app.FAMILY_EQUATIONS.get(k, ""),
            relations=[
                dict(name=n, eq=e)
                for (n, e, _note) in app.FAMILY_RELATIONS.get(k, [])
            ],
        )
        for k in app.FAMILY
    ]
    # The classical family has no headline equation or relation list.
    families.append(dict(CLASSICAL_FAMILY, equation="", relations=[]))
    # Keyword arguments win over keys already present on `f`, so any desc /
    # equation / relations an extra family carries is blanked here.
    # NOTE(review): confirm that overriding `desc` is intended.
    families.extend(
        dict(f, desc="", equation="", relations=[]) for f in EXTRA_FAMILIES
    )

    # --- paradigms ----------------------------------------------------------
    paradigms = []
    for p in app.PARADIGMS:
        enrich = ENRICH.get(p["id"], {})
        paradigms.append(dict(
            id=p["id"],
            name=p["name"],
            short=enrich.get("short", p["name"]),
            family=p["family"],
            tagline=p["tagline"],
            # Only touch p["intuition"] when no beginner text was authored, so
            # a paradigm without that field still works if ENRICH covers it.
            simple=enrich["simple"] if "simple" in enrich else p["intuition"],
            anim=enrich.get("anim", "denoise"),
            mapping=p.get("mapping", ""),
            math=p.get("math", ""),
            when=p.get("when", ""),
            pros=p.get("pros", []),
            cons=p.get("cons", []),
            papers=p.get("key_papers", []),
            learn=_learn_link(p["id"]),
        ))
    for p in CLASSICAL_PARADIGMS:
        paradigms.append(dict(
            id=p["id"], name=p["name"], short=p["short"], family=p["family"],
            tagline=p["tagline"], simple=p["simple"], anim=p["anim"],
            mapping=p["mapping"], math=p["math"], when=p["when"],
            pros=p["pros"], cons=p["cons"], papers=p["papers"],
            learn=_learn_link(p["id"]),
        ))
    for p in EXTRA_PARADIGMS:
        # Extra paradigms carry their own (title, url) pair instead of using LEARN.
        paradigms.append(dict(
            id=p["id"], name=p["name"], short=p["short"], family=p["family"], anim=p["anim"],
            tagline=p["tagline"], simple=p["simple"], mapping=p["mapping"], math=p["math"],
            when=p["when"], pros=p["pros"], cons=p["cons"], papers=p["papers"],
            learn={"title": p["learn"][0], "url": p["learn"][1]},
        ))

    # --- edges and personal papers -------------------------------------------
    # Only keep edges whose endpoints exist; the page looks both ids up directly.
    ids = {p["id"] for p in paradigms}
    edges = [
        [a, b, why, kind]
        for (a, b, why, kind) in (EDGES + EXTRA_EDGES)
        if a in ids and b in ids
    ]
    # A paper may be attached either to a paradigm or to a whole family.
    nodeset = ids | {f["key"] for f in families}
    mypapers = [m for m in my_papers.MY_PAPERS if m.get("node") in nodeset]
    return dict(families=families, paradigms=paradigms, edges=edges, mypapers=mypapers)


TEMPLATE = r"""<!doctype html>
<html lang="en">
<head>
<meta charset="utf-8"/>
<meta name="viewport" content="width=device-width, initial-scale=1"/>
<link rel="icon" href="data:,"/>
<title>Robot Learning Landscape</title>
<script>
window.MathJax = { tex: { displayMath: [['\\[','\\]']], inlineMath: [['\\(','\\)']] },
  options: { skipHtmlTags: ['script','noscript','style','textarea','pre'] } };
</script>
<script async src="https://cdn.jsdelivr.net/npm/mathjax@3/es5/tex-mml-chtml.js"></script>
<style>
  :root{ --bg:#070b16; --ink:#e7ecf6; --mut:#93a0bd; --gold:#fbbf24; }
  *{ box-sizing:border-box; }
  html,body{ margin:0; height:100%; background:var(--bg); color:var(--ink);
    font-family:Inter,-apple-system,BlinkMacSystemFont,"Segoe UI",sans-serif; }
  a{ color:#7dd3fc; }

  .topbar{ position:relative; z-index:5; display:flex; align-items:baseline; gap:14px;
    flex-wrap:wrap; padding:16px 22px 6px; }
  .topbar h1{ margin:0; font-size:21px; font-weight:800; letter-spacing:.2px;
    background:linear-gradient(90deg,#a78bfa,#67e8f9); -webkit-background-clip:text;
    background-clip:text; color:transparent; }
  .topbar .sub{ color:var(--mut); font-size:13px; }
  .topbar .sub b{ color:var(--gold); }

  .stage{ position:relative; width:100%; height:calc(100vh - 64px); overflow:hidden; }
  .map{ position:absolute; inset:0; width:100%; height:100%;
    background:
      radial-gradient(1200px 520px at 50% 42%, rgba(124,58,237,.16), transparent 62%),
      radial-gradient(900px 520px at 12% 100%, rgba(20,184,166,.10), transparent 60%),
      radial-gradient(900px 520px at 100% 0%, rgba(56,189,248,.10), transparent 60%);
    transition:filter .45s ease, opacity .45s ease; }
  .stage.detail .map{ filter:blur(3px) brightness(.6); }

  svg.canvas{ width:100%; height:100%; display:block; }
  .edge{ fill:none; stroke:#475569; stroke-width:1.4; opacity:.16; transition:.25s; stroke-dasharray:5 5; }
  .edge.dir{ stroke-dasharray:none; }          /* builds-on = solid (+ arrowhead) */
  .edge.lit{ stroke:var(--gold); opacity:.95; stroke-width:2.3;
    filter:drop-shadow(0 0 6px rgba(251,191,36,.6)); }
  .edge-label{ fill:#fde68a; font-size:9.5px; font-weight:600; opacity:0; pointer-events:none;
    paint-order:stroke; stroke:#070b16; stroke-width:3px; stroke-linejoin:round; transition:opacity .2s; }
  .edge-label.on{ opacity:1; }
  .legend{ position:absolute; left:14px; bottom:14px; z-index:6; display:flex; gap:18px; align-items:center;
    background:rgba(11,19,38,.72); border:1px solid #1e293b; border-radius:10px; padding:7px 13px;
    font-size:11.5px; color:#cbd5e1; backdrop-filter:blur(6px); }
  .legend .li{ display:flex; align-items:center; gap:7px; }
  .stage.detail .legend{ opacity:0; }
  .chip-rel{ font-weight:800; color:var(--cc); font-size:10px; }
  .limb{ fill:none; stroke-linecap:round; transition:.25s; }

  .node{ cursor:pointer; }
  .node .ring{ transform-box:fill-box; transform-origin:center;
    transition:transform .18s cubic-bezier(.2,.7,.3,1), filter .18s, opacity .25s; }
  .node text{ pointer-events:none; font-weight:700; paint-order:stroke;
    stroke:#070b16; stroke-width:3.4px; stroke-linejoin:round; }
  .node.fam text{ font-size:13px; fill:#fff; }
  .node.par text{ font-size:11px; fill:#dbe4f7; }
  .node:hover .ring{ transform:scale(1.18); filter:drop-shadow(0 0 9px currentColor); }
  .node.dim{ opacity:.22; }
  .core-label{ font-size:11px; font-weight:800; letter-spacing:1.4px; fill:#c4b5fd; }

  /* tooltip */
  .tip{ position:absolute; z-index:8; pointer-events:none; max-width:240px; padding:8px 10px;
    background:#0b1326; border:1px solid #334155; border-radius:9px; font-size:12px;
    color:var(--ink); box-shadow:0 10px 28px rgba(0,0,0,.55); opacity:0; transform:translateY(4px);
    transition:opacity .14s, transform .14s; }
  .tip.on{ opacity:1; transform:translateY(0); }
  .tip .t-name{ font-weight:800; }
  .tip .t-fam{ font-size:10.5px; text-transform:uppercase; letter-spacing:.05em; }

  /* detail drawer */
  .drawer{ position:absolute; top:0; right:0; height:100%; width:min(560px,94vw); z-index:10;
    background:linear-gradient(180deg,#0c1326,#0a1020); border-left:1px solid #1e293b;
    box-shadow:-24px 0 60px rgba(0,0,0,.5); transform:translateX(102%);
    transition:transform .42s cubic-bezier(.2,.8,.2,1); overflow-y:auto; padding:22px 24px 60px; }
  .stage.detail .drawer{ transform:translateX(0); }
  .d-close{ position:absolute; top:14px; right:16px; cursor:pointer; border:none; color:var(--mut);
    background:rgba(148,163,184,.1); width:34px; height:34px; border-radius:50%; font-size:18px; }
  .d-close:hover{ color:#fff; background:rgba(148,163,184,.2); }

  .d-head{ display:flex; align-items:center; gap:12px; margin-bottom:4px; }
  .d-av{ width:46px; height:46px; border-radius:50%; flex:0 0 auto;
    box-shadow:0 0 0 4px rgba(255,255,255,.04), 0 0 22px var(--c); background:var(--c); }
  .d-fam{ font-size:11px; font-weight:800; text-transform:uppercase; letter-spacing:.06em; color:var(--c); }
  .d-name{ font-size:21px; font-weight:800; margin:1px 0 0; line-height:1.15; }
  .d-tag{ color:var(--mut); font-size:13px; margin:10px 0 0; }
  .learn-link{ display:inline-flex; align-items:center; gap:7px; margin-top:12px; text-decoration:none;
    font-size:12.5px; font-weight:700; color:var(--ink); border:1px solid var(--c); border-radius:999px;
    padding:6px 13px; background:color-mix(in srgb, var(--c) 16%, transparent); transition:.16s; }
  .learn-link:hover{ background:color-mix(in srgb, var(--c) 32%, transparent); transform:translateY(-1px); }
  .learn-link .arrow{ color:var(--c); }

  .sec-l{ font-size:11px; font-weight:800; letter-spacing:.07em; text-transform:uppercase;
    color:#8aa0c6; margin:20px 0 7px; }
  .d-simple{ font-size:14.5px; line-height:1.55; }
  .myread{ display:flex; flex-direction:column; gap:6px; }
  .mp{ font-size:12.5px; border-left:2px solid var(--gold); padding:3px 0 3px 9px; color:#e7ecf6; }
  .mp a{ color:#fde68a; text-decoration:none; font-weight:600; }
  .mp a:hover{ text-decoration:underline; }
  .mp small{ display:block; color:var(--mut); font-size:11px; margin-top:1px; }
  .pbadge{ stroke:#070b16; stroke-width:1.5; }

  .anim-box{ margin-top:14px; border:1px solid #1e293b; border-radius:13px; padding:10px;
    background:radial-gradient(120% 120% at 50% 0%, rgba(124,58,237,.10), #070d1c);
    position:relative; }
  .anim-box .replay{ position:absolute; top:8px; right:10px; font-size:11px; color:var(--mut);
    background:rgba(148,163,184,.1); border:none; border-radius:7px; padding:3px 8px; cursor:pointer; }
  .anim-box .replay:hover{ color:#fff; }
  .anim-box svg{ width:100%; height:auto; display:block; }
  .anim-cap{ text-align:center; color:var(--mut); font-size:11.5px; margin-top:4px; }

  .math-toggle{ margin-top:16px; }
  .math-toggle summary{ cursor:pointer; list-style:none; font-size:13px; font-weight:700;
    color:#a5b4fc; display:inline-flex; align-items:center; gap:7px; user-select:none; }
  .math-toggle summary::-webkit-details-marker{ display:none; }
  .math-toggle summary::before{ content:"\25B8"; transition:.2s; }
  .math-toggle[open] summary::before{ transform:rotate(90deg); }
  .map-line{ font-family:ui-monospace,SFMono-Regular,Menlo,monospace; font-size:12px; color:#7dd3fc;
    background:rgba(56,189,248,.06); border:1px solid #1e3a5f; border-radius:8px; padding:8px 10px;
    margin:10px 0; overflow-x:auto; }
  .math-disp{ overflow-x:auto; font-size:13px; }
  .eq-l{ font-size:10.5px; font-weight:800; letter-spacing:.06em; text-transform:uppercase;
    color:#7c8db5; margin:14px 0 4px; }
  .rel-eq{ border-left:2px solid #27406b; padding:2px 0 2px 10px; margin:8px 0; }
  .rel-eq-name{ font-size:11.5px; font-weight:700; color:#cbd5e1; margin-bottom:2px; }
  .rel-eq .math-disp{ font-size:12px; opacity:.92; }

  .pc{ display:grid; grid-template-columns:1fr 1fr; gap:10px; margin-top:6px; }
  .pc ul{ margin:6px 0 0; padding-left:16px; font-size:12.5px; line-height:1.5; }
  .pc .pros b{ color:#34d399; } .pc .cons b{ color:#fb7185; }
  .when{ font-size:13px; line-height:1.5; background:rgba(124,58,237,.08);
    border:1px solid #312e81; border-radius:9px; padding:10px 12px; }
  .papers{ font-size:11.5px; color:var(--mut); line-height:1.7; }

  .chips{ display:flex; flex-wrap:wrap; gap:8px; margin-top:8px; }
  .chip{ cursor:pointer; border:1px solid var(--cc); border-radius:999px; padding:5px 11px;
    font-size:12px; color:#e7ecf6; background:color-mix(in srgb, var(--cc) 14%, transparent);
    transition:.16s; }
  .chip:hover{ background:color-mix(in srgb, var(--cc) 32%, transparent); transform:translateY(-1px); }
  .chip small{ display:block; color:var(--mut); font-size:10px; }

  ::view-transition-group(morph){ animation-duration:.5s; }
</style>
</head>
<body>
  <div class="topbar">
    <h1>🤖 Robot Learning Landscape</h1>
    <span class="sub" id="meta"></span>
    <span class="sub">— click any star to see <b>what it does</b>.</span>
  </div>
  <div class="stage" id="stage">
    <div class="map" id="map"><svg class="canvas" id="svg" preserveAspectRatio="xMidYMid meet"></svg></div>
    <div class="tip" id="tip"></div>
    <div class="legend">
      <div class="li"><svg width="34" height="10" viewBox="0 0 34 10"><line x1="0" y1="5" x2="34" y2="5" stroke="#94a3b8" stroke-width="2" stroke-dasharray="5 4"/></svg> variant</div>
      <div class="li"><svg width="34" height="10" viewBox="0 0 34 10"><line x1="0" y1="5" x2="27" y2="5" stroke="#94a3b8" stroke-width="2"/><path d="M27,1 L34,5 L27,9 z" fill="#94a3b8"/></svg> builds on</div>
    </div>
    <aside class="drawer" id="drawer" aria-live="polite"></aside>
  </div>

<script>
const D = __DATA_JSON__;
const byId={}; D.paradigms.forEach(p=>byId[p.id]=p);
const famByKey={}; D.families.forEach(f=>famByKey[f.key]=f);
document.getElementById('meta').textContent =
  D.families.length + ' families · ' + D.paradigms.length + ' paradigms · ' + D.edges.length + ' links';

/* ---------- layout ---------- */
// Canvas is W x H with the core at (cx, cy); SX stretches x so the rings become ellipses.
const W=1280, H=880, cx=W/2, cy=H/2, SX=1.30;
const N=D.families.length;
// Family hubs: evenly spaced around the core, first hub straight up (-90 degrees).
D.families.forEach((fam,idx)=>{
  const theta=(-90 + idx*360/N) * Math.PI/180;
  fam.ang=theta;
  fam.x=cx+Math.cos(theta)*250*SX;
  fam.y=cy+Math.sin(theta)*250;
  fam.kids=D.paradigms.filter(p=>p.family===fam.key);
});
// Paradigms: fanned symmetrically around their hub's angle on a staggered outer ring.
for(const fam of D.families){
  const count=fam.kids.length;
  const step=Math.min(0.13, 0.46/Math.max(count-1,1));   // keep a family's fan inside its 36° wedge
  fam.kids.forEach((par,j)=>{
    const extra = count>=5 ? Math.floor(j/2)*12 : 0;
    const radius=352 + (j%2)*50 + extra;  // stagger radius so dense families don't pile up
    const theta=fam.ang + (j-(count-1)/2)*step;
    par.ang=theta;
    par.x=cx+Math.cos(theta)*radius*SX;
    par.y=cy+Math.sin(theta)*radius;
  });
}
// Return the Set of paradigm ids that share an edge with `id` (in either direction).
function adj(id){
  const out=new Set();
  for(const edge of D.edges){
    const from=edge[0], to=edge[1];
    if(from===id) out.add(to);
    if(to===id) out.add(from);
  }
  return out;
}

/* ---------- render the map ---------- */
const svg=document.getElementById('svg');
// Logical drawing area for the layout coordinates; the element's preserveAspectRatio scales it to fit.
svg.setAttribute('viewBox', [0,0,W,H].join(' '));
// SVG path data for a quadratic Bezier from (x1,y1) to (x2,y2). The control point is
// the midpoint pushed sideways along the segment normal by 14% of the segment length.
function curve(x1,y1,x2,y2){
  const bend=0.14;
  const midX=(x1+x2)/2, midY=(y1+y2)/2;
  const spanX=x2-x1, spanY=y2-y1;
  const normX=-spanY, normY=spanX;
  const ctrlX=midX+normX*bend;
  const ctrlY=midY+normY*bend;
  return 'M'+x1+','+y1+' Q'+ctrlX+','+ctrlY+' '+x2+','+y2;
}

// Paint the constellation: build one SVG markup string and assign it to the canvas in a
// single innerHTML write. Back-to-front order: limbs, cross-link bridges, core, family
// hubs, paradigm stars, then bridge labels on top.
// Records that point at an unknown paradigm or family are skipped (with a console
// warning) instead of throwing, so one bad link cannot leave the whole map blank.
function renderMap(){
  let s='<defs><marker id="arrow" viewBox="0 0 10 10" refX="9" refY="5" markerWidth="7" markerHeight="7" '+
    'orient="auto-start-reverse"><path d="M0,0 L10,5 L0,10 z" fill="context-stroke"/></marker></defs>';
  // limbs: core -> family
  D.families.forEach(f=>{ s+='<path class="limb" d="M'+cx+','+cy+' L'+f.x+','+f.y+
    '" stroke="'+f.color+'" stroke-width="2.4" opacity="0.5"/>'; });
  // limbs: family -> paradigm
  D.families.forEach(f=>f.kids.forEach(p=>{ s+='<path class="limb" d="M'+f.x+','+f.y+' L'+p.x+','+p.y+
    '" stroke="'+f.color+'" stroke-width="1.6" opacity="0.4"/>'; }));
  // a paradigm is drawable only if it exists and its family is known
  // (the layout pass assigns coordinates per family)
  const placed=p=>!!(p && famByKey[p.family]);
  // bridges (cross-links): dashed = variant, solid arrow = builds-on. Labels drawn last (on top).
  let edgeLabels='';
  D.edges.forEach(([a,b,why,kind])=>{ const pa=byId[a], pb=byId[b];
    if(!placed(pa) || !placed(pb)){ console.warn('renderMap: skipping edge with unknown endpoint', a, b); return; }
    const dir = kind==='b';
    s+='<path class="edge'+(dir?' dir':'')+'" data-edge="'+a+'|'+b+'" d="'+curve(pa.x,pa.y,pb.x,pb.y)+'"'+
      (dir?' marker-end="url(#arrow)"':'')+'/>';
    // label sits half as far off the chord as the curve's control point (0.07 vs 0.14)
    const mx=(pa.x+pb.x)/2, my=(pa.y+pb.y)/2, nx=-(pb.y-pa.y), ny=(pb.x-pa.x);
    const lx=mx+nx*0.07, ly=my+ny*0.07;
    edgeLabels+='<text class="edge-label" data-edge="'+a+'|'+b+'" x="'+lx.toFixed(1)+'" y="'+ly.toFixed(1)+
      '" text-anchor="middle">'+esc(why)+'</text>';
  });
  // core
  s+='<g class="node core"><circle cx="'+cx+'" cy="'+cy+'" r="44" fill="#0b1226" stroke="#8b5cf6" '+
     'stroke-width="2.5" style="filter:drop-shadow(0 0 26px rgba(124,58,237,.6))"/>'+
     '<text x="'+cx+'" y="'+(cy-4)+'" text-anchor="middle" style="font-size:22px;stroke:none">🤖</text>'+
     '<text class="core-label" x="'+cx+'" y="'+(cy+15)+'" text-anchor="middle" style="stroke:none">POLICY</text></g>';
  // family hubs
  D.families.forEach(f=>{ s+='<g class="node fam" data-node="fam:'+f.key+'" style="color:'+f.color+'">'+
    '<circle class="ring" cx="'+f.x+'" cy="'+f.y+'" r="13" fill="'+f.color+'" '+
    'style="filter:drop-shadow(0 0 10px '+f.color+')"/>'+
    '<text x="'+f.x+'" y="'+(f.y - 20)+'" text-anchor="middle">'+esc(f.label)+'</text></g>'; });
  // paradigm stars — labels fanned radially outward so dense clusters don't overlap
  D.paradigms.forEach(p=>{ const f=famByKey[p.family];
    if(!f){ console.warn('renderMap: skipping paradigm with unknown family', p.id, p.family); return; }
    const co=Math.cos(p.ang), si=Math.sin(p.ang);
    let lx=p.x+co*15, ly=p.y+si*15+4;
    ly=Math.max(14, Math.min(H-6, ly));   // keep the label inside the canvas vertically
    // anchor the text on the side facing away from the core
    const anc = co>0.35 ? 'start' : (co<-0.35 ? 'end' : 'middle');
    s+='<g class="node par" data-node="'+p.id+'" style="color:'+f.color+'">'+
      '<circle class="ring" cx="'+p.x+'" cy="'+p.y+'" r="8" fill="#0b1326" stroke="'+f.color+
      '" stroke-width="2.5"/>'+
      '<circle cx="'+p.x+'" cy="'+p.y+'" r="3" fill="'+f.color+'"/>'+
      '<text x="'+lx+'" y="'+ly+'" text-anchor="'+anc+'">'+esc(p.short)+'</text></g>'; });
  s+=edgeLabels;   // labels on top so lit ones stay readable
  svg.innerHTML=s;
}
// HTML-escape a value before it is concatenated into markup.
// Falsy input yields ''; other non-string values are stringified instead of throwing.
// Double quotes are escaped too, so the result is also safe inside a double-quoted
// attribute value (it renders unchanged in text content).
function esc(t){
  const s = t ? String(t) : '';
  return s.replace(/&/g,'&amp;').replace(/</g,'&lt;').replace(/>/g,'&gt;').replace(/"/g,'&quot;');
}

/* ---------- hover behaviour ---------- */
// tip: the floating tooltip element; stage: the container that carries the 'detail' state class.
const tip=document.getElementById('tip'), stage=document.getElementById('stage');
// Spotlight one paradigm: dim every paradigm that is neither `id` nor a direct
// neighbour (family hubs never dim), and light the edges and edge labels touching it.
function highlight(id){
  const keep=adj(id);
  keep.add(id);
  for(const g of svg.querySelectorAll('.node.par,.node.fam')){
    const key=g.getAttribute('data-node');
    const visible = keep.has(key) || key.startsWith('fam:');
    g.classList.toggle('dim', !visible);
  }
  // data-edge holds the two endpoint ids joined by '|'
  const touches=el=>{
    const ends=el.getAttribute('data-edge').split('|');
    return ends[0]===id || ends[1]===id;
  };
  for(const edge of svg.querySelectorAll('.edge')){
    edge.classList.toggle('lit', touches(edge));
  }
  for(const label of svg.querySelectorAll('.edge-label')){
    label.classList.toggle('on', touches(label));
  }
}
// Undo highlight(): strip the dim / lit / on state classes from the map.
function clearHL(){
  [['.dim','dim'], ['.edge.lit','lit'], ['.edge-label.on','on']].forEach(pair=>{
    svg.querySelectorAll(pair[0]).forEach(el=>el.classList.remove(pair[1]));
  });
}

// Hovering a paradigm star: spotlight its neighbourhood and fill + show the tooltip.
svg.addEventListener('mouseover', evt=>{
  const star=evt.target.closest('.node.par');
  const par=star && byId[star.getAttribute('data-node')];
  if(!par) return;
  const fam=famByKey[par.family];
  highlight(par.id);
  tip.innerHTML=[
    '<div class="t-fam" style="color:'+fam.color+'">'+esc(fam.label)+'</div>',
    '<div class="t-name">'+esc(par.name)+'</div>',
    '<div style="color:var(--mut);margin-top:3px">'+esc(par.tagline)+'</div>'
  ].join('');
  tip.classList.add('on');
});
// Keep the tooltip 14px below-right of the cursor (in stage coordinates), capped so it
// stays at least 10px inside the stage's right and bottom edges.
svg.addEventListener('mousemove', evt=>{
  const box=stage.getBoundingClientRect();
  const maxLeft=box.width-tip.offsetWidth-10;
  const maxTop=box.height-tip.offsetHeight-10;
  const left=Math.min(evt.clientX-box.left+14, maxLeft);
  const top=Math.min(evt.clientY-box.top+14, maxTop);
  tip.style.left=left+'px';
  tip.style.top=top+'px';
});
// Leaving a paradigm star hides the tooltip. With no panel open the highlight is
// cleared; while a detail panel is open the spotlight is handed back to the open
// paradigm, so hovering a different star does not leave the map lit for the wrong node.
svg.addEventListener('mouseout', e=>{
  const g=e.target.closest('.node.par'); if(!g) return;
  // moving between children of the same star (ring -> label) is not a real exit
  if(e.relatedTarget && g.contains(e.relatedTarget)) return;
  tip.classList.remove('on');
  if(!stage.classList.contains('detail')) clearHL();
  else if(current) highlight(current);
});

/* ---------- click -> Magic Move detail ---------- */
const drawer=document.getElementById('drawer');
let current=null;   // id of the paradigm whose detail panel is open, or null
svg.addEventListener('click', evt=>{
  const star=evt.target.closest('.node.par');
  if(star){
    openDetail(star.getAttribute('data-node'));
    return;
  }
  // click empty space = close
  if(stage.classList.contains('detail')) closeDetail();
});

// Synchronous part of opening a panel: remember the id, paint the drawer, switch the
// stage into detail mode and spotlight the node. Unknown ids are ignored.
function showDetail(id){
  const par=byId[id];
  if(par){
    current=id;
    renderDetail(par);
    stage.classList.add('detail');
    highlight(id);
  }
}

// Open the detail panel for paradigm `id`. When document.startViewTransition exists and
// the node's ring is found, the ring is morphed into the drawer avatar; otherwise the
// panel is shown immediately. Unknown ids are ignored.
function openDetail(id){
  if(!byId[id]) return;
  tip.classList.remove('on');
  // clear any stale morph name (e.g. the previous detail avatar) so only ONE element owns it
  drawer.querySelectorAll('[style*="view-transition-name"]').forEach(el=>el.style.viewTransitionName='');
  const node=svg.querySelector('[data-node="'+id+'"] .ring');
  if(document.startViewTransition && node){
    // "before" state: the map ring carries the shared name
    node.style.viewTransitionName='morph';
    let vt;
    // "after" state: the ring gives the name up and showDetail() paints the drawer,
    // whose avatar is rendered with view-transition-name:morph
    try{ vt=document.startViewTransition(()=>{ node.style.viewTransitionName=''; showDetail(id); }); }
    // startViewTransition threw synchronously: fall back to opening without a transition
    catch(_){ node.style.viewTransitionName=''; showDetail(id); return; }
    // whether the transition finished or was rejected, make sure the ring is left untagged
    vt.finished.catch(()=>{}).finally(()=>{ node.style.viewTransitionName=''; });
  } else { showDetail(id); }
}

// Close the detail panel, using a view transition back to the map ring when
// document.startViewTransition exists and the ring of the open paradigm is found.
function closeDetail(){
  const id=current;
  const node=id ? svg.querySelector('[data-node="'+id+'"] .ring') : null;
  // shared teardown: leave detail mode, forget the open id, drop all highlighting
  const finish=()=>{ stage.classList.remove('detail'); current=null; clearHL(); };
  if(document.startViewTransition && node){
    let vt;
    // "after" state: the drawer is emptied and the ring takes over the shared name
    try{ vt=document.startViewTransition(()=>{ drawer.innerHTML=''; finish(); node.style.viewTransitionName='morph'; }); }
    // startViewTransition threw synchronously: close without a transition
    catch(_){ drawer.innerHTML=''; finish(); return; }
    // whether the transition finished or was rejected, release the name from the ring
    vt.finished.catch(()=>{}).finally(()=>{ node.style.viewTransitionName=''; });
  } else { drawer.innerHTML=''; finish(); }
}

// Paint the detail drawer for paradigm `p` and wire up its controls: close button,
// animation replay, Algorithm Lab button, related-paradigm chips, and MathJax typesetting.
// Values placed inside attributes (link hrefs, chip targets) are attribute-escaped, and
// edges whose other endpoint is unknown are skipped instead of throwing.
function renderDetail(p){
  const f=famByKey[p.family];
  // esc() plus double-quote escaping, for values placed inside double-quoted attributes
  const attr=function(v){ return esc(v).replace(/"/g,'&quot;'); };
  const pros=(p.pros||[]).map(x=>'<li>'+esc(x)+'</li>').join('');
  const cons=(p.cons||[]).map(x=>'<li>'+esc(x)+'</li>').join('');
  const papers=(p.papers||[]).map(esc).join(' · ');
  // one chip per edge touching this paradigm, tinted with the other endpoint's family colour
  const links=D.edges.filter(e=>e[0]===p.id||e[1]===p.id).map(e=>{
    const a=e[0], b=e[1], why=e[2], kind=e[3];
    const oid=a===p.id?b:a; const o=byId[oid]; const of=o?famByKey[o.family]:null;
    if(!o || !of) return '';   // dangling edge: nothing to link to
    // kind 'b' is directional (a -> b); anything else is an undirected variant link
    const tag = kind==='b' ? (a===p.id ? '↑ enables' : '↳ builds on') : '≈ variant';
    return '<div class="chip" style="--cc:'+of.color+'" data-go="'+attr(oid)+'">'+
      '<span class="chip-rel">'+tag+'</span> '+esc(o.short)+'<small>'+esc(why)+'</small></div>';
  }).join('');
  // related equations: sibling paradigms of the same family that have math, then the family's own relations
  const relList=[];
  D.paradigms.forEach(function(q){ if(q.family===p.family && q.id!==p.id && q.math) relList.push({n:(q.short||q.name), e:q.math}); });
  (f.relations||[]).forEach(function(r){ if(r.eq) relList.push({n:r.name, e:r.eq}); });
  // NOTE(review): equations are inserted unescaped between display-math delimiters;
  // this assumes authored LaTeX with no HTML-significant markup — confirm against the data source.
  let relHtml='';
  if(f.equation){ relHtml += '<div class="eq-l">Family objective</div><div class="math-disp">\\['+f.equation+'\\]</div>'; }
  if(relList.length){ relHtml += '<div class="eq-l">Related equations in this family</div>'+
    relList.map(function(it){ return '<div class="rel-eq"><div class="rel-eq-name">'+esc(it.n)+'</div><div class="math-disp">\\['+it.e+'\\]</div></div>'; }).join(''); }
  drawer.style.setProperty('--c', f.color);
  drawer.innerHTML =
    '<button class="d-close" title="Close (Esc)">×</button>'+
    '<div class="d-head"><div class="d-av" style="--c:'+f.color+';view-transition-name:morph"></div>'+
      '<div><div class="d-fam" style="--c:'+f.color+'">'+esc(f.label)+'</div>'+
      '<div class="d-name">'+esc(p.name)+'</div></div></div>'+
    '<div class="d-tag">'+esc(p.tagline)+'</div>'+
    (p.learn ? '<div><a class="learn-link" href="'+attr(p.learn.url)+'" target="_blank" rel="noopener noreferrer">📖 Learn: '+esc(p.learn.title)+' <span class="arrow">↗</span></a></div>' : '')+
    '<div><button class="learn-link" style="cursor:pointer" data-lab="'+esc(p.id)+'">🧪 Open in Algorithm Lab <span class="arrow">↗</span></button></div>'+
    '<div class="sec-l">What the robot is doing</div>'+
    '<div class="d-simple">'+esc(p.simple)+'</div>'+
    '<div class="anim-box"><button class="replay" title="Replay">↻ replay</button>'+
      '<div class="anim-host"></div></div>'+
    '<div class="anim-cap">'+esc(ANIM_CAP[p.anim]||'')+'</div>'+
    '<details class="math-toggle"><summary>Show the math &amp; related equations</summary>'+
      (p.mapping?'<div class="map-line">'+esc(p.mapping)+'</div>':'')+
      '<div class="eq-l">This method</div><div class="math-disp">\\['+ (p.math||'') +'\\]</div>'+
      relHtml+'</details>'+
    '<div class="sec-l">When you’d reach for it</div><div class="when">'+esc(p.when)+'</div>'+
    '<div class="pc"><div class="pros"><b>Strengths</b><ul>'+pros+'</ul></div>'+
      '<div class="cons"><b>Trade-offs</b><ul>'+cons+'</ul></div></div>'+
    (links?'<div class="sec-l">Connects to</div><div class="chips">'+links+'</div>':'')+
    (papers?'<div class="sec-l">Key work</div><div class="papers">'+papers+'</div>':'')+
    // personal reading list entries attached to this paradigm or to its family
    (function(){ const mine=(D.mypapers||[]).filter(function(m){return m.node===p.id||m.node===p.family;});
      if(!mine.length) return '';
      return '<div class="sec-l">📌 My reading</div><div class="myread">'+mine.map(function(m){
        return '<div class="mp">'+(m.url?'<a href="'+attr(m.url)+'" target="_blank" rel="noopener noreferrer">'+esc(m.title)+' ↗</a>':esc(m.title))+
          (m.note?'<small>'+esc(m.note)+'</small>':'')+'</div>'; }).join('')+'</div>'; })();

  const host=drawer.querySelector('.anim-host');
  playAnim(host, p.anim, f.color);
  drawer.querySelector('.d-close').onclick=closeDetail;
  drawer.querySelector('.replay').onclick=()=>playAnim(host, p.anim, f.color);
  const labBtn=drawer.querySelector('[data-lab]');
  // best-effort message to an embedding page; failures are deliberately ignored
  if(labBtn) labBtn.onclick=function(){
    try{ window.parent.postMessage({type:'openAlgorithmLab', id:p.id}, '*'); }
    catch(_){}
  };
  drawer.querySelectorAll('.chip').forEach(c=>c.onclick=()=>openDetail(c.getAttribute('data-go')));
  const mt=drawer.querySelector('.math-toggle');
  // typeset only when MathJax is loaded; run once now and again each time the math section is opened
  const typeset=function(){ if(window.MathJax && MathJax.typesetPromise) MathJax.typesetPromise([...drawer.querySelectorAll('.math-disp')]).catch(function(){}); };
  if(mt) mt.addEventListener('toggle', function(){ if(mt.open) typeset(); });
  typeset();
}
// Esc closes the detail panel when one is open.
document.addEventListener('keydown', evt=>{
  if(evt.key!=='Escape') return;
  if(stage.classList.contains('detail')) closeDetail();
});

/* ---------- mini animations (SMIL, loop forever) ---------- */
// (Re)start the animation named `key` inside `host`, tinted with colour `c`.
// Unknown keys fall back to the denoise animation.
function playAnim(host, key, c){
  const build=ANIM[key]||ANIM.denoise;
  host.innerHTML='';                       // remove old
  void host.offsetWidth;                   // reflow so SMIL restarts
  const markup=build(c);
  host.innerHTML='<svg viewBox="0 0 280 150">'+markup+'</svg>';
}
// Deterministic pseudo-random value in [0,1): the fractional part of sin(seed)*10000.
function rnd(seed){
  const scaled=Math.sin(seed)*10000;
  return scaled-Math.floor(scaled);
}

// One-line caption shown under the animation box in the detail drawer, keyed by a
// paradigm's `anim` name. A name with no entry here renders an empty caption.
const ANIM_CAP = {
  denoise:"Random noise is cleaned up into a smooth action.",
  flow:"A steering field flows noise straight into the action.",
  tokens:"Action pieces are predicted one at a time, like words.",
  energy:"The action rolls downhill to the lowest-energy (best) spot.",
  qlearn:"Values back up from the reward; act greedily toward them.",
  pgrad:"The action distribution shifts toward higher reward.",
  actorcritic:"The critic grades the actor; the actor improves.",
  offline:"Learn from a fixed log — no live robot.",
  rewardmap:"Demos reveal the hidden reward map.",
  adversarial:"Imitator vs. spotter — until the fake looks real.",
  plan:"Imagine a few futures, execute one step, slide the horizon, re-plan.",
  dream:"Practice inside an imagined world.",
  videopred:"Predict the future, frame by frame.",
  videoaction:"Each candidate action predicts a different future.",
  worldaction:"Imagine the future video AND the actions that cause it.",
  occupancy:"Predict which cells will be occupied vs. free; thread a safe path.",
  returncond:"Aim for a target score; generate actions to hit it.",
  goalrelabel:"Missed the goal? Call where you landed the goal.",
  hierarchy:"A manager sets sub-goals; a worker reaches them.",
  meta:"Learn many tasks, then adapt to a new one fast.",
  llmplan:"Language model writes the plan; skills execute it.",
  affordance:"Vision marks where and how to act.",
  pid:"Correct in proportion to the error until it hits the target.",
  lqr:"Optimal feedback drives the state smoothly to zero.",
  trajopt:"Optimize a path around constraints; slide the horizon, re-plan.",
  planning:"Grow a search tree through free space to find a path."
};

const ANIM = {
  denoise(c){
    const tgt=[[24,112],[64,64],[108,44],[150,48],[192,82],[228,66],[258,50]];
    let dots=''; tgt.forEach((t,i)=>{ const sx=20+rnd(i+1)*240, sy=18+rnd(i+9)*116;
      const kt='0;0.15;0.55;0.85;1';
      dots+='<circle r="4.2" fill="'+c+'">'+
        '<animate attributeName="cx" values="'+sx+';'+sx+';'+t[0]+';'+t[0]+';'+sx+'" keyTimes="'+kt+'" dur="3.2s" repeatCount="indefinite"/>'+
        '<animate attributeName="cy" values="'+sy+';'+sy+';'+t[1]+';'+t[1]+';'+sy+'" keyTimes="'+kt+'" dur="3.2s" repeatCount="indefinite"/>'+
        '<animate attributeName="opacity" values="0.3;0.55;1;1;0.3" keyTimes="'+kt+'" dur="3.2s" repeatCount="indefinite"/></circle>'; });
    const path='M24,112 C70,40 150,30 192,82 S250,60 258,50';
    return '<path d="'+path+'" fill="none" stroke="'+c+'" stroke-width="3" stroke-linecap="round" opacity="0">'+
      '<animate attributeName="opacity" values="0;0;0.85;0.85;0" keyTimes="0;0.5;0.6;0.85;1" dur="3.2s" repeatCount="indefinite"/></path>'+dots;
  },
  flow(c){
    // a learned velocity FIELD, integrated in a FEW straight steps (vs diffusion's many curvy ones)
    let s='';
    for(let r=0;r<4;r++)for(let q=0;q<7;q++){ const x=24+q*36,y=34+r*26;
      s+='<line x1="'+x+'" y1="'+y+'" x2="'+(x+11)+'" y2="'+(y-4)+'" stroke="'+c+'" stroke-width="1" opacity="0.22"/><path d="M'+(x+11)+','+(y-4)+' l-3,-1 l1,3 z" fill="'+c+'" opacity="0.22"/>'; }
    s+='<text x="12" y="120" font-size="9" fill="'+c+'">noise</text><text x="232" y="40" font-size="9" fill="'+c+'">action</text>';
    s+='<line x1="28" y1="116" x2="252" y2="46" stroke="'+c+'" stroke-width="1.5" stroke-dasharray="2 5" opacity="0.5"/>';
    const xs='28;84;140;196;252;28', ys='116;98;81;63;46;116';
    s+='<circle r="5" fill="'+c+'" style="filter:drop-shadow(0 0 6px '+c+')"><animate attributeName="cx" values="'+xs+'" dur="2.8s" calcMode="discrete" repeatCount="indefinite"/><animate attributeName="cy" values="'+ys+'" dur="2.8s" calcMode="discrete" repeatCount="indefinite"/></circle>';
    s+='<text x="140" y="142" text-anchor="middle" font-size="9" fill="#93a0bd">straight · few steps</text>';
    return s;
  },
  tokens(c){
    let s='<line x1="20" y1="86" x2="260" y2="86" stroke="#334155" stroke-width="1"/>';
    for(let i=0;i<6;i++){ const x=24+i*40;
      s+='<g><rect x="'+x+'" y="64" width="32" height="32" rx="6" fill="'+c+'" opacity="0">'+
        '<animate attributeName="opacity" values="0;1;1;1" keyTimes="0;0.12;0.9;1" dur="3s" begin="'+(i*0.32)+'s" repeatCount="indefinite"/></rect>'+
        '<text x="'+(x+16)+'" y="86" text-anchor="middle" dominant-baseline="middle" font-size="13" fill="#06121f" opacity="0">a'+(i+1)+
        '<animate attributeName="opacity" values="0;1;1;1" keyTimes="0;0.12;0.9;1" dur="3s" begin="'+(i*0.32)+'s" repeatCount="indefinite"/></text></g>'; }
    return s;
  },
  energy(c){
    // U-shaped energy curve; ball does a damped roll and SETTLES at the minimum (no wild bounce).
    const path='M20,40 C70,40 90,120 140,120 C190,120 210,40 260,40';
    // points sit on the bowl y(x)=120-0.01*(x-140)^2, oscillation shrinking toward x=140
    const xs='70;200;95;175;120;150;140';
    const ys='71;84;100;108;116;119;120';
    const kt='0;0.16;0.34;0.52;0.70;0.86;1';
    const spl='0.4 0 0.6 1;0.4 0 0.6 1;0.4 0 0.6 1;0.4 0 0.6 1;0.4 0 0.6 1;0.4 0 0.6 1';
    let s='<path d="'+path+'" fill="none" stroke="#475569" stroke-width="2"/>';
    s+='<circle r="7" fill="'+c+'" style="filter:drop-shadow(0 0 7px '+c+')">'+
      '<animate attributeName="cx" values="'+xs+'" keyTimes="'+kt+'" calcMode="spline" keySplines="'+spl+'" dur="3s" repeatCount="indefinite"/>'+
      '<animate attributeName="cy" values="'+ys+'" keyTimes="'+kt+'" calcMode="spline" keySplines="'+spl+'" dur="3s" repeatCount="indefinite"/>'+
      '<animate attributeName="opacity" values="0;1;1;1;1;1;0" keyTimes="0;0.08;0.3;0.5;0.7;0.92;1" dur="3s" repeatCount="indefinite"/></circle>'+
      '';
    return s;
  },
  rlloop(c){
    const goal='<circle cx="244" cy="40" r="9" fill="none" stroke="#fbbf24" stroke-width="2"/>'+
      '<text x="244" y="44" text-anchor="middle" font-size="11" fill="#fbbf24">★</text>';
    let s=goal;
    const tries=[['M24,120 C90,120 120,60 244,40','#fb7185','0s'],
                 ['M24,120 C80,90 160,110 244,40','#fbbf24','0.9s'],
                 ['M24,120 C100,70 180,52 244,40',c,'1.8s']];
    tries.forEach(([d,col,b])=>{ s+='<path d="'+d+'" fill="none" stroke="'+col+'" stroke-width="2.4" '+
      'stroke-dasharray="320" stroke-dashoffset="320" opacity="0.9">'+
      '<animate attributeName="stroke-dashoffset" values="320;0" dur="0.8s" begin="'+b+'" fill="freeze" repeatCount="1"/>'+
      '<animate attributeName="opacity" values="0;0.9" dur="0.2s" begin="'+b+'" fill="freeze"/></path>'; });
    // reward meter
    s+='<rect x="24" y="132" width="120" height="8" rx="4" fill="#1e293b"/>'+
       '<rect x="24" y="132" width="0" height="8" rx="4" fill="'+c+'">'+
       '<animate attributeName="width" values="0;36;78;118" keyTimes="0;0.33;0.66;1" dur="2.8s" repeatCount="indefinite"/></rect>'+
       '<text x="150" y="140" font-size="10" fill="#93a0bd">reward ↑</text>'+
       '<circle cx="24" cy="120" r="6" fill="'+c+'"/>';
    return s;
  },
  offline(c){
    let s='';
    for(let i=0;i<3;i++){ const y=34+i*30;
      s+='<rect x="22" y="'+y+'" width="150" height="22" rx="5" fill="#0f1c33" stroke="#27406b"/>'+
        '<path d="M30,'+(y+11)+' q20,-12 40,0 t40,0 t40,0" fill="none" stroke="'+c+'" stroke-width="2" opacity="0.8"/>'; }
    s+='';
    // policy reads
    s+='<circle cx="232" cy="64" r="16" fill="#0b1326" stroke="'+c+'" stroke-width="2.5"/>'+
       '<text x="232" y="68" text-anchor="middle" font-size="10" fill="'+c+'">π</text>';
    for(let i=0;i<3;i++){ s+='<circle r="3.5" fill="'+c+'"><animateMotion dur="1.6s" begin="'+(i*0.5)+
      's" repeatCount="indefinite" path="M176,'+(45+i*30)+' L216,64"/>'+
      '<animate attributeName="opacity" values="0;1;0" dur="1.6s" begin="'+(i*0.5)+'s" repeatCount="indefinite"/></circle>'; }
    return s;
  },
  rewardmap(c){
    let s='<path d="M24,120 C90,40 170,40 250,96" fill="none" stroke="#e2e8f0" stroke-width="2.2" '+
      'stroke-dasharray="6 5" opacity="0.85"/>'+
      '';
    const pts=[[60,86],[110,58],[160,58],[210,80]];
    pts.forEach((p,i)=>{ s+='<circle cx="'+p[0]+'" cy="'+p[1]+'" r="6" fill="'+c+'">'+
      '<animate attributeName="r" values="0;26;0" dur="2.6s" begin="'+(i*0.4)+'s" repeatCount="indefinite"/>'+
      '<animate attributeName="opacity" values="0.5;0;0.5" dur="2.6s" begin="'+(i*0.4)+'s" repeatCount="indefinite"/></circle>'; });
    return s;
  },
  adversarial(c){
    let s='<rect x="20" y="50" width="60" height="40" rx="8" fill="#0f1c33" stroke="'+c+'" stroke-width="2"/>'+
      '<text x="50" y="74" text-anchor="middle" font-size="12" fill="'+c+'">G</text>'+
      '<text x="50" y="44" text-anchor="middle" font-size="9" fill="#93a0bd">imitator</text>'+
      '<rect x="200" y="50" width="60" height="40" rx="8" fill="#0f1c33" stroke="#fb7185" stroke-width="2"/>'+
      '<text x="230" y="74" text-anchor="middle" font-size="12" fill="#fb7185">D</text>'+
      '<text x="230" y="44" text-anchor="middle" font-size="9" fill="#93a0bd">spotter</text>'+
      '<line x1="80" y1="70" x2="200" y2="70" stroke="#334155" stroke-width="1.5"/>';
    s+='<circle r="4" fill="'+c+'"><animateMotion dur="1.4s" repeatCount="indefinite" path="M84,70 L196,70"/></circle>';
    s+='<text x="140" y="118" text-anchor="middle" font-size="12" fill="#fb7185">fake?'+
       '<animate attributeName="opacity" values="1;1;0;0" dur="3s" repeatCount="indefinite"/></text>'+
       '<text x="140" y="118" text-anchor="middle" font-size="12" fill="#34d399">real!'+
       '<animate attributeName="opacity" values="0;0;1;1" dur="3s" repeatCount="indefinite"/></text>';
    return s;
  },
  plan(c){
    // learned-model MPC essence: at each step IMAGINE a few candidate futures
    // (inside a receding-horizon window), execute one step of the best, slide, re-plan.
    // All moving parts share one 5s timeline (kt): advance until 0.8, hold until 0.9, reset by 1.
    const ref='M20,110 C70,104 110,66 156,60 C200,54 220,46 256,42';
    const DUR='5s', kt='0;0.8;0.9;1';
    let s='<text x="252" y="32" text-anchor="middle" font-size="13" fill="#fbbf24">★</text>';
    // faint dotted reference path from start to the goal star
    s+='<path d="'+ref+'" fill="none" stroke="#334155" stroke-width="1.5" stroke-dasharray="2 4"/>';
    // executed-so-far: solid, revealed left→right behind the sliding window
    s+='<path d="'+ref+'" fill="none" stroke="'+c+'" stroke-width="3" stroke-linecap="round" stroke-dasharray="300" stroke-dashoffset="300">'+
       '<animate attributeName="stroke-dashoffset" values="300;0;0;300" keyTimes="'+kt+'" dur="'+DUR+'" repeatCount="indefinite"/></path>';
    // sliding horizon window with THREE imagined candidate futures (learned model), best highlighted
    s+='<g><animateTransform attributeName="transform" type="translate" values="0,0;204,0;204,0;0,0" keyTimes="'+kt+'" dur="'+DUR+'" repeatCount="indefinite"/>'+
       '<rect x="16" y="26" width="66" height="100" rx="6" fill="'+c+'" opacity="0.10"/>'+
       '<rect x="16" y="26" width="66" height="100" rx="6" fill="none" stroke="'+c+'" stroke-width="1" stroke-dasharray="3 3" opacity="0.45"/>'+
       '<text x="49" y="22" text-anchor="middle" font-size="8" fill="'+c+'">imagine ↻</text>'+
       // two grey rejected candidates, then the chosen one in the passed-in colour with a check mark
       '<path d="M22,100 C40,64 60,44 80,38" fill="none" stroke="#64748b" stroke-width="1.5" stroke-dasharray="4 3" opacity="0.6"/>'+
       '<path d="M22,100 C42,96 62,98 80,104" fill="none" stroke="#64748b" stroke-width="1.5" stroke-dasharray="4 3" opacity="0.6"/>'+
       '<path d="M22,100 C40,80 58,66 80,58" fill="none" stroke="'+c+'" stroke-width="2.2" stroke-dasharray="4 3" opacity="0.9"/>'+
       '<text x="74" y="54" font-size="9" fill="'+c+'">✓</text>'+
       '</g>';
    // current state riding the executed tip
    s+='<circle r="5" fill="#fff" style="filter:drop-shadow(0 0 5px '+c+')">'+
       '<animateMotion dur="'+DUR+'" repeatCount="indefinite" path="'+ref+'" keyPoints="0;1;1;0" keyTimes="'+kt+'" calcMode="linear"/></circle>';
    // legend line along the bottom
    s+='<text x="14" y="142" font-size="8" fill="#93a0bd">– – imagine futures (learned model)  ·  ▬ execute 1 step  ·  re-plan</text>';
    return s;
  },
  dream(c){
    let s='<circle cx="40" cy="100" r="12" fill="#0b1326" stroke="'+c+'" stroke-width="2.5"/>'+
      '<text x="40" y="104" text-anchor="middle" font-size="12">🤖</text>';
    // thought bubble
    s+='<circle cx="70" cy="78" r="4" fill="#0f1c33" stroke="'+c+'"/>'+
       '<circle cx="84" cy="64" r="6" fill="#0f1c33" stroke="'+c+'"/>'+
       '<rect x="96" y="20" width="160" height="74" rx="16" fill="#0f1c33" stroke="'+c+'" stroke-width="1.6" opacity="0.95"/>';
    s+='<path d="M120,72 C150,30 200,30 232,60" fill="none" stroke="'+c+'" stroke-width="1.6" opacity="0.5" stroke-dasharray="4 4"/>';
    s+='<circle r="5" fill="'+c+'" style="filter:drop-shadow(0 0 6px '+c+')">'+
       '<animateMotion dur="2s" repeatCount="indefinite" path="M120,72 C150,30 200,30 232,60"/></circle>';
    s+='';
    return s;
  },
  videogen(c){
    let s='';
    for(let i=0;i<5;i++){ const x=20+i*52;
      s+='<rect x="'+x+'" y="42" width="44" height="56" rx="5" fill="#0f1c33" stroke="#27406b"/>'+
        '<rect x="'+x+'" y="42" width="44" height="56" rx="5" fill="'+c+'" opacity="0">'+
        '<animate attributeName="opacity" values="0;0.55;0.55;0" keyTimes="0;0.2;0.85;1" dur="3s" begin="'+(i*0.45)+'s" repeatCount="indefinite"/></rect>'+
        '<circle cx="'+(x+22)+'" cy="70" r="'+(6+i*2)+'" fill="none" stroke="'+c+'" stroke-width="2" opacity="0">'+
        '<animate attributeName="opacity" values="0;1;1;0" keyTimes="0;0.2;0.85;1" dur="3s" begin="'+(i*0.45)+'s" repeatCount="indefinite"/></circle>'; }
    s+='<text x="140" y="118" text-anchor="middle" font-size="11" fill="'+c+'">↳ + action</text>';
    return s;
  },
  returncond(c){
    let s='<text x="20" y="30" font-size="11" fill="#93a0bd">target return</text>'+
      '<rect x="20" y="38" width="120" height="10" rx="5" fill="#1e293b"/>'+
      '<rect x="20" y="38" width="108" height="10" rx="5" fill="#fbbf24"/>'+
      '<text x="146" y="47" font-size="11" fill="#fbbf24">100 ★</text>';
    s+='';
    for(let i=0;i<5;i++){ const x=24+i*46;
      s+='<rect x="'+x+'" y="90" width="36" height="28" rx="6" fill="'+c+'" opacity="0">'+
        '<animate attributeName="opacity" values="0;1;1;1" keyTimes="0;0.15;0.9;1" dur="3s" begin="'+(0.6+i*0.36)+'s" repeatCount="indefinite"/></rect>'+
        '<text x="'+(x+18)+'" y="108" text-anchor="middle" font-size="11" fill="#06121f" opacity="0">a'+(i+1)+
        '<animate attributeName="opacity" values="0;1;1;1" keyTimes="0;0.15;0.9;1" dur="3s" begin="'+(0.6+i*0.36)+'s" repeatCount="indefinite"/></text>'; }
    return s;
  },
  goalrelabel(c){
    let s='<circle cx="30" cy="110" r="7" fill="'+c+'"/>'+
      '<text x="236" y="40" text-anchor="middle" font-size="14" fill="#fbbf24">★</text>'+
      '<text x="236" y="54" text-anchor="middle" font-size="9" fill="#93a0bd">goal</text>';
    // attempt that falls short
    s+='<path d="M30,110 C90,60 140,60 176,88" fill="none" stroke="'+c+'" stroke-width="2.4" '+
      'stroke-dasharray="240" stroke-dashoffset="240">'+
      '<animate attributeName="stroke-dashoffset" values="240;0;0;240" keyTimes="0;0.4;0.8;1" dur="3.4s" repeatCount="indefinite"/></path>';
    // landing point becomes new goal
    s+='<circle cx="176" cy="88" r="9" fill="none" stroke="#34d399" stroke-width="2.4">'+
      '<animate attributeName="opacity" values="0;0;1;1;0" keyTimes="0;0.4;0.55;0.85;1" dur="3.4s" repeatCount="indefinite"/></circle>'+
      '<text x="176" y="112" text-anchor="middle" font-size="10" fill="#34d399">↻ new goal'+
      '<animate attributeName="opacity" values="0;0;1;1;0" keyTimes="0;0.4;0.55;0.85;1" dur="3.4s" repeatCount="indefinite"/></text>';
    return s;
  },
  hierarchy(c){
    // manager drops ORDERED sub-goals along one plan line; worker threads through them
    const wp=[[78,56],[140,92],[206,60],[248,104]];
    const line='M40,48 L'+wp.map(p=>p[0]+','+p[1]).join(' L');
    let s='<circle cx="40" cy="32" r="14" fill="'+c+'"/>'+
      '<text x="40" y="36" text-anchor="middle" font-size="10" font-weight="700" fill="#06121f">hi</text>'+
      '<text x="40" y="16" text-anchor="middle" font-size="9" fill="#93a0bd">manager</text>'+
      '<path d="'+line+'" fill="none" stroke="'+c+'" stroke-width="1.4" stroke-dasharray="5 5" opacity="0.4"/>';
    wp.forEach((p,i)=>{ s+='<g opacity="0">'+
      '<animate attributeName="opacity" values="0;1;1" keyTimes="0;0.12;1" dur="3.2s" begin="'+(i*0.4)+'s" fill="freeze" repeatCount="indefinite"/>'+
      '<line x1="'+p[0]+'" y1="'+p[1]+'" x2="'+p[0]+'" y2="'+(p[1]-15)+'" stroke="'+c+'" stroke-width="1.5"/>'+
      '<path d="M'+p[0]+','+(p[1]-15)+' l10,3.5 l-10,3.5 z" fill="'+c+'"/></g>'; });
    s+='<circle r="6" fill="#fff" style="filter:drop-shadow(0 0 6px '+c+')">'+
      '<animateMotion dur="3.2s" repeatCount="indefinite" path="'+line+'"/></circle>'+
      '<text x="248" y="126" text-anchor="middle" font-size="9" fill="#93a0bd">worker</text>';
    return s;
  },
  meta(c){
    let s='';
    const tasks=['A','B','C'];
    tasks.forEach((t,i)=>{ const x=24+i*42;
      s+='<rect x="'+x+'" y="40" width="32" height="32" rx="7" fill="#0f1c33" stroke="'+c+'"/>'+
        '<text x="'+(x+16)+'" y="61" text-anchor="middle" font-size="13" fill="'+c+'">'+t+'</text>'+
        '<text x="'+(x+16)+'" y="88" text-anchor="middle" font-size="12" fill="#34d399">✓</text>'; });
    s+='';
    // new task quickly solved
    s+='<rect x="196" y="40" width="44" height="44" rx="9" fill="#0f1c33" stroke="#fbbf24" stroke-width="2"/>'+
      '<text x="218" y="68" text-anchor="middle" font-size="16" fill="#fbbf24">?'+
      '<animate attributeName="opacity" values="1;1;0" keyTimes="0;0.5;0.6" dur="2.6s" repeatCount="indefinite"/></text>'+
      '<text x="218" y="70" text-anchor="middle" font-size="18" fill="#34d399">✓'+
      '<animate attributeName="opacity" values="0;0;1;1" keyTimes="0;0.6;0.7;1" dur="2.6s" repeatCount="indefinite"/></text>'+
      '';
    return s;
  },
  llmplan(c){
    let s='<rect x="18" y="22" width="150" height="34" rx="9" fill="#0f1c33" stroke="'+c+'"/>'+
      '<text x="28" y="43" font-size="11" fill="#e7ecf6">"put cup on shelf"</text>'+
      '<path d="M40,56 l-8,12 l16,0 z" fill="#0f1c33" stroke="'+c+'"/>';
    const steps=['1 find cup','2 grasp','3 place on shelf'];
    steps.forEach((t,i)=>{ const y=78+i*22;
      s+='<text x="26" y="'+y+'" font-size="11" fill="#cbd5e1" opacity="0">'+t+
        '<animate attributeName="opacity" values="0;1;1" keyTimes="0;0.2;1" dur="3s" begin="'+(i*0.5)+'s" repeatCount="indefinite"/></text>'+
        '<text x="200" y="'+y+'" font-size="12" fill="#34d399" opacity="0">✓'+
        '<animate attributeName="opacity" values="0;1;1" keyTimes="0;0.2;1" dur="3s" begin="'+(0.4+i*0.5)+'s" repeatCount="indefinite"/></text>'; });
    return s;
  },
  affordance(c){
    let s='<rect x="18" y="20" width="244" height="112" rx="12" fill="#0a1426" stroke="#27406b"/>'+
      ''+
      '<line x1="30" y1="116" x2="250" y2="116" stroke="#334155" stroke-width="2"/>';
    // a clearer mug: rim + body + C-handle
    s+='<ellipse cx="136" cy="74" rx="24" ry="6" fill="#26344f" stroke="#5b6b87" stroke-width="1.5"/>'+
       '<rect x="113" y="74" width="46" height="42" rx="6" fill="#1f2a44" stroke="#5b6b87" stroke-width="2"/>'+
       '<path d="M159,84 a13,13 0 0 1 0,24" fill="none" stroke="#5b6b87" stroke-width="4"/>';
    // affordance heat + reticle on the handle
    s+='<circle cx="172" cy="96" r="7" fill="'+c+'">'+
       '<animate attributeName="r" values="7;22;7" dur="2.2s" repeatCount="indefinite"/>'+
       '<animate attributeName="opacity" values="0.65;0;0.65" dur="2.2s" repeatCount="indefinite"/></circle>'+
       '<circle cx="172" cy="96" r="12" fill="none" stroke="'+c+'" stroke-width="2"/>'+
       '<line x1="172" y1="80" x2="172" y2="112" stroke="'+c+'" stroke-width="1"/>'+
       '<line x1="156" y1="96" x2="188" y2="96" stroke="'+c+'" stroke-width="1"/>'+
       '<text x="172" y="128" text-anchor="middle" font-size="9" fill="'+c+'">grasp the handle</text>';
    return s;
  },

  // ---------- distinct RL animations ----------
  qlearn(c){
    const cols=6, rows=3, x0=22, y0=34, cw=38, ch=30;
    let s='';
    for(let r=0;r<rows;r++) for(let col=0;col<cols;col++){
      const x=x0+col*cw, y=y0+r*ch; const d=Math.abs(5-col)+Math.abs(0-r);
      s+='<rect x="'+x+'" y="'+y+'" width="'+(cw-4)+'" height="'+(ch-4)+'" rx="4" fill="#0f1c33" stroke="#27406b"/>'+
        '<rect x="'+x+'" y="'+y+'" width="'+(cw-4)+'" height="'+(ch-4)+'" rx="4" fill="'+c+'" opacity="0">'+
        '<animate attributeName="opacity" values="0;'+(0.12+0.5*(1-d/8)).toFixed(2)+'" dur="0.5s" begin="'+((8-d)*0.16).toFixed(2)+'s" fill="freeze"/></rect>'; }
    s+='<text x="'+(x0+5*cw+15)+'" y="'+(y0+16)+'" text-anchor="middle" font-size="14" fill="#fbbf24">★</text>';
    const path='M'+(x0+17)+','+(y0+2*ch+13)+' L'+(x0+cw*2+17)+','+(y0+2*ch+13)+' L'+(x0+cw*2+17)+','+(y0+13)+' L'+(x0+cw*5+17)+','+(y0+13);
    s+='<circle r="6" fill="#fff" opacity="0" style="filter:drop-shadow(0 0 6px '+c+')">'+
      '<animate attributeName="opacity" values="0;1" dur="0.01s" begin="1.6s" fill="freeze"/>'+
      '<animateMotion dur="3s" begin="1.6s" repeatCount="indefinite" path="'+path+'"/></circle>'+
      '';
    return s;
  },
  pgrad(c){
    const px=42, py=80;
    const ends=[[120,30],[168,26],[214,52],[226,92],[196,122]]; const best=1;
    let s='<circle cx="'+px+'" cy="'+py+'" r="7" fill="'+c+'"/>'+
      '<text x="176" y="20" font-size="11" fill="#fbbf24">★ reward</text>';
    ends.forEach((e,i)=>{ const isB=i===best;
      s+='<line x1="'+px+'" y1="'+py+'" x2="'+e[0]+'" y2="'+e[1]+'" stroke="'+c+'" stroke-linecap="round">'+
        '<animate attributeName="stroke-width" values="'+(isB?2:5)+';'+(isB?8:1.2)+';'+(isB?2:5)+'" dur="3s" repeatCount="indefinite"/>'+
        '<animate attributeName="opacity" values="'+(isB?0.5:0.6)+';'+(isB?1:0.12)+';'+(isB?0.5:0.6)+'" dur="3s" repeatCount="indefinite"/></line>'; });
    s+='';
    return s;
  },
  actorcritic(c){
    let s='<rect x="18" y="30" width="66" height="38" rx="9" fill="#0f1c33" stroke="'+c+'" stroke-width="2"/>'+
      '<text x="51" y="54" text-anchor="middle" font-size="12" fill="'+c+'">Actor</text>'+
      '<rect x="196" y="30" width="66" height="38" rx="9" fill="#0f1c33" stroke="#34d399" stroke-width="2"/>'+
      '<text x="229" y="54" text-anchor="middle" font-size="12" fill="#34d399">Critic</text>'+
      '<text x="140" y="44" text-anchor="middle" font-size="9" fill="#93a0bd">action →</text>'+
      '<circle r="4" fill="'+c+'"><animateMotion dur="1.6s" repeatCount="indefinite" path="M84,49 L196,49"/></circle>'+
      '<text x="229" y="86" text-anchor="middle" font-size="11" fill="#34d399">Q = +0.8'+
      '<animate attributeName="opacity" values="0.25;1;0.25" dur="1.6s" repeatCount="indefinite"/></text>'+
      '<path d="M196,62 C150,98 90,98 58,70" fill="none" stroke="#34d399" stroke-width="1.4" stroke-dasharray="4 4" opacity="0.6"/>'+
      '<text x="128" y="102" text-anchor="middle" font-size="9" fill="#34d399">grade → improve</text>'+
      '<rect x="200" y="98" width="58" height="20" rx="4" fill="#0f1c33" stroke="#27406b"/>'+
      '<text x="229" y="112" text-anchor="middle" font-size="8.5" fill="#93a0bd">replay buffer</text>';
    return s;
  },

  // ---------- distinct world-model animations ----------
  videopred(c){
    let s='';
    for(let i=0;i<5;i++){ const x=20+i*52;
      s+='<rect x="'+x+'" y="42" width="44" height="62" rx="5" fill="#0f1c33" stroke="#27406b"/>'+
        '<rect x="'+x+'" y="42" width="44" height="62" rx="5" fill="'+c+'" opacity="0">'+
        '<animate attributeName="opacity" values="0;0.55;0.55;0" keyTimes="0;0.2;0.85;1" dur="3s" begin="'+(i*0.45)+'s" repeatCount="indefinite"/></rect>'+
        '<circle cx="'+(x+22)+'" cy="73" r="'+(6+i*2)+'" fill="none" stroke="'+c+'" stroke-width="2" opacity="0">'+
        '<animate attributeName="opacity" values="0;1;1;0" keyTimes="0;0.2;0.85;1" dur="3s" begin="'+(i*0.45)+'s" repeatCount="indefinite"/></circle>'; }
    return s;
  },
  videoaction(c){
    let s='<rect x="20" y="50" width="56" height="60" rx="7" fill="#0f1c33" stroke="#5b6b87" stroke-width="1.5"/>'+
      '<text x="48" y="44" text-anchor="middle" font-size="9" fill="#93a0bd">now</text>'+
      '<circle cx="48" cy="80" r="9" fill="none" stroke="#5b6b87" stroke-width="2"/>'+
      '<path d="M76,80 L100,80" stroke="'+c+'" stroke-width="2"/>'+
      '<rect x="100" y="68" width="40" height="24" rx="6" fill="'+c+'"/>'+
      '<text x="120" y="84" text-anchor="middle" font-size="11" fill="#06121f">a →</text>'+
      '<path d="M140,80 L168,80" stroke="'+c+'" stroke-width="2"/>'+
      '<rect x="170" y="50" width="56" height="60" rx="7" fill="#0f1c33" stroke="'+c+'" stroke-width="2"/>'+
      '<text x="198" y="44" text-anchor="middle" font-size="9" fill="'+c+'">predicted next</text>'+
      '<circle cy="80" r="7" fill="none" stroke="'+c+'" stroke-width="2">'+
      '<animate attributeName="cx" values="190;212;190" dur="2.4s" repeatCount="indefinite"/>'+
      '<animate attributeName="r" values="5;11;5" dur="2.4s" repeatCount="indefinite"/></circle>'+
      '';
    return s;
  },
  worldaction(c){
    let s='';
    for(let i=0;i<4;i++){ const x=20+i*60;
      s+='<rect x="'+x+'" y="30" width="52" height="42" rx="5" fill="#0f1c33" stroke="#27406b"/>'+
        '<rect x="'+x+'" y="30" width="52" height="42" rx="5" fill="'+c+'" opacity="0">'+
        '<animate attributeName="opacity" values="0;0.5;0.5;0" keyTimes="0;0.2;0.85;1" dur="3s" begin="'+(i*0.5)+'s" repeatCount="indefinite"/></rect>'+
        '<circle cx="'+(x+26)+'" cy="51" r="8" fill="none" stroke="'+c+'" stroke-width="2" opacity="0.5"/>'; }
    s+='';
    for(let i=0;i<4;i++){ const x=20+i*60;
      s+='<rect x="'+(x+8)+'" y="100" width="36" height="22" rx="5" fill="'+c+'" opacity="0">'+
        '<animate attributeName="opacity" values="0;1;1;1" keyTimes="0;0.15;0.9;1" dur="3s" begin="'+(i*0.5+0.2)+'s" repeatCount="indefinite"/></rect>'+
        '<text x="'+(x+26)+'" y="115" text-anchor="middle" font-size="10" fill="#06121f" opacity="0">a'+(i+1)+
        '<animate attributeName="opacity" values="0;1;1;1" keyTimes="0;0.15;0.9;1" dur="3s" begin="'+(i*0.5+0.2)+'s" repeatCount="indefinite"/></text>'; }
    return s;
  },
  occupancy(c){
    const cols=8, rows=4, x0=20, y0=30, cw=30, ch=24;
    const occ=new Set(['2,1','3,1','4,1','5,1','3,2','4,2']);
    let s='';
    for(let r=0;r<rows;r++) for(let col=0;col<cols;col++){
      const x=x0+col*cw, y=y0+r*ch;
      s+='<rect x="'+x+'" y="'+y+'" width="'+(cw-3)+'" height="'+(ch-3)+'" rx="3" fill="#0b1326" stroke="#27406b"/>';
      if(occ.has(col+','+r)){ s+='<rect x="'+x+'" y="'+y+'" width="'+(cw-3)+'" height="'+(ch-3)+'" rx="3" fill="'+c+'" opacity="0">'+
        '<animate attributeName="opacity" values="0;0.85" dur="0.4s" begin="'+(0.3+((col+r)%4)*0.2).toFixed(2)+'s" fill="freeze"/></rect>'; }
    }
    const path='M'+(x0+15)+','+(y0+3*ch+11)+' L'+(x0+cw*7+15)+','+(y0+3*ch+11)+' L'+(x0+cw*7+15)+','+(y0+11);
    s+='<path d="'+path+'" fill="none" stroke="#34d399" stroke-width="2.5" stroke-dasharray="300" stroke-dashoffset="300">'+
      '<animate attributeName="stroke-dashoffset" values="300;0" dur="1.6s" begin="1.4s" fill="freeze"/></path>'+
      '<circle r="5" fill="#fff" opacity="0"><animate attributeName="opacity" values="0;1" dur="0.01s" begin="1.4s" fill="freeze"/>'+
      '<animateMotion dur="1.6s" begin="1.4s" repeatCount="indefinite" path="'+path+'"/></circle>';
    return s;
  },

  // ---------- classical / traditional control ----------
  pid(c){
    // 3-stage story: P (droops → offset) → P+I (reaches) → P+I+D (damps overshoot)
    const P=[6,98,188];
    const titles=['P','P + I','P + I + D'];
    let s='';
    P.forEach((px,i)=>{
      s+='<line x1="'+(px+6)+'" y1="40" x2="'+(px+84)+'" y2="40" stroke="#fbbf24" stroke-width="1" stroke-dasharray="4 3" opacity="0.8"/>';
      s+='<text x="'+(px+45)+'" y="24" text-anchor="middle" font-size="12" font-weight="800" fill="'+c+'">'+titles[i]+'</text>';
    });
    function draw(d,col,w,kt,op){ return '<path d="'+d+'" fill="none" stroke="'+col+'" stroke-width="'+w+'" stroke-linecap="round" opacity="'+op+'" stroke-dasharray="340" stroke-dashoffset="340"><animate attributeName="stroke-dashoffset" values="340;340;0;0;340" keyTimes="'+kt+'" dur="6s" repeatCount="indefinite"/></path>'; }
    // P: overshoots then decaying-oscillates, and SETTLES BELOW the target (offset)
    s+=draw('M14,98 C26,98 32,46 40,44 C50,42 50,66 56,64 C64,62 64,50 72,52 C80,54 82,56 88,56', c, 2.4, '0;0.04;0.22;0.9;1', '1');
    s+='<line x1="88" y1="56" x2="88" y2="40" stroke="#fb7185" stroke-width="1" stroke-dasharray="2 2"/><text x="90" y="51" font-size="6.5" fill="#fb7185">offset</text>';
    // P+I: bigger overshoot, still oscillates, but SETTLES ON the target (offset gone)
    s+=draw('M106,98 C118,98 122,30 132,28 C144,26 144,54 152,52 C162,50 162,36 172,38 C178,39 179,40 180,40', c, 2.4, '0;0.32;0.52;0.9;1', '1');
    // P+I+D: faint ghost (no D → still rings) + damped smooth (with D)
    s+=draw('M196,98 C214,98 218,24 232,30 C248,36 248,52 262,48 C268,46 268,40 270,40', '#fb7185', 1.5, '0;0.62;0.80;0.9;1', '0.55');
    s+=draw('M196,98 C216,98 226,38 244,40 C254,40 262,40 270,40', c, 2.6, '0;0.64;0.82;0.9;1', '1');
    return s;
  },
  lqr(c){
    // Highlight: (1) you must KNOW the dynamics model, (2) the gain comes from
    // DIRECTLY solving the Riccati equation (one-shot algebra, not trial-and-error).
    let s='';
    // ① known dynamics
    s+='<text x="8" y="27" font-size="8.5" fill="'+c+'">① known model</text>';
    s+='<rect x="8" y="31" width="120" height="23" rx="7" fill="#0c1326" stroke="'+c+'" stroke-width="1.6"/>'+
       '<text x="68" y="47" text-anchor="middle" font-size="12" fill="#e7ecf6">ẋ = A x + B u</text>';
    s+='<line x1="68" y1="54" x2="68" y2="65" stroke="'+c+'" stroke-width="1.6"/><path d="M64,61 l4,5 l4,-5 z" fill="'+c+'"/>';
    // ② solve Riccati (one-shot)
    s+='<text x="8" y="75" font-size="8.5" fill="'+c+'">② solve once</text>';
    s+='<rect x="8" y="79" width="134" height="40" rx="7" fill="#0c1326" stroke="'+c+'" stroke-width="1.6"/>'+
       '<text x="75" y="95" text-anchor="middle" font-size="8.5" fill="#cbd5e1">AᵀP+PA−PBR⁻¹BᵀP+Q=0</text>'+
       '<text x="75" y="111" text-anchor="middle" font-size="10.5" font-weight="700" fill="'+c+'">⇒  K = R⁻¹BᵀP</text>';
    // arrow to the phase plane
    s+='<line x1="143" y1="99" x2="167" y2="90" stroke="'+c+'" stroke-width="1.6"/><path d="M161,87 l7,3 l-3,6 z" fill="'+c+'"/>'+
       '<text x="156" y="82" text-anchor="middle" font-size="8" fill="#93a0bd">u=−Kx</text>';
    // ③ phase-plane: state spirals smoothly to the origin
    const ox=216, oy=80;
    s+='<line x1="170" y1="'+oy+'" x2="274" y2="'+oy+'" stroke="#27406b" stroke-width="1"/>'+
       '<line x1="'+ox+'" y1="42" x2="'+ox+'" y2="118" stroke="#27406b" stroke-width="1"/>'+
       '<circle cx="'+ox+'" cy="'+oy+'" r="4" fill="#34d399"/><text x="'+(ox+7)+'" y="'+(oy+13)+'" font-size="8" fill="#34d399">0</text>';
    let d='M'+(ox+54)+','+oy+' '; const turns=2.6, steps=56;
    for(let i=1;i<=steps;i++){ const t=i/steps, a=t*turns*2*Math.PI, r=54*(1-t);
      d+='L'+(ox+r*Math.cos(a)).toFixed(1)+','+(oy+r*Math.sin(a)*0.5).toFixed(1)+' '; }
    s+='<path d="'+d+'" fill="none" stroke="'+c+'" stroke-width="1.8" stroke-dasharray="420" stroke-dashoffset="420">'+
       '<animate attributeName="stroke-dashoffset" values="420;0" dur="2.6s" repeatCount="indefinite"/></path>'+
       '<circle r="4" fill="'+c+'" style="filter:drop-shadow(0 0 5px '+c+')"><animateMotion dur="2.6s" calcMode="paced" repeatCount="indefinite" path="'+d+'"/></circle>';
    return s;
  },
  trajopt(c){
    // MPC essence: a receding-horizon WINDOW slides forward; inside it is a dashed
    // PREDICTED plan; only the front step is executed (solid); then re-plan & repeat.
    const ref='M20,112 C66,108 104,64 150,58 C196,52 216,44 256,40';
    const DUR='5s', kt='0;0.8;0.9;1';
    let s='<text x="252" y="30" text-anchor="middle" font-size="13" fill="#fbbf24">★</text>';
    // faint reference (where we want to go)
    s+='<path d="'+ref+'" fill="none" stroke="#334155" stroke-width="1.5" stroke-dasharray="2 4"/>';
    // executed-so-far: solid, revealed left→right (trails the moving window), then resets
    s+='<path d="'+ref+'" fill="none" stroke="'+c+'" stroke-width="3" stroke-linecap="round" stroke-dasharray="300" stroke-dashoffset="300">'+
       '<animate attributeName="stroke-dashoffset" values="300;0;0;300" keyTimes="'+kt+'" dur="'+DUR+'" repeatCount="indefinite"/></path>';
    // the moving prediction horizon window (+ a dashed predicted plan inside it), slides forward
    s+='<g><animateTransform attributeName="transform" type="translate" values="0,0;206,0;206,0;0,0" keyTimes="'+kt+'" dur="'+DUR+'" repeatCount="indefinite"/>'+
       '<rect x="18" y="28" width="62" height="96" rx="6" fill="'+c+'" opacity="0.10"/>'+
       '<rect x="18" y="28" width="62" height="96" rx="6" fill="none" stroke="'+c+'" stroke-width="1" stroke-dasharray="3 3" opacity="0.45"/>'+
       '<text x="49" y="24" text-anchor="middle" font-size="8" fill="'+c+'">horizon ↻</text>'+
       '<path d="M22,100 C40,74 58,60 78,52" fill="none" stroke="'+c+'" stroke-width="2" stroke-dasharray="4 3" opacity="0.75"/>'+
       '</g>';
    // current state riding the executed tip (front of the window)
    s+='<circle r="5" fill="#fff" style="filter:drop-shadow(0 0 5px '+c+')">'+
       '<animateMotion dur="'+DUR+'" repeatCount="indefinite" path="'+ref+'" keyPoints="0;1;1;0" keyTimes="'+kt+'" calcMode="linear"/></circle>';
    // minimal legend: dashed = predicted plan, solid = executed
    s+='<text x="14" y="142" font-size="8" fill="#93a0bd">– – predict ahead  ·  ▬ execute 1 step  ·  re-plan</text>';
    return s;
  },
  planning(c){
    let s='<circle cx="26" cy="120" r="6" fill="'+c+'"/>'+
      '<text x="250" y="36" text-anchor="middle" font-size="13" fill="#fbbf24">★</text>'+
      '<rect x="108" y="52" width="52" height="48" rx="6" fill="#1f2a44" stroke="#5b6b87"/>';
    const segs=[['M26,120 L60,96','0s'],['M60,96 L48,64','0.3s'],['M60,96 L96,108','0.5s'],
                ['M96,108 L100,122','0.7s'],['M48,64 L80,40','0.9s'],['M80,40 L130,34','1.1s'],
                ['M96,108 L172,112','1.2s'],['M172,112 L200,82','1.5s'],['M130,34 L196,44','1.6s'],
                ['M200,82 L240,48','1.9s']];
    segs.forEach(function(seg){ s+='<path d="'+seg[0]+'" fill="none" stroke="#475569" stroke-width="1.4" stroke-dasharray="60" stroke-dashoffset="60">'+
      '<animate attributeName="stroke-dashoffset" values="60;0" dur="0.4s" begin="'+seg[1]+'" fill="freeze"/></path>'; });
    const fp='M26,120 L60,96 L48,64 L80,40 L130,34 L196,44 L240,48';
    s+='<path d="'+fp+'" fill="none" stroke="'+c+'" stroke-width="2.6" stroke-dasharray="420" stroke-dashoffset="420" opacity="0.95">'+
      '<animate attributeName="stroke-dashoffset" values="420;0" dur="1.4s" begin="2.2s" fill="freeze"/></path>'+
      '';
    return s;
  }
};

renderMap();
</script>
</body>
</html>
"""


# ---------------------------------------------------------------------------
# Survey-driven additions (same pattern as Classical Control): VLA family,
# Sim-to-Real, and Representation pretraining. Added here, not in the app.
# ---------------------------------------------------------------------------
# Families added by this script on top of the app's own hubs. Each record
# carries the hub key, its display label and its hex colour.
EXTRA_FAMILIES = [
    {"key": fam_key, "label": fam_label, "color": fam_color}
    for fam_key, fam_label, fam_color in (
        ("VLA", "Vision-Language-Action", "#f59e0b"),
        ("Sim2Real", "Sim-to-Real", "#0ea5e9"),
        ("Representation", "Representation Pretraining", "#65a30d"),
    )
]
# Paradigm records for the extra families. Every entry uses the same keys:
#   id / name / short  - identifier, full title, and the short label
#   family             - one of the EXTRA_FAMILIES keys ("VLA", "Sim2Real", "Representation")
#   anim               - name of the animation to play for this paradigm
#   tagline / simple   - one-line summary and a longer plain-English explanation
#   mapping / math     - input -> output sketch and a LaTeX formula (raw string)
#   when / pros / cons - usage guidance and trade-off bullet lists
#   papers             - citation labels as "Name (year)"
#   learn              - (link title, URL) pair
EXTRA_PARADIGMS = [
    dict(id="vla-foundation", name="VLA Foundation Models", short="VLA Foundation", family="VLA", anim="vla",
         tagline="A VLM trunk + an action head, trained on many robots' data.",
         simple=("Take a pretrained vision-language model (so it already 'knows' objects and language), "
                 "bolt on an action head, and fine-tune on huge multi-robot datasets. One model then "
                 "follows language commands across many tasks and embodiments — RT-2, OpenVLA, π0, GR00T."),
         mapping="image + instruction → robot actions",
         math=r"\pi_\theta(a\mid o,\ell),\;\;\theta\;\text{init from a VLM};\;\text{head}\in\{\text{tokens},\,\text{diffusion},\,\text{flow}\}",
         when="Generalist, language-conditioned manipulation across tasks and embodiments.",
         pros=["Web-scale priors from the VLM", "One model, many tasks/robots", "Language-conditioned"],
         cons=["Data- and compute-heavy", "Inference latency", "Still brittle out of distribution"],
         # GR00T N1 was released in March 2025 (previously listed here as 2024).
         papers=["RT-2 (2023)", "OpenVLA (2024)", "π0 (2024)", "GR00T N1 (2025)"],
         learn=("OpenVLA — project page", "https://openvla.github.io/")),
    dict(id="vla-rl", name="RL-Finetuned VLA", short="RL-Finetuned VLA", family="VLA", anim="rlloop",
         tagline="Let a pretrained VLA practice with rewards, not just copy demos.",
         simple=("Imitation only copies demonstrations. RL fine-tuning lets a pretrained VLA actually "
                 "practice — collect rewards (in the real world or inside a world model) and improve "
                 "beyond the demos, fixing systematic failures imitation can't."),
         mapping="VLA + reward → improved VLA",
         math=r"\max_\theta\;\mathbb{E}_{\tau\sim\pi_\theta}\!\Big[\textstyle\sum_t \gamma^t r_t\Big]\;\;\text{from a pretrained VLA}",
         when="Push a strong imitation VLA past the demo ceiling; close the loop with a world model.",
         pros=["Improves beyond demos", "Fixes systematic failures", "Pairs with world models"],
         cons=["Needs reward / simulator", "Can destabilize a good policy", "Sample cost"],
         papers=["VLA-RFT (2025)", "iRe-VLA (2024)", "RL post-training of VLAs"],
         learn=("Illustrated RLHF — Hugging Face", "https://huggingface.co/blog/rlhf")),
    dict(id="domain-randomization", name="Domain Randomization", short="Domain Randomization", family="Sim2Real", anim="domainrand",
         tagline="Randomize the simulator so the real world is just another variation.",
         simple=("Train in simulation, but randomize everything — colors, lighting, friction, masses. "
                 "The policy sees so many variations that the real world looks like just one more, so it "
                 "transfers without any real-world training data."),
         mapping="randomized sims → robust real policy",
         math=r"\max_\pi\;\mathbb{E}_{\xi\sim p(\xi)}\,\mathbb{E}_{\tau\sim\pi,\,\mathrm{sim}_\xi}\!\Big[\textstyle\sum_t \gamma^t r_t\Big]",
         when="Sim-to-real for locomotion / dexterity when real data is scarce or dangerous.",
         pros=["No real-world training", "Cheap, parallel sims", "Backbone of legged/dexterous deploys"],
         cons=["Over-randomization hurts performance", "Needs a decent simulator", "Reality gap remains"],
         papers=["Domain Randomization (Tobin 2017)", "OpenAI Dactyl (2018)"],
         learn=("Solving Rubik's Cube (domain randomization) — OpenAI", "https://openai.com/index/solving-rubiks-cube/")),
    dict(id="sim2real-adapt", name="Domain Adaptation (RMA)", short="Domain Adaptation", family="Sim2Real", anim="domainrand",
         tagline="Quickly infer the real robot's true dynamics, then adapt online.",
         simple=("Instead of being robust to everything, learn to quickly figure out the real robot's "
                 "properties from a few moments of motion, then adapt on the fly — Rapid Motor Adaptation "
                 "(RMA) does this for legged robots walking on new terrain."),
         mapping="online experience → adapted policy",
         math=r"z_t=\phi(o_{1:t},a_{1:t}),\quad \pi(a\mid o,z_t)\;\;(\text{infer dynamics, then adapt})",
         when="Hardware whose dynamics differ from sim; changing terrain or payload.",
         pros=["Adapts to real dynamics", "Fast, online", "Strong legged-robot results"],
         cons=["Needs an adaptation module", "Base still sim-trained", "Limited to seen variation range"],
         papers=["RMA (Kumar 2021)", "domain adaptation for control"],
         learn=("RMA: Rapid Motor Adaptation — project page", "https://ashish-kmr.github.io/rma-legged-robots/")),
    dict(id="visual-pretrain", name="Visual Pretraining (R3M / MVP / VIP)", short="Visual Pretraining", family="Representation", anim="repr",
         tagline="Pretrain a vision encoder on web/human video, then freeze it for control.",
         simple=("Robot data is scarce, but internet video is endless. Pretrain a visual encoder on web / "
                 "human video with self-supervised or value objectives (R3M, MVP, VIP), freeze it, and "
                 "train a small policy on top — so you need far fewer robot demos."),
         mapping="web video → frozen encoder → small policy",
         math=r"\phi^*=\arg\min_\phi \mathcal{L}_{\text{SSL}}(\phi;\,\text{web video})\;\Rightarrow\;\pi_\psi(a\mid \phi(o))",
         when="Low-data manipulation; reuse perception across tasks.",
         pros=["Few robot demos needed", "Reusable perception", "Leverages internet video"],
         cons=["Frozen features may miss task cues", "Encoder–task mismatch", "Not a full policy"],
         papers=["R3M (2022)", "MVP (2022)", "VIP (2023)"],
         learn=("R3M — project page", "https://sites.google.com/view/robot-r3m/")),
    dict(id="latent-action", name="Latent Action Pretraining (LAPA)", short="Latent Action", family="Representation", anim="latentact",
         tagline="Learn 'latent actions' from unlabeled video, then map them to motors.",
         simple=("Most video has no action labels. Learn a latent 'what changed between frames' code from "
                 "raw video, pretrain a policy in that latent-action space, then map the latents to real "
                 "motor commands with only a little labeled data — LAPA / UniPi-style."),
         mapping="unlabeled video → latent actions → motors",
         math=r"\hat z_t=\mathrm{VQ}(o_t,o_{t+1}),\;\;p_\psi(o_{t+1}\!\mid o_t,\hat z_t)\;\Rightarrow\;a_t=h_\phi(\hat z_t)",
         when="Bootstrapping policies from action-free video at scale.",
         pros=["Uses action-free video", "Cuts labeled-data needs", "Scales with video"],
         cons=["Latent→action mapping needs labels", "VQ fidelity limits", "Indirect"],
         papers=["LAPA (2024)", "UniPi (2023)"],
         learn=("Latent Action Pretraining (LAPA) — project page", "https://latentactionpretraining.github.io/")),
]
# Extra connections as (source id, target id, label, kind-code) tuples.
# NOTE(review): the meaning of the "b" / "v" kind codes is defined by the
# consumer of this list, which is not visible in this part of the file.
EXTRA_EDGES = (
    # Links into and around the VLA family.
    [
        ("tokenized-bc", "vla-foundation", "tokenized action head for a VLA", "b"),
        ("flow-matching-policy", "vla-foundation", "flow action head for a VLA", "b"),
        ("diffusion-policy", "vla-foundation", "diffusion action head for a VLA", "b"),
        ("vla-foundation", "vla-rl", "RL fine-tunes the VLA past the demo ceiling", "b"),
        ("policy-gradient-rl", "vla-rl", "RL objective for the fine-tune", "b"),
        ("vla-foundation", "llm-planner", "both VLM/LLM-based & language-conditioned", "v"),
    ]
    # Sim-to-real links.
    + [
        ("policy-gradient-rl", "domain-randomization", "sim RL trained over randomized physics", "b"),
        ("domain-randomization", "sim2real-adapt", "two routes across the reality gap", "v"),
    ]
    # Representation-pretraining links.
    + [
        ("visual-pretrain", "diffusion-policy", "a frozen visual encoder feeds the policy", "b"),
        ("latent-action", "vla-foundation", "latent-action pretraining warm-starts VLAs", "b"),
        ("latent-action", "generative-video-wm", "both learn from action-free video", "v"),
        ("visual-pretrain", "latent-action", "representation pretraining from video", "v"),
    ]
)

# Extra animations injected into the shared template's ANIM object.
# render() splices this raw JavaScript text in right after the template's
# "const ANIM = {" opener, so every entry must be an object-literal method
# ending with a trailing comma. Each method takes a colour string `c` and
# returns a string of SVG markup. Defined here: vla, domainrand, repr,
# latentact.
# NOTE(review): EXTRA_PARADIGMS also uses anim="rlloop", which is not defined
# in this string — presumably the template already provides it; confirm.
ROBOT_EXTRA_ANIM_JS = r"""
  vla(c){
    let s='<rect x="14" y="40" width="40" height="40" rx="6" fill="#172036" stroke="'+c+'" stroke-width="1.5"/><circle cx="34" cy="60" r="9" fill="none" stroke="'+c+'" stroke-width="2"/>';
    s+='<rect x="14" y="88" width="118" height="20" rx="6" fill="#172036" stroke="#334155"/><text x="22" y="102" font-size="9" fill="#cbd5e1">"pick up the cup"</text>';
    s+='<rect x="64" y="40" width="68" height="40" rx="9" fill="#0c1326" stroke="'+c+'" stroke-width="2"/><text x="98" y="64" text-anchor="middle" font-size="11" fill="'+c+'">VLM</text>';
    for(let i=0;i<4;i++)s+='<rect x="'+(148+i*28)+'" y="50" width="24" height="22" rx="5" fill="'+c+'" opacity="0"><animate attributeName="opacity" values="0;1;1" keyTimes="0;0.12;1" dur="3s" begin="'+(0.6+i*0.3)+'s" repeatCount="indefinite"/></rect>'+
      '<text x="'+(160+i*28)+'" y="65" text-anchor="middle" font-size="9" fill="#06121f" opacity="0">a'+(i+1)+'<animate attributeName="opacity" values="0;1;1" keyTimes="0;0.12;1" dur="3s" begin="'+(0.6+i*0.3)+'s" repeatCount="indefinite"/></text>';
    s+='';
    return s;
  },
  domainrand(c){
    let s='';
    const bg=['#1f2a44','#3b2a1f','#1f3b2a'];
    bg.forEach((b,i)=>{const x=14+i*60;
      s+='<rect x="'+x+'" y="24" width="52" height="40" rx="5" fill="'+b+'" stroke="'+c+'" stroke-width="1"><animate attributeName="opacity" values="0.5;1;0.5" dur="2.4s" begin="'+(i*0.3)+'s" repeatCount="indefinite"/></rect>'+
        '<circle cx="'+(x+26)+'" cy="44" r="7" fill="'+c+'" opacity="0.8"/>';});
    for(let i=0;i<3;i++)s+='<line x1="'+(40+i*60)+'" y1="66" x2="120" y2="92" stroke="'+c+'" stroke-width="1" stroke-dasharray="3 3" opacity="0.4"/>';
    s+='<rect x="92" y="92" width="58" height="24" rx="9" fill="#0c1326" stroke="'+c+'" stroke-width="2"/><text x="121" y="108" text-anchor="middle" font-size="10" fill="'+c+'">robust π</text>';
    s+='<path d="M152,104 L186,104" stroke="#34d399" stroke-width="2"/><path d="M180,99 l8,5 l-8,5" fill="none" stroke="#34d399" stroke-width="2"/><text x="196" y="100" font-size="14">🤖</text><text x="192" y="118" font-size="8" fill="#34d399">real robot</text>';
    return s;
  },
  repr(c){
    let s='';
    for(let i=0;i<4;i++)s+='<rect x="'+(14+i*26)+'" y="24" width="22" height="28" rx="3" fill="#172036" stroke="#27406b"/>';
    s+='<text x="14" y="74" font-size="9" fill="'+c+'">self-supervised → frozen encoder 🔒</text>';
    s+='<rect x="14" y="82" width="70" height="30" rx="8" fill="#0c1326" stroke="'+c+'" stroke-width="2"/><text x="49" y="101" text-anchor="middle" font-size="10" fill="'+c+'">φ frozen</text>';
    s+='<path d="M86,97 L120,97" stroke="'+c+'" stroke-width="2"/><path d="M114,92 l8,5 l-8,5" fill="none" stroke="'+c+'" stroke-width="2"/>';
    s+='<rect x="124" y="84" width="54" height="26" rx="8" fill="#172036" stroke="#475569"/><text x="151" y="101" text-anchor="middle" font-size="9" fill="#cbd5e1">small π</text><text x="182" y="101" font-size="8" fill="#93a0bd">few demos</text>';
    return s;
  },
  latentact(c){
    let s='<rect x="14" y="40" width="38" height="38" rx="5" fill="#172036" stroke="#27406b"/><text x="33" y="34" text-anchor="middle" font-size="8" fill="#93a0bd">oₜ</text><circle cx="30" cy="59" r="6" fill="'+c+'" opacity="0.7"/>';
    s+='<rect x="62" y="40" width="38" height="38" rx="5" fill="#172036" stroke="#27406b"/><text x="81" y="34" text-anchor="middle" font-size="8" fill="#93a0bd">oₜ₊₁</text><circle cx="86" cy="59" r="6" fill="'+c+'" opacity="0.7"/>';
    s+='<path d="M104,59 L140,59" stroke="'+c+'" stroke-width="2"/><path d="M134,54 l8,5 l-8,5" fill="none" stroke="'+c+'" stroke-width="2"/><text x="120" y="44" text-anchor="middle" font-size="8" fill="#93a0bd">latent action</text>';
    s+='<rect x="142" y="46" width="44" height="28" rx="8" fill="'+c+'"/><text x="164" y="64" text-anchor="middle" font-size="12" fill="#06121f">ẑ</text>';
    s+='<path d="M164,76 L164,98" stroke="'+c+'" stroke-width="2"/><path d="M159,92 l5,8 l5,-8" fill="none" stroke="'+c+'" stroke-width="2"/><text x="164" y="116" text-anchor="middle" font-size="10" fill="'+c+'">→ motor action</text>';
    s+='';
    return s;
  },
"""
# Caption entries for the extra animations, rendered as JavaScript
# object-literal properties (`name:"caption",`) and concatenated into one
# string; render() inserts it right after the template's "const ANIM_CAP = {".
ROBOT_EXTRA_CAP_JS = "".join(
    f'{anim_name}:"{caption}",'
    for anim_name, caption in (
        ("vla", "A VLM trunk reads the scene + instruction and emits actions."),
        ("domainrand", "Randomize the sim so the real world is just another variation."),
        ("repr", "Pretrain a vision encoder on video; freeze it for control."),
        ("latentact", "Learn latent actions from unlabeled video, then map to motors."),
    )
)


def render():
    """Return the full page HTML as a string.

    Starts from TEMPLATE, inserts the extra animation methods and captions
    directly after the first occurrence of their object openers, then swaps
    every ``__DATA_JSON__`` placeholder for the JSON-encoded ``build_data()``
    result.
    """
    # (opener to look for, text to append right after it)
    injections = (
        ("const ANIM = {", "\n" + ROBOT_EXTRA_ANIM_JS),
        ("const ANIM_CAP = {", "\n  " + ROBOT_EXTRA_CAP_JS + "\n"),
    )
    page = TEMPLATE
    for opener, addition in injections:
        # Only the first match is touched; later occurrences stay as-is.
        page = page.replace(opener, opener + addition, 1)
    payload = json.dumps(build_data())
    return page.replace("__DATA_JSON__", payload)


def main():
    """Generate the page, write it to ``robot_landscape.html`` and print a summary.

    The summary shows the output path, the size of the written file in bytes,
    and the number of families, paradigms and edges in the data.
    """
    import os  # local import: only needed for the size report below

    data = build_data()
    html = render()
    out = "robot_landscape.html"
    with open(out, "w", encoding="utf-8") as fh:
        fh.write(html)
    # len(html) counts characters, not bytes; the page contains non-ASCII
    # glyphs that take several bytes each in UTF-8, so ask the filesystem
    # for the real size of what was written.
    size = os.path.getsize(out)
    print(f"wrote {out}  ({size:,} bytes)")
    print(f"  families={len(data['families'])} paradigms={len(data['paradigms'])} edges={len(data['edges'])}")


# Generate the page only when this file is run as a script, not on import.
if __name__ == "__main__":
    main()