runs: subtle 'clear' button next to compare selected

runs: live counter + keep compare selections across filter swaps
- Counter shows 'N / cap' where cap flips 10→50 based on whether any chip is active. Updates immediately on chip click and after every htmx swap.
- compare-select.js no longer prunes selections that aren't in the current DOM slice — server-side filtering replaces the whole list, so absence from DOM means 'off-current-filter', not 'run deleted'.
2026-04-22 18:04:24 -06:00 · 2026-04-22 18:02:35 -06:00 · 2026-04-22 17:54:46 -06:00 · 2026-04-22 17:48:35 -06:00 · 2026-04-22 17:28:55 -06:00 · 2026-04-22 17:23:51 -06:00
14 changed files with 486 additions and 144 deletions
--- a/app/web/main.py
+++ b/app/web/main.py
@ -475,6 +475,18 @@ def run_args_hash(
 embed_args_hash = run_args_hash


+def sci_notation(v: Any) -> str:
+    """Float → compact sci notation (0.005 → '5E-3', 0.01 → '1E-2').
+    Used in stems and Prefect run names so filenames + UI avoid periods.
+
+    Trailing zeros of the 4-significant-digit mantissa are dropped, so a
+    period only remains when more than one digit is needed
+    (0.0015 → '1.5E-3'). Values float() rejects, and non-finite values
+    (inf / nan), are returned as str(v)."""
+    try:
+        f = float(v)
+    except (TypeError, ValueError):
+        return str(v)
+    text = f"{f:.3e}"
+    if "e" not in text:
+        # inf / nan format as 'inf' / 'nan' with no exponent part; the
+        # two-name unpack below would raise ValueError on them.
+        return str(v)
+    m, e = text.split("e")
+    m = m.rstrip("0").rstrip(".")
+    return f"{m}E{int(e)}"
+
+
 def synthesize_output_paths(
    generator_path: str,
    embedder: str,
@ -487,8 +499,9 @@ def synthesize_output_paths(
 ) -> Tuple[str, str]:
    gen = generator_path.split(".")[-1]
    emb = embedder.split(".")[-1]
-    ref = f"{gen}_Reference_N{num_points}_T{num_timesteps}_J{jitter_scale}_s{seed}.html"
-    base = f"{gen}_{emb}_N{num_points}_T{num_timesteps}_J{jitter_scale}_s{seed}"
+    j = sci_notation(jitter_scale)
+    ref = f"{gen}_Reference_N{num_points}_T{num_timesteps}_J{j}_s{seed}.html"
+    base = f"{gen}_{emb}_N{num_points}_T{num_timesteps}_J{j}_s{seed}"
    if embed_args is None:
        embf = f"{base}.html"
    else:
@ -534,32 +547,46 @@ class Prefect:
        return None

    async def create_run(
-        self, client: httpx.AsyncClient, parameters: Dict[str, Any]
+        self,
+        client: httpx.AsyncClient,
+        parameters: Dict[str, Any],
+        tags: Optional[List[str]] = None,
    ) -> Optional[Dict[str, Any]]:
        dep = await self.deployment_id(client)
        if not dep:
            return None
+        body: Dict[str, Any] = {"parameters": parameters}
+        if tags:
+            body["tags"] = list(tags)
        r = await client.post(
            f"{self.base}/deployments/{dep}/create_flow_run",
-            json={"parameters": parameters},
+            json=body,
        )
        if r.status_code >= 400:
            return {"error": r.text, "status": r.status_code}
        return r.json()

    async def recent_runs(
-        self, client: httpx.AsyncClient, limit: int = 10
+        self,
+        client: httpx.AsyncClient,
+        limit: int = 10,
+        required_tags: Optional[List[str]] = None,
    ) -> List[Dict[str, Any]]:
        dep = await self.deployment_id(client)
        if not dep:
            return []
+        flow_runs: Dict[str, Any] = {"deployment_id": {"any_": [dep]}}
+        if required_tags:
+            flow_runs["tags"] = {"all_": list(required_tags)}
+        # Prefect rejects limit > 200 with HTTP 422.
+        capped = min(max(1, limit), 200)
        try:
            r = await client.post(
                f"{self.base}/flow_runs/filter",
                json={
                    "sort": "START_TIME_DESC",
-                    "limit": limit,
-                    "flow_runs": {"deployment_id": {"any_": [dep]}},
+                    "limit": capped,
+                    "flow_runs": flow_runs,
                },
            )
            if r.status_code == 200:
@ -568,6 +595,19 @@ class Prefect:
            return []
        return []

+    async def update_tags(
+        self, client: httpx.AsyncClient, run_id: str, tags: List[str]
+    ) -> bool:
+        """PATCH `tags` onto the flow run `run_id`.
+
+        Returns True when the response status is below 400, False on an
+        error status or when httpx raises an HTTPError."""
+        try:
+            r = await client.patch(
+                f"{self.base}/flow_runs/{run_id}",
+                json={"tags": list(tags)},
+            )
+        except httpx.HTTPError:
+            return False
+        return r.status_code < 400
+

 PREFECT = Prefect()

@ -663,7 +703,9 @@ def _run_view(run: Dict[str, Any]) -> Dict[str, Any]:
        "ref_exists": ref_exists,
        "emb_exists": emb_exists,
        "embedder_short": (params.get("embedder") or "").split(".")[-1],
-        "generator_short": (params.get("generator_path") or "").split(".")[-1],
+        "generator_short": _dataset_id(
+            params.get("generator_path") or "", params.get("generator_kwargs") or {}
+        ),
    }


@ -736,10 +778,49 @@ async def reducer_form(request: Request, name: str) -> HTMLResponse:
    )


+def _chip_filter_tags(params) -> List[str]:
+    """Build the Prefect `tags all_` list from chip-filter query params
+    (?dataset=…&algorithm=…&N=…&T=…&J=…). An axis whose value is missing,
+    empty, or whitespace-only contributes no tag."""
+    selected: List[str] = []
+    for axis in ("dataset", "algorithm", "N", "T", "J"):
+        value = (params.get(axis) or "").strip()
+        if not value:
+            continue
+        selected.append(f"{axis}:{value}")
+    return selected
+
+
+@app.get("/runs/axes.json")
+async def runs_axes() -> JSONResponse:
+    """Distinct chip values across the last N deployment-scoped runs. Lets
+    the chip bar show the full universe regardless of the current filter.
+
+    Returns a JSON object mapping each axis (dataset, algorithm, N, T, J)
+    to a sorted list of the values seen in `<axis>:<value>` run tags."""
+    async with httpx.AsyncClient(timeout=5.0) as client:
+        # NOTE: recent_runs clamps the limit to 200 (Prefect rejects more),
+        # so at most 200 runs are scanned here.
+        runs = await PREFECT.recent_runs(client, limit=500)
+    values: Dict[str, set] = {k: set() for k in ("dataset", "algorithm", "N", "T", "J")}
+    for r in runs:
+        for tag in r.get("tags") or []:
+            k, sep, v = tag.partition(":")
+            if sep and k in values:
+                values[k].add(v)
+
+    def _numeric_key(x: str) -> Tuple[int, float, str]:
+        # A tag value that is not a number (e.g. a hand-edited tag) must not
+        # take the endpoint down: sort such values after the numeric ones.
+        try:
+            return (0, float(x) if x else 0.0, x)
+        except ValueError:
+            return (1, 0.0, x)
+
+    # Sort numeric axes numerically.
+    def _sort(k, vs):
+        if k in ("N", "T", "J"):
+            return sorted(vs, key=_numeric_key)
+        return sorted(vs)
+    return JSONResponse({k: _sort(k, v) for k, v in values.items()})
+
+
@app.get("/runs", response_class=HTMLResponse)
 async def runs_partial(request: Request) -> HTMLResponse:
+    required = _chip_filter_tags(request.query_params)
+    # Server-side tag filter → one narrow query per chip state. When any
+    # axis is unfiltered, Prefect returns the K most recent for that slice;
+    # when fully filtered, usually a handful of exact matches.
+    limit = 50 if required else 10
    async with httpx.AsyncClient(timeout=5.0) as client:
-        runs = await PREFECT.recent_runs(client, limit=10)
+        runs = await PREFECT.recent_runs(client, limit=limit, required_tags=required)
    views = [_run_view(r) for r in runs]
    _mark_stale_views(views)
    return templates.TemplateResponse(
@ -839,8 +920,13 @@ async def submit(request: Request) -> HTMLResponse:
    if generator_kwargs:
        parameters["generator_kwargs"] = generator_kwargs

+    tags = build_run_tags(
+        generator_path, generator_kwargs, reducer,
+        num_points, num_timesteps, jitter_scale,
+    )
+
    async with httpx.AsyncClient(timeout=10.0) as client:
-        run = await PREFECT.create_run(client, parameters)
+        run = await PREFECT.create_run(client, parameters, tags=tags)

    if not run:
        return HTMLResponse(
@ -904,7 +990,7 @@ async def metrics_json() -> JSONResponse:


 _STEM_RE = re.compile(
-    r"^make_[A-Za-z_]+?_[A-Za-z]+_N\d+_T\d+_J[\d.]+_s\d+(?:_[0-9a-f]{8})?$"
+    r"^make_[A-Za-z_]+?_[A-Za-z]+_N\d+_T\d+_J[\d.Ee+\-]+_s\d+(?:_[0-9a-f]{8})?$"
 )

 # Map short generator name ("make_blobs") to its DATASET_META entry.
@ -914,6 +1000,62 @@ for _m in DATASET_META.values():
    _GEN_TO_META.setdefault(_m["path"].rsplit(".", 1)[-1], _m)


+# Kwargs the flow injects / we supply explicitly — never part of the
+# dataset's semantic identity, so strip them before DATASET_META matching
+# and before regenerating labels.
+_TRANSIENT_GEN_KWARGS = {"n_samples", "random_state"}
+
+
+def _clean_gen_kwargs(gk: Optional[Dict[str, Any]]) -> Optional[Dict[str, Any]]:
+    """Return a copy of `gk` without the keys in _TRANSIENT_GEN_KWARGS;
+    None is passed through unchanged."""
+    if gk is None:
+        return None
+    kept: Dict[str, Any] = {}
+    for name, value in gk.items():
+        if name in _TRANSIENT_GEN_KWARGS:
+            continue
+        kept[name] = value
+    return kept
+
+
+# Tag axes the chip-filter and backfill both care about: the short
+# prefixes of the "<axis>:<value>" tags that build_run_tags emits.
+TAG_AXES = ("dataset", "algorithm", "N", "T", "J")
+
+
+def build_run_tags(
+    generator_path: str,
+    generator_kwargs: Optional[Dict[str, Any]],
+    embedder: str,
+    num_points: int,
+    num_timesteps: int,
+    jitter_scale: float,
+) -> List[str]:
+    """Compute the five `<axis>:<value>` tags (dataset, algorithm, N, T, J)
+    attached to a flow run so the chip filter can narrow server-side via
+    Prefect's tag `all_` filter. Exactly one value per axis, in that order."""
+    dataset = _dataset_id(generator_path, generator_kwargs)
+    algorithm = (embedder or "").rsplit(".", 1)[-1]
+    axis_values = (
+        ("dataset", dataset),
+        ("algorithm", algorithm),
+        ("N", int(num_points)),
+        ("T", int(num_timesteps)),
+        ("J", sci_notation(jitter_scale)),
+    )
+    return [f"{axis}:{value}" for axis, value in axis_values]
+
+
+def _dataset_id(generator_path: str, generator_kwargs: Optional[Dict[str, Any]]) -> str:
+    """Resolve a run's dataset to its DATASET_META key — e.g. 'swiss_roll'
+    vs 'swiss_roll_hole'.
+
+    Entries are shortlisted by the generator's short name (last dotted
+    component of the path). Among those, the first whose kwargs equal the
+    cleaned `generator_kwargs` wins; with no kwargs match (or kwargs of
+    None) the first shortlisted key is used. With no shortlisted entry at
+    all, the short name itself is returned."""
+    short = (generator_path or "").rsplit(".", 1)[-1]
+    cleaned = _clean_gen_kwargs(generator_kwargs)
+    shortlisted = [
+        key for key, meta in DATASET_META.items()
+        if meta["path"].rsplit(".", 1)[-1] == short
+    ]
+    if not shortlisted:
+        return short
+    fallback = shortlisted[0]
+    if cleaned is None:
+        return fallback
+    return next(
+        (key for key in shortlisted if DATASET_META[key]["kwargs"] == cleaned),
+        fallback,
+    )
+
+
 def _lookup_dataset_meta(
    generator_short: str, generator_kwargs: Optional[Dict[str, Any]]
 ) -> Optional[Dict[str, Any]]:
@ -926,9 +1068,10 @@ def _lookup_dataset_meta(
    ]
    if not candidates:
        return None
-    if generator_kwargs is not None:
+    gk = _clean_gen_kwargs(generator_kwargs)
+    if gk is not None:
        for m in candidates:
-            if m["kwargs"] == generator_kwargs:
+            if m["kwargs"] == gk:
                return m
    return candidates[0]

@ -963,7 +1106,13 @@ def _enrich_with_labels(d: Dict[str, Any]) -> Dict[str, Any]:
    dm = _lookup_dataset_meta(gen_short, gk)
    if not dm:
        return d
-    kwargs_to_use = gk if gk is not None else dm["kwargs"]
+    # Replace the stem-derived generator short (ambiguous for swiss_roll vs
+    # hole) with the matched DATASET_META id for the panel header.
+    for key, entry in DATASET_META.items():
+        if entry is dm:
+            d["meta"]["generator"] = key
+            break
+    kwargs_to_use = _clean_gen_kwargs(gk) if gk is not None else dm["kwargs"]
    try:
        mod_path, cls_name = dm["path"].rsplit(".", 1)
        fn = getattr(importlib.import_module(mod_path), cls_name)
--- a/app/web/plotly_parse.py
+++ b/app/web/plotly_parse.py
@ -20,7 +20,7 @@ from pathlib import Path

 _STEM_RE = re.compile(
    r"^(?P<gen>make_.+?)_(?P<emb>[A-Za-z]+)_N(?P<n>\d+)_T(?P<t>\d+)"
-    r"_J(?P<j>[\d.]+)_s(?P<s>\d+)(?:_(?P<h>[0-9a-f]{8}))?$"
+    r"_J(?P<j>[\d.Ee+\-]+)_s(?P<s>\d+)(?:_(?P<h>[0-9a-f]{8}))?$"
 )

 # plotly's typed-array dtype -> (struct format char, item size bytes)
--- a/app/web/static/compare-select.js
+++ b/app/web/static/compare-select.js
@ -8,6 +8,7 @@
  const selected = new Set();

  const btn = document.getElementById('compare-btn');
+  const clearBtn = document.getElementById('compare-clear');
  const countEl = document.getElementById('compare-count');
  const slot = document.getElementById('runs-slot');
  if (!btn || !countEl || !slot) return;
@ -16,17 +17,15 @@
    const n = selected.size;
    countEl.textContent = `(${n}/${MAX})`;
    btn.disabled = n < MIN || n > MAX;
+    if (clearBtn) clearBtn.hidden = n === 0;
  }

  function applyToDOM() {
-    const checkboxes = slot.querySelectorAll('.compare-cb');
-    // Drop any selected stems that are no longer in the DOM (run aged out of list)
-    const present = new Set();
-    checkboxes.forEach((cb) => present.add(cb.dataset.stem));
-    for (const s of [...selected]) if (!present.has(s)) selected.delete(s);
-
+    // Selections persist across swaps — with server-side filtering, rows
+    // leave the DOM when they don't match the current filter, but the user
+    // still has them "in the cart".
    const atCap = selected.size >= MAX;
-    checkboxes.forEach((cb) => {
+    slot.querySelectorAll('.compare-cb').forEach((cb) => {
      const stem = cb.dataset.stem;
      cb.checked = selected.has(stem);
      cb.disabled = atCap && !cb.checked;
@ -61,5 +60,10 @@
    window.open(`/compare?${qs}`, '_blank', 'noopener');
  });

+  if (clearBtn) clearBtn.addEventListener('click', () => {
+    selected.clear();
+    applyToDOM();
+  });
+
  applyToDOM();
 })();
--- a/app/web/static/compare.js
+++ b/app/web/static/compare.js
@ -1,7 +1,7 @@
 // compare.js — thin shim that parses ?stem=…&stem=… (legacy ?a=&b=) and
 // hands off to panel-grid.js.

-import { mountPanels } from './panel-grid.js?v=5';
+import { mountPanels } from './panel-grid.js?v=6';

 const params = new URLSearchParams(window.location.search);
 let stems = params.getAll('stem').filter(Boolean);
--- a/app/web/static/panel-grid.js
+++ b/app/web/static/panel-grid.js
@ -567,6 +567,9 @@ export function mountPanels({ host, controls, stems }) {
  // Reset controls to a clean state (they may be reused across opens).
  if (scrub)   scrub.value = '0';
  if (playBtn) { playBtn.textContent = '▶'; playBtn.setAttribute('aria-label', 'play'); }
+  // Axes dropdown is meaningless for a single-panel view (nothing to lock
+  // against; aspect is fixed by the modal dialog's own sizing).
+  if (syncSel) syncSel.disabled = total < 2;

  // Parallel fetch; each panel's error is independent.
  const ready = Promise.allSettled(stems.map(fetchFrames)).then((results) => {
--- a/app/web/static/run-modal.js
+++ b/app/web/static/run-modal.js
@ -1,7 +1,7 @@
 // run-modal.js — homepage click-hijack for embedding links. Opens a
 // <dialog id="run-modal"> that renders the run's embedding via panel-grid.js.

-import { mountPanels } from './panel-grid.js?v=5';
+import { mountPanels } from './panel-grid.js?v=6';

 const dialog = document.getElementById('run-modal');
 const host = document.getElementById('modal-panel-host');
--- a/app/web/static/runs-filter.js
+++ b/app/web/static/runs-filter.js
@ -1,114 +1,123 @@
-// Filter the recent-runs list by dataset + algorithm chips.
-// State lives outside #runs-slot so it survives the 3s htmx poll. After
-// each swap we repopulate chip options from whatever runs came back, then
-// re-apply the current selection to hide non-matching rows.
+// Cassette-style single-select chip filter. Each axis has at most one
+// selection; clicking the selected chip again releases it. State lives
+// here and rides along on the htmx-polled /runs request via hx-vals on
+// #runs-slot. Chip universe comes from /runs/axes.json so the bar shows
+// the full history, not just the currently-displayed page.

 (function () {
  const slot = document.getElementById('runs-slot');
-  const dsEl = document.getElementById('runs-flt-dataset');
-  const algEl = document.getElementById('runs-flt-algo');
-  if (!slot || !dsEl || !algEl) return;
+  if (!slot) return;

-  // null = "all selected" (no filtering on this axis). Populated Sets
-  // override that. Sticky across htmx swaps.
-  let datasets = null;
-  let algorithms = null;
+  const AXES = [
+    { key: 'dataset',   chipsId: 'runs-flt-dataset', numeric: false },
+    { key: 'algorithm', chipsId: 'runs-flt-algo',    numeric: false },
+    { key: 'N',         chipsId: 'runs-flt-n',       numeric: true  },
+    { key: 'T',         chipsId: 'runs-flt-t',       numeric: true  },
+    { key: 'J',         chipsId: 'runs-flt-j',       numeric: true  },
+  ];

-  function scanValues() {
-    const ds = new Set();
-    const alg = new Set();
-    slot.querySelectorAll('li.run').forEach((li) => {
-      const d = li.dataset.generator; if (d) ds.add(d);
-      const a = li.dataset.embedder;  if (a) alg.add(a);
-    });
-    return {
-      datasets: [...ds].sort(),
-      algorithms: [...alg].sort(),
-    };
+  for (const ax of AXES) {
+    ax.el = document.getElementById(ax.chipsId);
+    ax.group = ax.el ? ax.el.closest('.runs-filter-group') : null;
+    ax.selected = null;
+    ax.universe = [];
  }

-  function paint(container, values, selected) {
-    container.innerHTML = '';
+  function stateAsQuery() {
+    const p = {};
+    for (const ax of AXES) {
+      if (ax.selected != null) p[ax.key] = ax.selected;
+    }
+    return p;
+  }
+
+  function syncHtmxVals() {
+    // Feed the current chip state into every htmx request on #runs-slot
+    // (including the 3s poll). JSON form.
+    slot.setAttribute('hx-vals', JSON.stringify(stateAsQuery()));
+  }
+
+  function paint(ax) {
+    if (!ax.el) return;
+    ax.el.innerHTML = '';
+    const values = ax.universe;
+    if (ax.group) ax.group.style.display = values.length <= 1 ? 'none' : '';
    for (const v of values) {
      const b = document.createElement('button');
      b.type = 'button';
-      const on = selected == null || selected.has(v);
+      const on = ax.selected === v;
      b.className = 'chip' + (on ? ' is-on' : '');
      b.dataset.value = v;
-      b.dataset.role = 'value';
      b.setAttribute('aria-pressed', on ? 'true' : 'false');
      b.textContent = v;
-      container.appendChild(b);
-    }
-    for (const [role, label] of [['all', 'all'], ['none', 'none']]) {
-      const b = document.createElement('button');
-      b.type = 'button';
-      b.className = 'chip chip-meta';
-      b.dataset.role = role;
-      b.textContent = label;
-      container.appendChild(b);
+      ax.el.appendChild(b);
    }
  }

-  function repaint() {
-    const { datasets: allDs, algorithms: allAlg } = scanValues();
-    paint(dsEl, allDs, datasets);
-    paint(algEl, allAlg, algorithms);
+  function repaintAll() {
+    for (const ax of AXES) paint(ax);
  }

-  function apply() {
-    slot.querySelectorAll('li.run').forEach((li) => {
-      const ds = li.dataset.generator || '';
-      const al = li.dataset.embedder || '';
-      const passDs = datasets == null || datasets.has(ds);
-      const passAl = algorithms == null || algorithms.has(al);
-      li.classList.toggle('filtered-out', !(passDs && passAl));
-    });
+  async function refreshUniverse() {
+    try {
+      const res = await fetch('/runs/axes.json', { cache: 'no-store' });
+      if (!res.ok) return;
+      const data = await res.json();
+      for (const ax of AXES) {
+        ax.universe = Array.isArray(data[ax.key]) ? data[ax.key] : [];
+      }
+      repaintAll();
+    } catch {
+      /* offline → leave whatever we had */
+    }
  }

-  function bind(container, getSet, setSet, allGetter) {
-    container.addEventListener('click', (e) => {
+  function anyFilterActive() {
+    return AXES.some((ax) => ax.selected != null);
+  }
+
+  function updateCounter() {
+    const count = slot.querySelectorAll('li.run').length;
+    const cap = anyFilterActive() ? 50 : 10;
+    const countEl = document.getElementById('runs-count');
+    const capEl = document.getElementById('runs-cap');
+    if (countEl) countEl.textContent = String(count);
+    if (capEl)   capEl.textContent   = String(cap);
+  }
+
+  function triggerRunsRefresh() {
+    // Tell htmx to re-fetch /runs right now with the updated hx-vals.
+    if (window.htmx && typeof window.htmx.trigger === 'function') {
+      window.htmx.trigger(slot, 'filter-changed');
+    }
+  }
+
+  for (const ax of AXES) {
+    if (!ax.el) continue;
+    ax.el.addEventListener('click', (e) => {
      const btn = e.target.closest('.chip');
      if (!btn) return;
-      const role = btn.dataset.role;
-      const all = allGetter();
-      let cur = getSet();
-      if (cur == null) cur = new Set(all);
-      if (role === 'value') {
      const v = btn.dataset.value;
-        if (cur.has(v)) cur.delete(v);
-        else cur.add(v);
-      } else if (role === 'all') {
-        cur = new Set(all);
-      } else if (role === 'none') {
-        cur = new Set();
-      }
-      setSet(cur);
-      repaint();
-      apply();
+      ax.selected = (ax.selected === v) ? null : v;
+      paint(ax);
+      syncHtmxVals();
+      updateCounter();
+      triggerRunsRefresh();
    });
  }

-  bind(
-    dsEl,
-    () => datasets,
-    (s) => { datasets = s; },
-    () => scanValues().datasets,
-  );
-  bind(
-    algEl,
-    () => algorithms,
-    (s) => { algorithms = s; },
-    () => scanValues().algorithms,
-  );
-
+  // After each htmx swap of #runs-slot, repaint the chips from the cached
+  // universe and update the counter. The universe itself only changes in
+  // refreshUniverse().
  document.body.addEventListener('htmx:afterSwap', (e) => {
    if (e.target && e.target.id === 'runs-slot') {
-      repaint();
-      apply();
+      repaintAll();
+      updateCounter();
    }
  });

-  repaint();
-  apply();
+  syncHtmxVals();
+  refreshUniverse();
+  updateCounter();
+  // Periodically refresh the universe so newly-introduced values appear.
+  setInterval(refreshUniverse, 30_000);
 })();
--- a/app/web/static/style.css
+++ b/app/web/static/style.css
@ -513,15 +513,37 @@ button.submit:disabled { background: var(--faint); border-color: var(--faint); c
  font-size: 0.76rem;
  font-style: italic;
 }
+.compare-bar .compare-clear {
+  background: transparent;
+  border: 0;
+  color: var(--faint);
+  font: inherit;
+  font-size: 0.72rem;
+  padding: 0 0.2rem;
+  cursor: pointer;
+  text-decoration: underline dotted;
+  text-underline-offset: 3px;
+}
+.compare-bar .compare-clear:hover { color: var(--alarm); }

 .runs-filter {
  display: flex;
-  flex-wrap: wrap;
-  gap: 0.6rem 1.4rem;
+  flex-direction: column;
+  gap: 0.4rem;
  padding: 0.25rem 0 0.7rem;
  margin-bottom: 0.3rem;
  border-bottom: 1px dashed var(--rule);
 }
+.runs-filter-row {
+  display: flex;
+  flex-wrap: wrap;
+  gap: 0.4rem 1.4rem;
+}
+/* Hide a row entirely when every child group is display:none (all axes
+   in it have a single value). :has is supported in all modern evergreens. */
+.runs-filter-row:not(:has(.runs-filter-group:not([style*="display: none"]))) {
+  display: none;
+}
 .runs-filter-group {
  display: flex;
  align-items: center;
@ -542,6 +564,11 @@ button.submit:disabled { background: var(--faint); border-color: var(--faint); c
  gap: 0.25rem 0.3rem;
  align-items: center;
 }
+.runs-filter-group .chips .chip-meta-wrap {
+  display: inline-flex;
+  gap: 0.25rem 0.3rem;
+  flex-shrink: 0;
+}

 .runs li.run.filtered-out { display: none; }
 .runs li.run.just-submitted {
@ -1680,6 +1707,9 @@ button.submit:disabled { background: var(--faint); border-color: var(--faint); c
  align-items: center;
  gap: 0.35rem;
 }
+/* Hide a wrap entirely when its select is disabled (e.g., axes on a
+   single-panel modal view). */
+.compare-controls label:has(select:disabled) { display: none; }
 .compare-controls .cc-lbl {
  color: var(--faint);
  text-transform: lowercase;
--- a/app/web/templates/_runs.html
+++ b/app/web/templates/_runs.html
@ -9,7 +9,10 @@
    {% for r in runs %}
      <li class="run {% if just_submitted is defined and r.id == just_submitted %}just-submitted{% endif %}{% if r.stale %} stale{% endif %}"
          data-embedder="{{ r.embedder_short or '' }}"
-          data-generator="{{ r.generator_short or '' }}">
+          data-generator="{{ r.generator_short or '' }}"
+          data-n="{{ r.params.get('num_points', '') if r.params else '' }}"
+          data-t="{{ r.params.get('num_timesteps', r.params.get('num_snapshots', '')) if r.params else '' }}"
+          data-j="{{ r.params.get('jitter_scale', '') if r.params else '' }}">
        {% if r.emb_exists and not r.stale %}
          <input type="checkbox" class="compare-cb" data-stem="{{ r.emb_file[:-5] }}" aria-label="select run for comparison" />
        {% else %}
--- a/app/web/templates/compare.html
+++ b/app/web/templates/compare.html
@ -4,7 +4,7 @@
  <meta charset="utf-8" />
  <meta name="viewport" content="width=device-width,initial-scale=1" />
  <title>embedding notebook &middot; compare</title>
-  <link rel="stylesheet" href="/static/style.css?v=32" />
+  <link rel="stylesheet" href="/static/style.css?v=36" />
  <script type="importmap">
  {
    "imports": {
@ -102,7 +102,7 @@
 </template>

 <script src="/static/theme.js?v=11"></script>
-<script type="module" src="/static/compare.js?v=17"></script>
+<script type="module" src="/static/compare.js?v=18"></script>
 <!-- panel-grid.js is imported by compare.js (module); versioned via compare.js cache-bust -->

 </body>
--- a/app/web/templates/index.html
+++ b/app/web/templates/index.html
@ -4,7 +4,7 @@
  <meta charset="utf-8" />
  <meta name="viewport" content="width=device-width,initial-scale=1" />
  <title>embedding notebook</title>
-  <link rel="stylesheet" href="/static/style.css?v=32" />
+  <link rel="stylesheet" href="/static/style.css?v=38" />
  <script src="https://unpkg.com/htmx.org@2.0.4"></script>
  <script type="importmap">
  {
@ -296,7 +296,7 @@
    <div class="section-label">
      <span>§ 4 &nbsp; recent runs</span>
      <span class="run-count">
-        <span id="runs-count">{{ runs|length }}</span> / 10 · refresh 3s
+        <span id="runs-count">{{ runs|length }}</span> / <span id="runs-cap">10</span> &middot; refresh 3s
        <span id="poll-ind" class="htmx-indicator" style="margin-left:6px">&#9679;</span>
      </span>
    </div>
@ -305,24 +305,41 @@
      <button type="button" id="compare-btn" disabled>
        compare selected <span id="compare-count">(0/8)</span>
      </button>
+      <button type="button" id="compare-clear" class="compare-clear" hidden aria-label="clear selection">clear</button>
      <span class="compare-hint muted">pick 2&ndash;8 embeddings &rarr; side-by-side animation in a new tab</span>
    </div>

    <div class="runs-filter" id="runs-filter">
-      <div class="runs-filter-group">
+      <div class="runs-filter-row">
+        <div class="runs-filter-group" data-axis="dataset">
          <span class="ctl-label">dataset</span>
          <div class="chips" id="runs-flt-dataset" aria-label="filter by dataset"></div>
        </div>
-      <div class="runs-filter-group">
+        <div class="runs-filter-group" data-axis="algorithm">
          <span class="ctl-label">algorithm</span>
          <div class="chips" id="runs-flt-algo" aria-label="filter by algorithm"></div>
        </div>
      </div>
+      <div class="runs-filter-row">
+        <div class="runs-filter-group" data-axis="n">
+          <span class="ctl-label">N</span>
+          <div class="chips" id="runs-flt-n" aria-label="filter by N"></div>
+        </div>
+        <div class="runs-filter-group" data-axis="t">
+          <span class="ctl-label">T</span>
+          <div class="chips" id="runs-flt-t" aria-label="filter by T"></div>
+        </div>
+        <div class="runs-filter-group" data-axis="j">
+          <span class="ctl-label">J</span>
+          <div class="chips" id="runs-flt-j" aria-label="filter by J"></div>
+        </div>
+      </div>
+    </div>

    <div
      id="runs-slot"
      hx-get="/runs"
-      hx-trigger="load delay:3s, every 3s"
+      hx-trigger="load delay:3s, every 3s, filter-changed"
      hx-swap="innerHTML"
      hx-indicator="#poll-ind"
    >
@ -484,9 +501,9 @@
 <script src="/static/theme.js?v=11"></script>
 <script type="module" src="/static/dataset-picker.js?v=11"></script>
 <script type="module" src="/static/metrics.js?v=11"></script>
-<script src="/static/compare-select.js?v=2"></script>
-<script src="/static/runs-filter.js?v=1"></script>
-<script type="module" src="/static/run-modal.js?v=2"></script>
+<script src="/static/compare-select.js?v=4"></script>
+<script src="/static/runs-filter.js?v=6"></script>
+<script type="module" src="/static/run-modal.js?v=3"></script>
 <script>
  // Anchor-links alone don't expand <details>; force it.
  document.querySelector('a[href="#metrics"]')?.addEventListener('click', () => {
--- a/flows/embedding_flow.py
+++ b/flows/embedding_flow.py
@ -43,6 +43,19 @@ def _run_args_hash(
    return hashlib.sha1(s.encode()).hexdigest()[:8]


+def _sci(v: Any) -> str:
+    """Float → compact sci notation (e.g. 0.005 → 5E-3, 0.01 → 1E-2).
+    Keeps Prefect's UI happy — it doesn't like periods in run names.
+
+    Trailing zeros of the 4-significant-digit mantissa are dropped, so a
+    period only remains when more than one digit is needed
+    (0.0015 → 1.5E-3). Values float() rejects, and non-finite values
+    (inf / nan), are returned as str(v)."""
+    try:
+        f = float(v)
+    except (TypeError, ValueError):
+        return str(v)
+    text = f"{f:.3e}"
+    if "e" not in text:
+        # inf / nan format as 'inf' / 'nan' with no exponent part; the
+        # two-name unpack below would raise ValueError on them.
+        return str(v)
+    m, e = text.split("e")
+    m = m.rstrip("0").rstrip(".")
+    return f"{m}E{int(e)}"
+
+
 def _flow_run_name() -> str:
    """Name each Prefect run after the stem of its output fig, so runs are
    searchable / hoverable instead of wearing Prefect's auto-generated
@ -52,7 +65,7 @@ def _flow_run_name() -> str:
    emb = (p.get("embedder") or "").rsplit(".", 1)[-1] or "?"
    N = p.get("num_points", "?")
    T = p.get("num_timesteps", "?")
-    J = p.get("jitter_scale", "?")
+    J = _sci(p.get("jitter_scale", "?"))
    s = p.get("seed", "?")
    tag = _run_args_hash(p.get("embed_args"), p.get("generator_kwargs"))
    return f"{gen}_{emb}_N{N}_T{T}_J{J}_s{s}_{tag}"
@ -315,12 +328,13 @@ def embedding_flow(

    Path(output_dir).mkdir(parents=True, exist_ok=True)
    _generator = generator_path.split(".")[-1]
+    _j = _sci(jitter_scale)
    output_ref: str = (
-        f"{output_dir.strip('/')}/{_generator}_Reference_N{num_points}_T{num_timesteps}_J{jitter_scale}_s{seed}.html"
+        f"{output_dir.strip('/')}/{_generator}_Reference_N{num_points}_T{num_timesteps}_J{_j}_s{seed}.html"
    )
    _args_tag = _run_args_hash(embed_args, user_generator_kwargs)
    output_embed: str = (
-        f"{output_dir.strip('/')}/{_generator}_{embedder.split('.')[-1]}_N{num_points}_T{num_timesteps}_J{jitter_scale}_s{seed}_{_args_tag}.html"
+        f"{output_dir.strip('/')}/{_generator}_{embedder.split('.')[-1]}_N{num_points}_T{num_timesteps}_J{_j}_s{seed}_{_args_tag}.html"
    )
    output_metrics: str = output_embed[:-5] + ".metrics.json"
    output_frames: str = output_embed[:-5] + ".frames.json"
--- a/scripts/backfill_hashes.py
+++ b/scripts/backfill_hashes.py
@ -30,7 +30,7 @@ from typing import Any, Dict, List, Optional

 _ROOT = Path(__file__).resolve().parent.parent
 sys.path.insert(0, str(_ROOT))
-from app.web.main import PREFECT, run_args_hash  # noqa: E402
+from app.web.main import PREFECT, run_args_hash, sci_notation  # noqa: E402


 def _legacy_hash(ea: Optional[Dict[str, Any]]) -> str:
@ -38,30 +38,45 @@ def _legacy_hash(ea: Optional[Dict[str, Any]]) -> str:
    return hashlib.sha1(s.encode()).hexdigest()[:8]


-def _base_stem(params: Dict[str, Any]) -> Optional[str]:
+def _base_stems(params: Dict[str, Any]) -> List[str]:
+    """Return the stem prefix(es) for this run's params: both the current
+    sci-J form and the legacy decimal-J form, so we can find pre-transition
+    files on disk too."""
    try:
        gen = (params.get("generator_path") or "").rsplit(".", 1)[-1]
        emb = (params.get("embedder") or "").rsplit(".", 1)[-1]
        N = int(params["num_points"])
        T = int(params.get("num_timesteps", params.get("num_snapshots")))
-        J = float(params["jitter_scale"])
+        Jf = float(params["jitter_scale"])
        s = int(params["seed"])
    except (KeyError, TypeError, ValueError):
-        return None
+        return []
    if not gen or not emb:
-        return None
-    return f"{gen}_{emb}_N{N}_T{T}_J{J}_s{s}"
+        return []
+    out = [f"{gen}_{emb}_N{N}_T{T}_J{sci_notation(Jf)}_s{s}"]
+    legacy = f"{gen}_{emb}_N{N}_T{T}_J{Jf}_s{s}"
+    if legacy not in out:
+        out.append(legacy)
+    return out


-def _candidate_names(base: str, ea: Dict[str, Any], gk: Dict[str, Any]) -> List[str]:
-    target = f"{base}_{run_args_hash(ea, gk)}.html"
-    legacy = f"{base}_{_legacy_hash(ea)}.html"
-    no_hash = f"{base}.html"
-    # Preserve order: target first so we short-circuit on already-backfilled.
+def _candidate_names(bases: List[str], ea: Dict[str, Any], gk: Dict[str, Any]) -> List[str]:
+    # Target = current sci-J base + new-scheme hash.
+    if not bases:
+        return []
+    target_base = bases[0]
+    target = f"{target_base}_{run_args_hash(ea, gk)}.html"
    out = [target]
-    for x in (legacy, no_hash):
+    # Fall back to every (base, hash) combination we might find on disk.
+    hashes = [run_args_hash(ea, gk), _legacy_hash(ea)]
+    for b in bases:
+        for h in hashes:
+            x = f"{b}_{h}.html"
            if x not in out:
                out.append(x)
+        no_hash = f"{b}.html"
+        if no_hash not in out:
+            out.append(no_hash)
    return out


@ -125,13 +140,13 @@ def main() -> int:
        params = r.get("parameters") or {}
        ea = params.get("embed_args") or {}
        gk = params.get("generator_kwargs") or {}
-        base = _base_stem(params)
-        if not base:
+        bases = _base_stems(params)
+        if not bases:
            continue
-        target = f"{base}_{run_args_hash(ea, gk)}.html"
+        target = f"{bases[0]}_{run_args_hash(ea, gk)}.html"
        if target in seen_targets:
            continue  # later duplicate — the stale-marking logic will handle it
-        for candidate in _candidate_names(base, ea, gk):
+        for candidate in _candidate_names(bases, ea, gk):
            if (figs_dir / candidate).exists():
                if candidate == target:
                    # Already at target; just ensure metrics.json carries gk.
--- a/scripts/backfill_tags.py
+++ b/scripts/backfill_tags.py
@ -0,0 +1,98 @@
+"""Backfill per-run Prefect tags for the chip-filter UX.
+
+Each run in the deployment is tagged with
+  dataset:<id>  algorithm:<short>  N:<n>  T:<t>  J:<j>
+computed from its stored `parameters`. Existing tags on the run are
+preserved; the five axis tags are merged in (replacing any stale value).
+
+Dry-run by default. Pass `--apply` to actually PATCH runs.
+
+Usage:
+    .venv/bin/python scripts/backfill_tags.py [--apply] [--limit N]
+"""
+
+from __future__ import annotations
+
+import argparse
+import asyncio
+import sys
+from pathlib import Path
+from typing import Any, Dict, List
+
+_ROOT = Path(__file__).resolve().parent.parent
+sys.path.insert(0, str(_ROOT))
+
+import httpx  # noqa: E402
+
+from app.web.main import PREFECT, TAG_AXES, build_run_tags  # noqa: E402
+
+
+def _desired_tags(params: Dict[str, Any]) -> List[str]:
+    """Compute the axis tags a run should carry from its stored parameters.
+
+    Missing or falsy values fall back to an empty string, an empty dict or
+    zero; ``num_snapshots`` is read when ``num_timesteps`` is absent. The
+    normalised values are handed to ``build_run_tags`` positionally.
+    """
+    generator_path = params.get("generator_path") or ""
+    generator_kwargs = params.get("generator_kwargs") or {}
+    embedder = params.get("embedder") or ""
+    num_points = int(params.get("num_points", 0) or 0)
+    raw_timesteps = params.get("num_timesteps", params.get("num_snapshots", 0))
+    num_timesteps = int(raw_timesteps or 0)
+    jitter_scale = float(params.get("jitter_scale", 0.0) or 0.0)
+    return build_run_tags(
+        generator_path,
+        generator_kwargs,
+        embedder,
+        num_points,
+        num_timesteps,
+        jitter_scale,
+    )
+
+
+def _merge(existing: List[str], desired: List[str]) -> List[str]:
+    """Combine a run's current tags with the freshly computed axis tags.
+
+    Existing tags that start with one of the ``TAG_AXES`` prefixes
+    (``<axis>:``) are dropped; every other existing tag is kept, in its
+    original order, ahead of the desired tags.
+    """
+    axis_prefixes = tuple(f"{axis}:" for axis in TAG_AXES)
+    merged: List[str] = []
+    for tag in existing or []:
+        if tag.startswith(axis_prefixes):
+            # Stale axis value; the desired list supplies its replacement.
+            continue
+        merged.append(tag)
+    merged.extend(desired)
+    return merged
+
+
+async def main_async(apply: bool, limit: int) -> int:
+    """Plan and optionally apply tag patches for recent deployment runs.
+
+    Fetches up to ``limit`` runs via ``PREFECT.recent_runs``, computes the
+    merged tag list for each, and prints the runs whose tag set would
+    change. With ``apply`` false this is a dry run; otherwise each planned
+    run is patched through ``PREFECT.update_tags``.
+
+    Returns 0 when there was nothing to do, on a dry run, or when every
+    patch succeeded; returns 1 when at least one patch failed, so the
+    process exit status reflects the failure.
+    """
+    async with httpx.AsyncClient(timeout=10.0) as c:
+        runs = await PREFECT.recent_runs(c, limit=limit)
+        planned = []
+        for r in runs:
+            params = r.get("parameters") or {}
+            try:
+                desired = _desired_tags(params)
+            except Exception as e:
+                # Best effort: a run with unusable parameters is reported
+                # and skipped rather than aborting the whole backfill.
+                print(f"  skip {r['id'][:8]} ({e})")
+                continue
+            existing = r.get("tags") or []
+            merged = _merge(existing, desired)
+            # Compare as sets so tag order alone never triggers a patch.
+            if set(merged) == set(existing):
+                continue
+            planned.append((r["id"], existing, merged))
+
+        print(f"scanning deployment runs (seen: {len(runs)})")
+        print(f"  {len(planned)} to patch\n")
+        for rid, _, merged in planned:
+            print(f"  {rid[:8]}  ->  {sorted(merged)}")
+        if not planned:
+            print("nothing to do")
+            return 0
+        if not apply:
+            print("\n(dry run — pass --apply to patch)")
+            return 0
+
+        print("\napplying...")
+        ok = 0
+        for rid, _, merged in planned:
+            if await PREFECT.update_tags(c, rid, merged):
+                ok += 1
+                print(f"  {rid[:8]}  OK")
+            else:
+                print(f"  {rid[:8]}  FAILED")
+        print(f"done — patched {ok}/{len(planned)}")
+        # Surface partial failure to the caller instead of always exiting 0.
+        return 0 if ok == len(planned) else 1
+
+
+def main() -> int:
+    """Parse the command-line flags and run the backfill to completion.
+
+    Returns the status code produced by ``main_async``.
+    """
+    parser = argparse.ArgumentParser(description=__doc__)
+    parser.add_argument(
+        "--apply",
+        action="store_true",
+        help="actually PATCH tags (default: dry-run)",
+    )
+    parser.add_argument(
+        "--limit",
+        type=int,
+        default=500,
+        help="Prefect runs to scan",
+    )
+    opts = parser.parse_args()
+    backfill = main_async(opts.apply, opts.limit)
+    return asyncio.run(backfill)
+
+
+if __name__ == "__main__":
+    sys.exit(main())  # main()'s return value becomes the process exit status
Author	SHA1	Message	Date
Michael Pilosov	ba7eef9df0	runs: subtle 'clear' button next to compare selected	2026-04-22 18:04:24 -06:00
Michael Pilosov	59a6bece2e	runs: live counter + keep compare selections across filter swaps - Counter shows 'N / cap' where cap flips 10→50 based on whether any chip is active. Updates immediately on chip click and after every htmx swap. - compare-select.js no longer prunes selections that aren't in the current DOM slice — server-side filtering replaces the whole list, so absence from DOM means 'off-current-filter', not 'run deleted'.	2026-04-22 18:02:35 -06:00
Michael Pilosov	e94d28b8fc	filenames + run names: J in sci notation (5E-3 not 0.005) Periods in filenames are avoidable and the Prefect UI dislikes them in run names. Uses a shared sci_notation helper in main.py mirrored in the flow. Stem regex (main + parser) now matches J<digits.Ee+-> to accept both old decimal-J and new sci-J filenames so the two transition together. J tag in Prefect tag list also uses the sci form, so chip filters stay consistent. Backfill script extended to find pre-transition (decimal-J) files on disk via a second base-stem variant, then rename them to the sci form. backfill_tags re-patches existing runs so their J tag matches the new canonical form. All 13 existing figs + runs renamed / retagged in-place.	2026-04-22 17:54:46 -06:00
Michael Pilosov	56279dbb1b	runs: server-side chip filter via Prefect tags + cassette chip UX - New runs are tagged on dispatch with dataset:<id> / algorithm:<short> / N:<n> / T:<t> / J:<j> (single value per axis). - /runs accepts ?dataset=&algorithm=&N=&T=&J= and applies Prefect's tags: {all_: [...]} server-side. Without filter, fetch cap is 10; with filter, 50 so narrow results aren't truncated. Prefect's own 200-limit on filter queries is clamped inside recent_runs. - New /runs/axes.json returns the universe of chip values across the last 200 deployment runs so the chip bar shows history even when the current slice is narrow. - runs-filter.js rewritten to cassette-style single-select: clicking the selected chip releases it. No 'all'/'none' meta chips. Chip state feeds #runs-slot via hx-vals; a filter-changed custom event triggers an immediate refetch on change, in addition to the 3s poll. - Prefect client gets an update_tags(run_id, tags) helper. - scripts/backfill_tags.py PATCHes tags onto every existing deployment run (dry-run by default, --apply to commit).	2026-04-22 17:48:35 -06:00
Michael Pilosov	aa1303e373	runs filter: add J (jitter) chip group alongside N and T	2026-04-22 17:28:55 -06:00
Michael Pilosov	4ecdc7f586	modal: hide axes dropdown for single-panel runs Disable #cc-sync in panel-grid when there's only one stem (nothing to sync; aspect is fixed by the dialog) and hide any .compare-controls label whose select is disabled via :has.	2026-04-22 17:23:51 -06:00
Michael Pilosov	d70eff3704	runs filter: N + T chip rows; group all/none meta chips; explicit row layout - Add N and T axes alongside dataset/algorithm; chips populated from runs in the list, axis group hidden when there's a single unique value. - Dataset+algorithm on row 1, N+T on row 2 via two explicit .runs-filter-row flex containers (cleaner than a sentinel break elem that double-counted the row-gap). - 'all' and 'none' meta-chips now wrap as a unit inside .chip-meta-wrap so one doesn't orphan to the next line. - Row is hidden entirely when every axis in it collapses to a single value (:has selector on .runs-filter-row).	2026-04-22 17:20:08 -06:00
Michael Pilosov	4576088c73	labels: distinguish swiss_roll vs swiss_roll_hole in the UI - _run_view uses a new _dataset_id(path, kwargs) that matches DATASET_META by (path, cleaned kwargs) and returns the catalogue key — so the runs list / filter chips show 'swiss_roll' vs 'swiss_roll_hole' rather than collapsing both to 'make_swiss_roll'. - _enrich_with_labels replaces the stem-derived meta.generator with the matched DATASET_META key, so the compare panel header + diff-highlight also distinguish the two variants.	2026-04-22 17:12:46 -06:00
Michael Pilosov	d052ec4223	labels: strip transient n_samples/random_state from generator_kwargs before regen Sidecars written by the pre-fix flow contain merged generator_kwargs (n_samples + random_state=0 mixed in with the user-supplied form). The enrichment call passes n_samples/random_state explicitly, so an old sidecar's gk caused a TypeError (duplicate kwarg) that the try/except swallowed — leaving labels empty and coloring falling back to a plain ramp. Strip those keys before DATASET_META matching and the regen call; matches work naturally against the stripped dict.	2026-04-22 17:09:26 -06:00