diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml
index 7fa8d3c..cca3ef0 100644
--- a/.github/workflows/release.yml
+++ b/.github/workflows/release.yml
@@ -26,6 +26,12 @@ on:
       - 'CMakeLists.txt'
       - 'library.json'
       - '.github/workflows/release.yml'
+      # The web installer + landing page are served from Pages by the deploy-pages job
+      # below; a change to them must trigger a deploy or it never reaches the live site
+      # (the eth-only-provisioning fix shipped a commit that didn't auto-deploy because
+      # docs/install was missing here). src/ui/install-picker*.js is already covered by src/**.
+      - 'docs/install/**'
+      - 'docs/landing/**'
   workflow_dispatch:
     inputs:
       tag:
@@ -102,6 +108,10 @@ jobs:
       - uses: actions/checkout@v4
         with:
           persist-credentials: false
+          # Full history: compute_version.py counts commits since the last v* tag
+          # for the `latest` build's `-dev.<N>` suffix. A shallow clone (the default)
+          # has no tags / partial history and would yield a wrong count.
+          fetch-depth: 0
 
       - name: Cache ESP-IDF tooling
         uses: actions/cache@v4
@@ -129,6 +139,27 @@ jobs:
           elif [ "$IS_MAIN" = "true" ]; then echo "tag=latest" >> "$GITHUB_OUTPUT"
           else echo "tag=$REF_NAME" >> "$GITHUB_OUTPUT"; fi
 
+      # The semver burned into the binary + stamped on the assets/manifest. A
+      # `latest` build gets `<core>-dev.<N>` (N = commits since the last v* tag)
+      # so successive latest builds are orderable; a stable tag gets the core.
+      # Computed once here and reused by build + staging so all three agree.
+      - name: Compute version
+        id: ver
+        # The channel (latest vs stable) and the -rc handling both live in
+        # compute_version.py — pass only the tag, the helper derives the rest, so
+        # this step and the release job's identical step can't disagree. Raw
+        # `python` (not `uv run`): no setup-uv in this job, and the script is stdlib-only.
+        # It uses the job environment's own Python — a `run:` step never executes inside the ESP-IDF docker action.
+        # Tag passed via env (not inline ${{ }}) so it reaches the script as a
+        # plain shell variable, never spliced into the command text — no shell
+        # injection from a crafted tag/ref.
+        env:
+          TAG: ${{ steps.tag.outputs.tag }}
+        run: |
+          set -euo pipefail
+          V=$(python scripts/build/compute_version.py --tag "$TAG")
+          echo "version=$V" >> "$GITHUB_OUTPUT"
+
       - name: Build firmware
         uses: espressif/esp-idf-ci-action@v1
         with:
@@ -150,13 +181,15 @@ jobs:
           # We run our own builder (not the action's default `idf.py build`)
           # so the sdkconfig fragments and EXCLUDE_COMPONENTS go through the
           # same code path as local builds. --release burns the channel tag in.
-          command: python ../scripts/build/build_esp32.py --firmware ${{ matrix.firmware }} --release "${{ steps.tag.outputs.tag }}"
+          command: python ../scripts/build/build_esp32.py --firmware ${{ matrix.firmware }} --release "${{ steps.tag.outputs.tag }}" --version "${{ steps.ver.outputs.version }}"
 
       - name: Stage release artifacts
+        env:
+          VERSION: ${{ steps.ver.outputs.version }}
         run: |
           set -euo pipefail
           mkdir -p dist
-          V=$(jq -r .version library.json)
+          V="$VERSION"   # via env, never spliced into the script text; computed once above, matches the binary's MM_VERSION
           # Per-firmware build dir under build/esp32-<firmware>/ (plan-19.1).
           # build_esp32.py points idf.py at this dir via -B, so the build
           # tree lives outside esp32/ and multiple firmwares can coexist —
@@ -242,6 +273,10 @@ jobs:
       # the "Re-create latest" step below force-pushes the `latest` tag with git,
       # which needs the token in .git/config.
       - uses: actions/checkout@v4
+        with:
+          # Full history: compute_version.py counts commits since the last v* tag
+          # for the manifest's `-dev.<N>` version (must match the binary's).
+          fetch-depth: 0
 
       - uses: astral-sh/setup-uv@v3
 
@@ -272,13 +307,29 @@ jobs:
             echo "tag=$REF_NAME" >> "$GITHUB_OUTPUT"
           fi
 
+      # Same computation as the build job's "Compute version" — the manifest's
+      # version must match the binary's MM_VERSION + the asset names. Channel +
+      # -rc handling live in compute_version.py; pass only the tag (this job has
+      # setup-uv, so `uv run`).
+      - name: Compute version
+        id: ver
+        # Tag via env (not inline ${{ }}) to keep it out of the command text —
+        # no shell injection from a crafted tag/ref.
+        env:
+          TAG: ${{ steps.tag.outputs.tag }}
+        run: |
+          set -euo pipefail
+          V=$(uv run python scripts/build/compute_version.py --tag "$TAG")
+          echo "version=$V" >> "$GITHUB_OUTPUT"
+
       - name: Generate ESP Web Tools manifests (release-asset URLs)
         env:
           TAG: ${{ steps.tag.outputs.tag }}
           REPO: ${{ github.repository }}
+          VERSION: ${{ steps.ver.outputs.version }}
         run: |
           set -euo pipefail
-          V=$(jq -r .version library.json)
+          V="$VERSION"   # via env like TAG, never spliced into the script text; matches binary + asset names
           # Absolute GitHub release-asset URLs. Uploaded as release assets;
           # read by the on-device OTA picker (device fetches the .bin directly
           # — no CORS). The Pages-relative manifests are generated in the
@@ -342,6 +392,14 @@ jobs:
         uses: softprops/action-gh-release@v2
         with:
           tag_name: ${{ steps.tag.outputs.tag }}
+          # Release `name` is the computed semver (e.g. "2.1.0-dev.7"). The device-
+          # hosted UI's dev-channel update check reads it from the CORS-readable
+          # GitHub API (releases/tags/latest) — the manifest-*.json asset that also
+          # carries the version is fetched via a release-asset URL that redirects to
+          # release-assets.githubusercontent.com, which sends no CORS header, so the
+          # browser blocks that read from the device origin. The API exposes `name`
+          # cross-origin, so surfacing the version here is what makes the badge work.
+          name: ${{ steps.ver.outputs.version }}
           # latest and vX.Y.Z-rcN tags are prerelease — they sort below stable
           # on the Releases page and aren't picked up by tooling that asks for
           # "latest release". Stable vX.Y.Z tags publish normally.
diff --git a/CLAUDE.md b/CLAUDE.md
index b5d50c5..d8328bf 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -16,6 +16,7 @@ See `docs/architecture.md` for system design. This file contains only rules and
 - **Default to subtraction.** The reflex on most changes (a bug fix, a review finding, a refactor) should be *can this remove or replace code, or land net-neutral?*, not *what do I add?* If a change only ever grows the line count and the doc count, that's the smell this rule exists to catch. Prefer removing code over adding it; a deletion that preserves behaviour is the best kind of change.
 - **Continuous refactor, no hacks.** Improvement is not a scheduled phase; it happens *the moment* a hack, a divergence, or a duplicated pattern is spotted, in whatever change is already open. The bar is absolute: **never** leave a hack, a workaround, or a bespoke one-off in place because "it works for now" — the fix is the *recognisable, standard* one. So when you reach for a clever shortcut, an environment sniff, a duplicated block, a stub that papers over a broken dependency, stop and ask *what's the textbook construct here?* and do that instead. This is the union of three principles applied as a working reflex rather than a checklist: *[Common patterns first](#principles)* (use the construct a new contributor recognises in 30s), *[Industry standards, our own code](#principles)* (the textbook algorithm AND the textbook name, written fresh against our architecture), and *[Minimalism means elegance](#principles)* (consistency, reuse, no duplication, the fast hot path). What this bullet adds over those: the **timing** (on sight, continuously, not deferred to a "cleanup later" that never comes) and the **no-hacks floor** (a workaround is never the destination; if the standard fix is genuinely out of scope right now, the hack doesn't ship — it's backlogged with the standard fix named, per *[Mandatory subtraction](#process-rules)*). The product-owner-initiated counterpart, for larger restructures, is the *[Refactor for simplicity](#process-rules)* process rule; this principle is the small-scale, agent-initiated version of the same instinct.
 - **No duplication, in code or docs.** Same logic in two places belongs in one shared function; same fact in two docs belongs in one place the other links to. A comment or doc paragraph that restates what the code already says is duplication too; delete it. (Reuse a recognisable shape rather than inventing one; see *Common patterns first* above.)
+- **Document a thing once, reference it generically.** A module is named in exactly three places: its home (its `.h` + one `docs/moonmodules/*.md`), its registration, and its tests. Don't name it elsewhere: in other prose say "a modifier"/"a driver", not `FooModifier`, and don't re-explain what it does — the reader studies its spec. Naming a thing across unrelated files multiplies rename cost and teaches nothing a link wouldn't. *No duplication* applied to names.
 - **Data over objects in the hot path.** This is minimalism's hot-path corollary — the same "minimal memory, fastest hot path" test (see *Minimalism means elegance*), applied where speed and memory matter most and resolved to one answer: design around plain contiguous data, not an object graph. A flat buffer of elements that one stage writes and the next stage reads, following the producer/consumer data flow in [docs/architecture.md](docs/architecture.md). A contiguous buffer is cache-friendly and lets a stage do integer math straight on the array, whereas per-element objects with virtual accessors are cache-hostile and allocation-heavy, exactly what the hot-path rules forbid. So in the render loop: no object graph, no inheritance, don't wrap buffer data in objects. The **one deliberate class hierarchy** is the module tree (one `MoonModule` base, shallow subclasses, a single virtual-dispatch boundary), because uniform polymorphism is what lets the UI render any module generically with zero per-module UI code. **Outside the hot path**, a small *recognizable* adapter interface with a couple of virtuals is allowed when it passes the *Common patterns first* test — e.g. `ListSource` is the textbook data-source/adapter shape (UITableView's data source, Qt's `QAbstractItemModel`): the view is generic, the rows stay with their owner. That is not "adding inheritance" in the sense this rule forbids; a *bespoke* hierarchy outside the module tree still is. The line: hot-path data is flat and object-free, period; off the hot path, prefer flat data but a proven adapter interface beats a hand-rolled callback table when it's more consistent and reusable.
 - **Concrete first, abstract later.** Build one working feature end-to-end before extracting patterns into shared abstractions. Don't build the framework before the domain logic works.
 - **Robust to any input.** A running device tolerates any sequence of UI actions or API calls: add, delete, replace, or reconfigure any module in any order, at any grid size, and it keeps running. Degraded or idle is acceptable; crashed is not. This robustness is a defining strongpoint of projectMM, and it's guarded by the test framework, not by hope: a discovered crash drives a new test that pins the fix (see the Hard Rule). Out of scope: power loss, malformed OTA, brown-out, and other physical/electrical faults the firmware can't intercept; this principle is about what the software accepts as input.
@@ -178,7 +179,7 @@ The "end users will use this" moment. Per-release criteria are defined by the pr
 
 5. **Changelog / release notes**: drafted in the GitHub release body. Skip only for unreleased pre-1.0 tags.
 6. **Cross-platform smoke**: run scenarios on every supported platform (today: PC + ESP32; later: + Teensy, RPi), if the release claims new platform support or the version bumps a major or minor.
-7. **Principles audit**: sweep `docs/` (except `docs/backlog/` and `docs/history/`) and `src/` for forward-looking language ("roadmap", "will be", "planned", "in the future", "currently lacks", `TODO`, `FIXME`) and other violations of § Principles. Acceptable hits carry a one-line justification; the rest get rewritten present-tense or moved to `docs/backlog/backlog.md` / `docs/history/`. The reviewer agent can run this end-to-end. Skip only for releases where the diff against the previous tag is doc-empty.
+7. **Principles audit**: sweep `docs/` (except `docs/backlog/` and `docs/history/`) and `src/` for forward-looking language ("roadmap", "will be", "planned", "in the future", "currently lacks", `TODO`, `FIXME`) and other violations of § Principles. Acceptable hits carry a one-line justification; the rest get rewritten present-tense or moved to `docs/backlog/` / `docs/history/`. The reviewer agent can run this end-to-end. Skip only for releases where the diff against the previous tag is doc-empty.
 
 What the agent reads:
 - Always: `CLAUDE.md`, `architecture.md`
@@ -196,8 +197,10 @@ docs/
   testing.md               ← test inventory and strategy
   performance.md           ← per-module timing, memory, sizeof for each platform
   backlog/                 ← forward-looking: what to build next (not present-tense)
-    README.md              ← index: what's here (to-build list + design studies + in-flight draft specs)
-    backlog.md             ← the prioritised to-build list
+    README.md              ← landing page: overview of every item + index (the rest of the system links here, not into items)
+    backlog-core.md        ← to-build list, core / infrastructure domain (+ UI)
+    backlog-light.md       ← to-build list, light domain (drivers, effects, preview, sensors)
+    backlog-mixed.md       ← to-build list, items spanning both domains
   history/                 ← backward-looking: accumulated wisdom
     README.md              ← index: what's here + cross-repo trends + digest prompt
     decisions.md           ← actions, lessons, proven patterns
@@ -220,7 +223,7 @@ Do **not** repeat facts the `.h` already states: the controls list (the .h has `
 
 The `history/` folder is the distilled experience of years of building LED/light systems, from WLED, WLED-MM, StarLight, MoonLight, through projectMM. It contains proven patterns, memory tricks, control mechanisms, and hard-won lessons, studied under the [*Industry standards, our own code*](#principles) principle. Per-project credits live in the `history/` digests and the per-module "Prior art" sections.
 
-The `backlog/` folder is its forward-looking counterpart: `backlog.md` is the prioritised to-build list, design studies sit alongside it, and a spec for a not-yet-built module can live here as a plain draft `.md` until it ships (its final spec then goes to `moonmodules/` and the draft is deleted). Both `history/` and `backlog/` are exempt from the present-tense rule and agents don't read them automatically; only when planning new work. Neither folder only accumulates: per [*Mandatory subtraction*](#process-rules), both shrink as well — shipped backlog items and absorbed history entries are deleted, since the git commits are the permanent record and these folders are just the working narrative above it.
+The `backlog/` folder is its forward-looking counterpart: the to-build list is split by domain (`backlog-core.md` / `backlog-light.md` / `backlog-mixed.md`) with `README.md` as the landing page the rest of the docs link to, design studies sit alongside it, and a spec for a not-yet-built module can live here as a plain draft `.md` until it ships (its final spec then goes to `moonmodules/` and the draft is deleted). Both `history/` and `backlog/` are exempt from the present-tense rule and agents don't read them automatically; only when planning new work. Neither folder only accumulates: per [*Mandatory subtraction*](#process-rules), both shrink as well — shipped backlog items and absorbed history entries are deleted, since the git commits are the permanent record and these folders are just the working narrative above it.
 
 ## Code Style
 
diff --git a/docs/architecture.md b/docs/architecture.md
index 1fa647d..87d63a0 100644
--- a/docs/architecture.md
+++ b/docs/architecture.md
@@ -342,7 +342,7 @@ Multiple layouts can live in one Layouts container. Each layout describes one li
 
 **Layers** (a MoonModule) is the top-level container for one or more layers. Each layer renders independently into its own buffer; the Drivers container composes those buffers downstream.
 
-**🚧 Multi-layer composition.** The container exists to compose more than one Layer's buffer into the shared output: alpha-blend and additive, in layer order. With a single layer wired (today's boot pipeline) Layers is a thin pass-through, but the design is the multi-layer case: each Layer renders into its own buffer, and the Drivers container's blend+map step composites them in order into the physical buffer (which is why that buffer is described as a *blend* buffer in [§ Memory strategy](#memory-strategy)). The single-layer path is the degenerate case of this, not a separate design.
+**Multi-layer composition.** The container composes more than one Layer's buffer into the shared output: each enabled Layer renders into its own buffer, and the Drivers container's blend+map step composites them in container order (bottom→top) into the physical buffer (which is why that buffer is a *blend* buffer in [§ Memory strategy](#memory-strategy)). Each Layer carries a `blendMode` (alpha-over or additive) and an `opacity` — inert parameters the Layer never acts on; Drivers reads them and the container child order, and blends bottom→top. The bottom layer clears + overwrites the output; each layer above blends onto the accumulated frame per its mode and opacity. With a single enabled Layer this is the degenerate case: a thin pass-through that hands the driver the Layer's buffer directly (no composite), byte-for-byte the single-layer pipeline. The blend math is integer-only per the hot-path rule (8-bit alpha-over `(src·α + dst·(255−α))/255`, additive sum-with-clamp); cost scales with the enabled-layer count.
 
 A **Layer** (a MoonModule, child of Layers) owns:
 
@@ -351,15 +351,15 @@ A **Layer** (a MoonModule, child of Layers) owns:
 - **Effects** (ordered list): write light values into the buffer.
 - **Modifiers** (ordered list): transform the LUT or light values.
 
-A layer can have **multiple effects**. Effects are not blended; they write to the buffer sequentially in their listed order, each overwriting or adding to the previous. That allows stacked patterns (a base-colour effect followed by a sparkle effect).
+A layer can have **multiple effects**. Each effect writes to the buffer sequentially in its listed order, overwriting or adding to the previous — so the effects stack (a base-colour effect followed by a sparkle effect).
 
-A layer applies its **first enabled modifier** during LUT build (`Layer::rebuildLUT`). Modifier *chaining* (applying several in sequence) is not implemented: only the first enabled modifier takes effect. Order matters for a chain (a multiply-then-checkerboard mask differs from checkerboard-then-multiply, just as mirror-then-rotate differs from rotate-then-mirror), which is why modifiers are reorderable in the UI even though only the first is applied today. Chaining is on the [backlog](backlog/backlog.md): static modifiers chain during LUT build, dynamic modifiers during rendering.
+A layer applies its **first enabled modifier** during LUT build (`Layer::rebuildLUT`). Modifiers are **reorderable** in the UI, and order is meaningful (a multiply-then-checkerboard mask differs from checkerboard-then-multiply, just as mirror-then-rotate differs from rotate-then-mirror). Applying several modifiers in sequence (chaining) is on the [backlog](backlog/README.md).
 
 Each layer references the shared Layouts. The layer builds its own LUT by iterating the Layouts container's coordinates and applying its static modifiers in order. Different layers in Layers can have different modifiers, producing different LUTs from the same Layouts.
 
 ## Effects
 
-Effects produce light colours. They write into the Layer's buffer, which represents a logical grid. The Layer determines the buffer's dimensions (width, height, depth) from the Layouts, its own start/end percentages within the physical layout, and its modifiers. Effects receive these logical dimensions and elapsed time (millis) as their rendering context. They compute light positions from the buffer index (e.g. `x = i % width`, `y = i / width`).
+Effects produce light colours. They write into the Layer's buffer, which represents a logical grid. The Layer determines the buffer's dimensions (width, height, depth) from the Layouts and its modifiers. Effects receive these logical dimensions and elapsed time (millis) as their rendering context. They compute light positions from the buffer index (e.g. `x = i % width`, `y = i / width`).
 
 Effects use elapsed time for animation, not frame count. Animation speed becomes frame-rate independent: an effect looks the same at 30 fps and 60 fps. This is also what makes the 🚧 cross-device clock sync work: a shared elapsed-time base means synced visuals across controllers (see [§ Multi-device sync](#multi-device-sync)).
 
@@ -462,7 +462,7 @@ Network input (ArtNet receive, WebSocket) is processed synchronously at a define
 The system checks available heap before each allocation and degrades gracefully when memory is insufficient. A minimum reserve (`HEAP_RESERVE = 32 KB`) is kept for stack, HTTP, WiFi, and overhead.
 
 - **Mapping LUT** is created only if all of: modifiers exist on the layer; layout is not a simple non-serpentine grid (where physical == logical); enough heap available after the reserve.
-- **Driver output buffer** (see [§ Drivers](#drivers) for what it's for) is created only when at least one layer has a mapping LUT actually allocated and enough heap is available.
+- **Driver output buffer** (see [§ Drivers](#drivers) for what it's for) is created only when the pipeline must write into physical space rather than hand a driver a layer's logical buffer directly — that is, when **two or more layers are enabled** (they must be composited into one buffer) **or** a layer has a **mapping LUT** actually allocated (logical≠physical) — and enough heap is available. A single enabled layer with no LUT needs no output buffer: drivers read its buffer directly (the zero-copy fast path).
 
 ### Degradation cascade
 
diff --git a/docs/backlog/README.md b/docs/backlog/README.md
index 52adcc8..825f90d 100644
--- a/docs/backlog/README.md
+++ b/docs/backlog/README.md
@@ -2,23 +2,53 @@
 
 The forward-looking half of the docs (the backward-looking half is [`../history/`](../history/)). This folder is **not** present-tense and agents don't read it automatically — only when planning new work. See [CLAUDE.md § Documentation](../../CLAUDE.md) for how `backlog/` and `history/` relate.
 
-## What's here
+This README is the **landing page**: the rest of the docs link here, not into individual items, so the present-tense docs stay present-tense.
 
-### The prioritised to-build list
+## The to-build list
 
-- [backlog.md](backlog.md) — what to build next, grouped by theme (distribution, effects, drivers, modifiers, …). Completed items are removed; the file is deleted when empty.
-- [ui-deferred.md](ui-deferred.md) — UI items not yet in the live [ui.md](../moonmodules/core/ui.md): deferred-to-1.x features, open design questions, and the gap analysis against v1. The backward-looking v1 UI reverse-engineering lives in [history/v1-inventory.md](../history/v1-inventory.md).
-- [leddriver-deferred.md](leddriver-deferred.md) — the LED-driver increments (RMT single-strand, multi-pin RMT, LCD_CAM on S3) all shipped; this is what's left and tracked nowhere else: the sigrok flicker test, the core-1 driver task, fuller show error handling, the per-driver buffer window, 16-bit/dither, and moving-head preview.
+Split along the codebase's own boundary (`src/core/` vs `src/light/`), with a third file for items that genuinely span both:
 
-### In-flight draft specs
+- **[backlog-core.md](backlog-core.md)** — core / infrastructure: distribution + platforms, ESP32 performance & memory, network & persistence, HTTP/OTA, architecture, testing, housekeeping, and UI.
+- **[backlog-light.md](backlog-light.md)** — the light domain: LED drivers (architecture + deferred increments), LCD/DMA driver work, effects & preview, and sensors / audio-reactive input.
+- **[backlog-mixed.md](backlog-mixed.md)** — cross-domain items where a core mechanism interacts with a light driver/effect/modifier.
 
-A spec for a not-yet-built module can live here as a plain draft `.md` (alongside the design studies below) until the module ships — at which point its final spec is written in [`../moonmodules/`](../moonmodules/) and the draft is deleted. There's no dedicated subfolder or promote step: a draft is just a forward-looking markdown file like the rest of `backlog/`. None are in flight right now (every drafted module has shipped; the former UI draft moved to [ui-deferred.md](ui-deferred.md) and [history/v1-inventory.md](../history/v1-inventory.md)).
+Completed items are removed; a file is deleted when empty (per [*Mandatory subtraction*](../../CLAUDE.md#process-rules)). Tags in item titles: *(investigation)* = needs measurement before a fix · *(backlog)* = scoped but not started · *(deferred)* = waiting on a prerequisite · *(future / long term)* = directional.
 
-### Design studies
+## At a glance
+
+A map of everything in the three files, by theme.
+
+### Core ([backlog-core.md](backlog-core.md))
+
+- **Distribution** — remaining platforms (Linux, Teensy, RPi), code-signing (macOS/Windows), live RMII Ethernet reconfigure, installer UX polish, P4 DHCP-hostname recheck; DevicesModule discovery growth (HTTP probe off the render task, more mDNS types + UDP, deterministic scan scenario).
+- **ESP32 performance & memory** — E1.31 multicast (IGMP), WiFi ArtNet perf matrix, async ArtNet send (PSRAM-only), network round-trip drop/reorder test, slow eth bring-up, non-PSRAM memory ceiling + boot-time buffer degradation, task core-pinning; ops: static IP on STA, mDNS toggle, MoonDeck doc-asset hardening, CI SHA-pinning.
+- **Architecture** — disable-releases-resources, cross-module pin-uniqueness check, Improv-child-of-NetworkModule, `std::span` platform API, Improv-as-REST follow-ups, **live scripting** (on-device authored effects/layouts/modifiers/drivers/sensor logic — design phase, see the bottom-up survey); composition/config: runtime board presets, per-layout coordinate offset.
+- **HTTP & OTA** — direct binary-upload OTA, HTTP file serving off the render tick.
+- **Testing** — additional coverage (UI load time, teardown memory, JS harness), live full-suite state leak.
+- **Housekeeping** — WS-send socket-pair fixture, ESP-IDF version pinning, three-level device model, persistence-overlay audit, **ESP32-P4 rounds 3-4 (in progress)**, WiFi runtime disable.
+- **UI** — deferred-to-1.x items, open design questions (multi-layer UI, modifier-chain viz, presets, node-graph), and the v1 gap analysis.
+
+### Light ([backlog-light.md](backlog-light.md))
+
+- **Drivers** — extract shared lane-driver scaffolding (on the 3rd backend), 1..8-pin LCD output, classic ESP32 I2S 16-lane driver.
+- **LED drivers — deferred** — sigrok flicker cross-check, core-1 driver task, fuller RMT error handling, per-driver buffer window, 16-bit/dither, moving-head preview interpreter.
+- **LCD / DMA driver work** — drop the i80 WR/DC sacrificial pins, LCD/Parlio DMA buffer → PSRAM.
+- **Effects & preview** — real z-axis in 2D effects, full-density interpolated preview, self-describing frame header, RGBW preview, fixture model (moving heads/beams), extract the resumable transport.
+- **Sensors & audio-reactive input** — audio follow-ups (per-band noise floor, adaptive gate), GyroDriver → core Peripheral move, Raspberry Pi 5 sensor input (mic/IMU/line-in).
+
+### Mixed ([backlog-mixed.md](backlog-mixed.md))
+
+- MultiplyModifier mapping-LUT memory at large grids; composed modifiers (chain the whole stack, not just the first); intermittent ~0.5 s RMT LED pauses; NoiseEffect simplex cost on ESP32.
+
+## In-flight draft specs
+
+A spec for a not-yet-built module can live here as a plain draft `.md` (alongside the design studies below) until the module ships — at which point its final spec is written in [`../moonmodules/`](../moonmodules/) and the draft is deleted. None are in flight right now.
+
+## Design studies
 
 One-off research documents that informed a future direction, kept for the reasoning rather than as living specs.
 
 - [leddriver-analysis-top-down.md](leddriver-analysis-top-down.md) — reasons from the end goal (driving WS2812-class LEDs from a GPIO pin) toward a generic driver architecture, per-platform implementation, and a testing strategy.
 - [leddriver-analysis-bottom-up.md](leddriver-analysis-bottom-up.md) — the companion landscape survey: catalogues the existing LED-driver libraries across ESP32, Teensy, Raspberry Pi, and PC, and recommends a path.
-
-(The 3-layer installer plan these analyses' sibling produced shipped fully and its deferred items already had homes in [backlog.md](backlog.md), so its file was deleted per [*Mandatory subtraction*](../../CLAUDE.md#process-rules). The installer lives in `docs/install/` + `scripts/build/`; the durable reasoning is in `architecture.md` / `history/decisions.md`.)
+- [livescripts-analysis-bottom-up.md](livescripts-analysis-bottom-up.md) — live scripting (run user-authored effects/layouts/modifiers/drivers/sensor logic on-device without a reflash), Stage-1 survey. Deep-reads the ESPLiveScript fork (hpwit's native-Xtensa JIT), surveys the field (ARTI-FX interpreter by ewowi, embedded VMs, WASM/WAMR), and records the product-owner direction.
+- [livescripts-analysis-top-down.md](livescripts-analysis-top-down.md) — the Stage-2 redesign: a native-codegen engine, Xtensa-first behind an IR seam (WASM/WAMR the per-target fallback), a C-subset language that ports an effect near-verbatim, the MoonModule binding, and a staged spike plan along the MoonLight effects-tutorial ladder.
diff --git a/docs/backlog/backlog.md b/docs/backlog/backlog-core.md
similarity index 66%
rename from docs/backlog/backlog.md
rename to docs/backlog/backlog-core.md
index fe0e60a..4473c32 100644
--- a/docs/backlog/backlog.md
+++ b/docs/backlog/backlog-core.md
@@ -1,8 +1,6 @@
-# What to build next
+# Backlog — core
 
-Completed items are removed. This file is deleted when empty.
-
----
+Forward-looking to-build items for the **core / infrastructure** domain (`src/core/`, `src/platform/`, build, CI, network, persistence, UI). The light-domain counterpart is [backlog-light.md](backlog-light.md); items that genuinely span both are in [backlog-mixed.md](backlog-mixed.md). Index + overview: [README.md](README.md). Completed items are removed.
 
 ## Distribution
 
@@ -28,26 +26,8 @@ DevicesModule discovers via two strategies that merge into one list: an **mDNS b
 - **More mDNS service types + UDP** — the mDNS browse cycle (`kMdnsServices`) extends one entry at a time as classification lands for each (Home Assistant `_home-assistant._tcp`, ESPHome `_esphome._tcp`, RTP-MIDI `_apple-midi._udp`). Separately, the **four-mechanism split** (decided): discovery and messaging are separate axes, none replaces another — **mDNS** = discovery (standard, whole ecosystem), **HTTP sweep** = discovery fallback (what mDNS misses, e.g. a PC instance on :8080), **REST `/api/control`** = *reliable* messaging (config push, fleet OTA — TCP guarantees delivery, already built), **UDP** = *lossy real-time streaming* only (SuperSync clock / live timing, where drop-and-continue is fine and low latency matters). The MoonLight "messages sometimes didn't arrive" pain came from using UDP for must-arrive messages — route must-arrive over REST, reserve UDP for streams. A UDP *presence beacon* could also seed projectMM↔projectMM discovery, but mDNS is preferred there as the recognizable standard. UDP receive is a cheap non-blocking poll; UDP *send* of large frames is throughput-bound (see Async ArtNet) and belongs off the render task.
 - **Deterministic full-pipeline scan scenario (canned `httpGet`)** — `scenario_DevicesModule_scan.json` is live-only (needs a real LAN, runs on hardware). A desktop-runnable parallel that exercises scan → classify → upsert → age-out → list-serialization with *canned* `httpGet` responses would pin the whole discovery pipeline without flakiness. Needs a new platform seam: a settable response table the desktop `httpGet` consults (mirroring the existing `setTestNowMs` clock override). Today the age-out + restore + serialize paths are covered by `unit_DevicesModule_ageout.cpp` and classify by `unit_DeviceIdentify.cpp`, so this is breadth, not a gap — deferred so the httpGet-mock seam gets its own focused change rather than riding in on a review batch.
 
----
-
 ## ESP32 performance and memory
 
-### MultiplyModifier mapping-LUT memory at large grids (investigation, re-verify on classic)
-
-`scenario_perf_full` on the S3 (2026-06-17) measured the MultiplyModifier's cost across grid sizes. The finding, stated correctly: the modifier **reduces compute** (with the default 2×2 kaleidoscope the effect renders only the ¼-size logical quadrant — Noise+Multiply at 16K is 29,647µs vs 50,555µs for Noise alone), and its real cost is **memory** — the 1:N fan-out mapping LUT. Measured modifier heap cost on the S3: 16²→1.7KB, 32²→10.8KB, 64²→23.5KB, **128²(16K)→93KB** (the LUT destinations array; `nrOfLightsType` is `uint32_t` on a PSRAM board). On the S3's 8MB PSRAM this is trivial.
-
-**This is NOT a no-PSRAM blocker** — 16K Noise + Multiply has run on a classic ESP32 (no PSRAM, 320KB internal) before at **10–20 FPS** (WiFi vs Ethernet), sending frames out over **ArtNet to a display, not physical LED drivers**. It works there because classic's `nrOfLightsType` is `uint16_t` (half the LUT size) and the modifier shrinks the logical render grid. So the action is **re-verify the working classic setup when a classic board is connected** (find the config — grid, mirror, ArtNet target — that reproduces the historical 10–20 FPS), not "fix an impossibility." Worth investigating only if that re-verification shows the LUT memory has regressed since: the destinations array is the obvious lever (it stores a `nrOfLightsType` per physical destination; a 2× kaleidoscope is 1:1 in *count* so the LUT need not store fan-out > the physical count — confirm it isn't over-allocating to `maxMultiplier()` when the effective fan-out is 1). Capture the classic numbers into performance.md's multi-board table first.
-
-### Intermittent ~0.5 s LED pauses with the RMT driver (pending investigation)
-
-Observed on the bench (2026-06): LED output running on the RMT driver occasionally freezes for about half a second. Postponed by the product owner until more observations exist. Ranked suspects from the initial analysis, each with a cheap experiment:
-
-1. **WiFi modem power-save never disabled** — nothing in `src/` calls `esp_wifi_set_ps(WIFI_PS_NONE)`, so the IDF default `WIFI_PS_MIN_MODEM` is active; the radio's DTIM sleep causes exactly this class of intermittent multi-hundred-ms stall. WLED and the v1/v2 lineage disable sleep. Experiment: one line in the ESP32 platform code after association.
-2. **NetworkSendDriver sending synchronously every tick to an absent destination** (default `192.168.1.70`) — lwIP keeps re-ARPing a dead address while the send sits in the render tick. Data point (2026-06-10): the bench esp32-16mb had NetworkSend *disabled* in its persisted config, consistent with the pauses being annoying enough to switch the sender off. Experiment: point the ArtNet IP at a live host (or disable the driver) and see if the pauses stop.
-3. **`rmt_tx_wait_all_done` 1 s timeout** — a wedged transmission blocks the tick up to a full second (multi-pin: up to N×1 s). Least likely (~1 s, not ~0.5 s) but it's the only hard block in the driver itself.
-
-If pauses correlate with UI control changes, also consider the 2 s-debounced SPIFFS save stalling flash-resident code. The per-tick KPI log around a pause discriminates between these immediately.
-
 ### E1.31 multicast receive (IGMP join)
 
 NetworkReceiveEffect accepts E1.31 via unicast only — the same scope MoonLight ships. Multicast senders address the per-universe group `239.255.{universe_hi}.{universe_lo}`, which a receiver must join via IGMP; the platform `UdpSocket` has no `IP_ADD_MEMBERSHIP` support yet (lwIP `setsockopt` on ESP32, plain `setsockopt` on desktop, plus a join-per-accepted-universe bookkeeping question). Add when a multicast-only sender actually shows up on a bench; until then the spec documents "point sACN senders at the device's IP".
@@ -108,21 +88,6 @@ What we still don't know (all **physical** tests — no code change is warranted
 
 Bottom line: intermittent, build-independent, reset-correlated → a hardware/PHY issue, not a firmware bug. The earlier "slow DHCP at boot" is likely the same root cause (the PHY cycling many times before one window holds long enough to complete DHCP). Pick this up with the physical tests above before touching any code.
 
-### NoiseEffect simplex cost on ESP32 (investigation)
-
-With mirror XY at 128×128, NoiseEffect renders the 64×64 logical quadrant in **~11 ms/tick** on the Olimex (measured) — the simplex math dominates, since the Xtensa LX6 has no FPU and float math is software-emulated. (RainbowEffect on the same pipeline is much cheaper.) This is correct, non-degraded behaviour; it's only worth revisiting if a deployment needs Noise faster than ~11 ms at this grid.
-
-Worth investigating if so:
-
-- **Q16 fixed-point simplex** instead of float (kills the software-float emulation cost).
-- **Lower-precision hash** — current simplex uses a 256-entry permutation lookup; a smaller / SIMD-friendly hash may be faster on Xtensa.
-- **Strided sampling + interpolation** — render at 32×32, bilinear up to 64×64. Visual quality cost; needs A/B comparison.
-- **Inline / unroll the inner per-pixel loop** to keep the simplex state in registers.
-
-None of these are obviously free, and a fixed-point port may shift the visual signature. Defer until there's a real use case — on the no-PSRAM Olimex at large grids the tick is dominated by the synchronous ArtNet send (~35 ms), not Noise, so the effect is rarely the bottleneck there.
-
-**S3 render-only data point (2026-06-17, `scenario_perf_full`):** on the PSRAM S3 with **no output driver**, Noise is the dominant cost at every grid and there's no ArtNet floor to hide it: 16²→738µs, 32²→2,831µs, 64²→11,235µs, **128²(16K)→50,555µs (~20 FPS)** — clean ~linear-in-pixels (67×), so no fragmentation/realloc pathology, just raw simplex compute. The light effect (Checkerboard) on the same sweep is 6–11× faster (16K→7,949µs, ~128 FPS). So on a PSRAM board the heavy effect IS the 16K bottleneck (where on the Olimex the network send was). This is the strongest case for the fixed-point/strided-sampling ideas above, since a PSRAM board can run 16K grids that the network-bound Olimex never reaches. The S3 has a real FPU (LX7), so the win is less about software-float emulation and more about per-pixel simplex work; profile before committing.
-
 ### MoonDeck doc-asset endpoint hardening (backlog)
 
 `scripts/moondeck.py::_serve_doc_asset` accepts any ROOT-relative path and serves the file. Path traversal *is* blocked (`asset_path.relative_to(ROOT.resolve())`), but inside the repo any file is served — including local-only artefacts like `scripts/build/wifi_credentials.json` if present. MoonDeck binds to all interfaces by design (the existing comment in `main()` explicitly enables LAN reach), so anyone on the LAN can hit the endpoint.
@@ -181,8 +146,6 @@ Related: this is the render/output-buffer face of the same non-PSRAM fragmentati
 
 No FreeRTOS tasks are pinned today. At 16K LEDs the render task takes ~52 ms/tick; if OTA download or Improv scan causes tick-variance spikes, pin render → core 1, OTA/Improv → core 0 (where WiFi already lives via `CONFIG_ESP_WIFI_TASK_PINNED_TO_CORE_0=y`). Defer until contention is observed — neither OTA nor Improv runs during normal operation.
 
----
-
 ## Architecture
 
 ### Disabling a module should release its resources, not just stop its loop (backlog)
@@ -207,18 +170,6 @@ Today `setEnabled(false)` only makes the Scheduler skip the module's `loop`/`loo
 
 **Related:** [§ Disabling a module should release its resources](#disabling-a-module-should-release-its-resources-not-just-stop-its-loop-backlog) — a disabled module freeing its pins is what lets the same GPIO be reassigned live without a conflict-reject.
 
-### Extract shared lane-driver scaffolding when the 3rd parallel backend lands (deferred)
-
-The LcdLedDriver (S3 LCD_CAM i80) and ParlioLedDriver (P4 Parlio) share ~245 of 362 lines, and their platform-side loopback capture+verify is ~100 lines byte-for-byte identical (`platform_esp32_parlio.cpp` even notes "The RX capture half is byte-for-byte identical" to the LCD one). The status-string lifecycle (`failBuf_` / `configErr_` / `clearFailBuf` / `clearConfigErr`) is triplicated across all three LED drivers (RMT/LCD/Parlio), ~60 lines. The branch deliberately extracted the *encoders* (`LcdSlots.h` shared by i80+Parlio, `RmtSymbol.h`, `PinList.h`) on the "extract when the second user lands" rule, but stopped at the lifecycle/loopback scaffolding. **Accepted for this merge** (the reviewer agreed driver-level extraction can wait): the duplication is in mechanical lifecycle/test scaffolding, not domain logic, and a DriverBase-level refactor touching three drivers is riskier than the duplication it removes. **Do it when the third parallel backend arrives** (16-lane widening, or Teensy FlexIO), at which point the pattern is proven three ways: (a) a `detail::` platform helper for capture+verify (the only per-peripheral difference is the transmit call, pass a callback, beside the already-shared `loopbackJumperOk`), and (b) a small owned-status helper or DriverBase members for the fail/config strings. Until then the cost is line count, not correctness.
-
-### 1..8-pin LCD output (future) — would let S3 default to LCD
-
-`LcdLedDriver` requires **all 8** i80 data lanes (`kExactLaneCount = true`, `LcdLedDriver.h`): the ESP-IDF `esp_lcd` i80 bus configures every data line of the bus width and rejects a partial set, so even a few WS2812 strands claim 8 GPIOs. That's why **S3 boards default to `RmtLedDriver`** in `deviceModels.json` (RMT runs one channel per pin, 1..N) rather than LCD — a board with fewer than 8 strips can't sensibly use the LCD driver, and the 8-lane LCD bench wiring (`1,2,4,5,6,7,8,9`) collides with common peripheral pins (e.g. the mic on 4/5/6). A **1..8-pin LCD mode** (drive only the lanes named in `pins`, leave the rest unclaimed — matching Parlio's flexibility) would let the parallel S3 path run any lane count, at which point an S3 board entry could choose LCD vs RMT by intent. Parlio already does this (`kExactLaneCount = false`, 1..8 lanes), so the P4 default *is* the parallel driver. Until LCD gains the same flexibility, S3 stays on RMT by default. Low priority — RMT covers the few-strip S3 case today.
-
-### Classic ESP32 I2S 16-lane parallel LED driver (future) — beyond RMT's 8 channels
-
-The **classic ESP32 has 8 RMT TX channels** (`platform_config.h`: "8 on classic ESP32, 4 on the S3 and P4"), so RMT covers up to 8 parallel outputs on classic ESP32 — e.g. the 8-output QuinLED Dig-Octa runs fine on `RmtLedDriver`. For **more than 8 lanes on classic ESP32**, the established trick drives the **I2S peripheral in LCD/parallel mode** (the hpwit [I2SClocklessLedDriver](https://github.com/hpwit/I2SClocklessLedDriver) / FastLED I2S lineage), clocking out up to **16 lanes** from one autonomous DMA transfer. This is the classic ESP32's high-lane-count path, distinct from the S3 (LCD_CAM → `LcdLedDriver`, plus the [1..8-pin LCD item](#18-pin-lcd-output-future--would-let-s3-default-to-lcd) above) and the P4 (Parlio). No catalog board needs it today (none exceeds 8 outputs), so no board's `planned` list points at it yet; it's the marker for a future ≥9-output classic-ESP32 board. Studied under *Industry standards, our own code* — carry the idea, write our own against the project architecture (host-testable encoder in `src/light/`, peripheral seam in `src/platform/esp32/`). **When it lands**, follow the per-chip driver-gating pattern now in `main.cpp` (each LED driver's `#include` + `registerType` is wrapped in `#if defined(CONFIG_SOC_<PERIPHERAL>_SUPPORTED)`, keyed off the SOC capability macro that backs its `platform_config.h` lane-count flag): the I2S driver gates on the relevant I2S/LCD SOC macro so it compiles + registers on classic ESP32 only, and adds an `i2sLanes` capability flag beside `rmtTxChannels`/`lcdLanes`/`parlioLanes`. Prior art: hpwit's I2SClockless lineage and FastLED's I2S driver; the same parallel-DMA lineage is already credited in [LcdLedDriver.md § Prior art](../moonmodules/light/drivers/LcdLedDriver.md#prior-art).
-
 ### Runtime board presets (multi-commit, partially landed)
 
 The firmware-vs-board separation is now in place across the codebase (see [architecture.md § Firmware vs deviceModel vs board](../architecture.md#firmware-vs-devicemodel-vs-board)). `build_esp32.py --firmware <variant>` picks the compiled binary; MoonDeck deduces the physical board where the firmware uniquely identifies hardware (`esp32-eth*` ⇒ `olimex-esp32-gateway-rev-g`) and lets the user pick from a short hardcoded list otherwise. Firmware variants stay separate — `esp32-eth` saves ~670 KB flash + ~30 KB DRAM vs the default `esp32` (WiFi+Ethernet, measured); merging would erase that win.
@@ -242,7 +193,7 @@ Board preset catalog + upload (later, when the runtime config has real consumers
 - **LED output pins** — per-strip data GPIOs (1–16 outputs/board); the first real consumer (a Driver pin control) unblocks multi-output boards (QuinLED Dig-Quad/Octa, SE16, LightCrafter).
 - **Ethernet PHY config** — LAN8720/RMII (MDC/MDIO/CLK/power-pin/PHY-addr/clock-mode) vs W5500/SPI (MISO/MOSI/SCK/CS/IRQ); the consumer is the runtime `Network.eth_*` controls listed above, replacing the hardcoded Olimex pins.
 - **Power budget** — `maxPower` (Watts) per board, for a future current-limit / brightness-cap control.
-- **Audio / I2S** — SD/WS/SCK/MCLK pins, the input side of audio-reactive effects ([Pi-5 sensor note](#sensor-input-on-raspberry-pi-5--microphone-imu-line-in-post-10-multi-commit) is the desktop counterpart).
+- **Audio / I2S** — SD/WS/SCK/MCLK pins, the input side of audio-reactive effects ([Pi-5 sensor note](backlog-light.md#sensor-input-on-raspberry-pi-5--microphone-imu-line-in-post-10-multi-commit) is the desktop counterpart).
 - **Buttons & inputs** — push/toggle/lights-on, PIR, digital-input; needs an input-event concept the firmware doesn't have yet.
 - **Relays & power control** — relay / lights-on / high-low pins.
 - **Infrared** — IR receive pin (remote control).
@@ -254,16 +205,6 @@ Sequencing rule (unchanged): each functionality lands a device-side control firs
 
 **Module variant + PSRAM within the classic-ESP32 family.** `getChipDescription()` and MoonLight's `ModuleIO.h` both report only the *core* family ("ESP32"), not the *module* (WROOM / WROVER / PICO) — so neither distinguishes whether a classic-ESP32 board has PSRAM. This matters for projectMM (whose large-LED story leans on PSRAM) in a way it doesn't for MoonLight: e.g. the **QuinLED Dig-Next-2 is built on an ESP32-PICO with 2 MB PSRAM**, but projectMM's `esp32` build has no `CONFIG_SPIRAM` (see the `#ifdef CONFIG_SPIRAM` gate in `platform_esp32.cpp::psramAlloc`), so it flashes and runs as a no-PSRAM device and hits the non-PSRAM fragmentation ceiling at large grids that the 2 MB would otherwise relieve. A PSRAM-enabled classic-ESP32 firmware variant (e.g. `esp32-psram`) would unlock it; `deviceModels.json` could then carry a `psram` hint per board to steer the picker — but only once that variant exists (no consumer today). `deviceModels.json` currently maps every classic board to the WiFi-only `esp32` variant, which is correct-but-unoptimised for PSRAM-bearing PICO boards.
 
-### Multi-layer composition (backlog)
-
-`Layers` holds N layers; `Drivers` reads from a single active layer today. Composition is the missing piece — additional layers render their buffers but only the first enabled layer reaches output.
-
-When picked up:
-- `Drivers::loop()` blends each enabled Layer's buffer into the shared output using per-Layer blend mode + opacity (controls to add on Layer).
-- `Layer::startX/Y/Z` / `endX/Y/Z` (already persisted, currently no-op) become active in `rebuildLUT` — each Layer carves a percentage region of the physical extent.
-- Memory-aware allocator at `onBuildState` time decides how many Layers fit and degrades gracefully.
-- Persistence already encodes Layers children positionally — adding siblings just works on the file-format side.
-
 ### Per-layout coordinate offset for independent placement (backlog)
 
 `Layouts` stitches multiple child layouts into one physical light space, but only their *indices* are stitched (offset sequentially in `forEachCoord`) — their *coordinates* are not translated. Two layouts therefore overlap in the same coordinate box: two 64×64 grids both occupy x,y ∈ 0..63, so the Layer's dense bounding-box buffer is 64×64 (4096 voxels) even though the container reports 8192 lights, and the second layout's lights land on the first's positions. `scenario_Layouts_mutation` documents this (its steps assert pipeline liveness, not buffer-size arithmetic).
@@ -291,67 +232,11 @@ Device-model injection over Improv shipped as **"Improv = REST over serial"** (t
 
 **Open follow-up: shared JS helpers across device-UI and web-installer.** `safeLocalGet` / `safeLocalSet` (3-line hostile-storage guards) are duplicated in `src/ui/install-picker.js` (device firmware, embedded as a C string via `embed_ui.cmake`) and `docs/install/devices.js` (web installer page, served from Pages). The two live in different build contexts so the shared extract isn't trivial — it'd need a new `src/ui/safe-storage.js` plus updates to: `embed_ui.cmake` (embed the new file), `ui_embedded.h` generator (new C array), HTTP server file routing (new path served), `release.yml` workflow staging, `preview_installer.py` staging. Five files for one 3-line helper is too much pre-merge. Worth doing when the next shared helper arrives — `relativeTime` and `formatBytes` are candidates. Two helpers earn the build-glue cost; one doesn't.
 
----
-
-## Sensors and audio-reactive input
-
-### Audio-reactive follow-ups
-
-The manual level + 16-band FFT spectrum has shipped ([AudioModule](../moonmodules/core/AudioModule.md); what landed and why is in [decisions.md](../history/decisions.md)). These are the deferred follow-ups, each its own increment:
-
-- **Per-band noise-floor (kill a steady single-frequency hum)** — the bench mic picks up a constant ~258 Hz tone (a mains harmonic via the mic/supply) that lights one band even in silence. A high-pass can't remove it (it's well above the ~40 Hz DC-blocker cutoff) without also killing real bass; the clean fix is a per-band adaptive floor that learns each band's idle baseline and subtracts it, so a constant tone in one band gates to dark while the others stay sensitive. Minimal version ≈ 16 floats of state + ~16 ops/frame. This is the next concrete audio step.
-- **Adaptive conditioning** — auto noise-floor / auto-gain / smoothing so the display self-calibrates to a room ("sound off → dark, sound on → vivid") instead of being tuned by hand. A self-calibrating version was prototyped and removed; the manual `floor`/`gain` is the shipped baseline. Reinvent from scratch when wanted, and **tune it in a quiet room** — a noisy environment (a strong, varying low-frequency ambient) is the adversarial case that made the prototype hard to settle. (The per-band floor above is the first piece of this.)
-- **Adaptive noise gate** — replace the borrowed `squelch`/`floor`-as-gate with a real noise gate: asymmetric bang-bang timing (open fast, close slow), a relative "detect silence" test (thresholds as factors of a learned floor, not absolute sample counts), keying off the RMS envelope we already compute, GEQ/FFT bands left untouched. A softhack007 concept; analysed and judged in full (good idea, industry-standard, but tight on the <30ms budget; decompose into steps rather than overhaul) in [AudioModule.md § Adaptive noise gate](../moonmodules/core/AudioModule.md#adaptive-noise-gate-forward-looking). The recommended sequencing: the per-band floor above is step 1 (its complementary frequency-domain half), the relative-threshold-over-RMS is the cheap high-value cherry-pick as step 2, hysteresis/timing step 3, log-domain + soft-gate optional. Eventually retires the manual squelch.
-- **Pin auto-scan** — detect the mic's `sdPin` with `wsPin`/`sckPin` fixed (a noise-prompt + confirm convenience); ships today with explicit pin controls.
-- **Beat / onset detection** beyond the raw peak; more audio effects (2D / palette-driven frequency-reactive).
-
-### GyroDriver → core Peripheral move + AudioModule-consistency pass (branched, not merged)
-
-A working **GyroDriver** (MPU6050 IMU over I²C) exists on an unmerged branch (commit `11f8eb7`, "Add GyroDriver (MPU6050) + generic platform I2C layer"); it is not in this branch's tree. This entry reverse-engineers that commit so the move is tracked now. **Verify against the real implementation when the branch merges, then delete this entry.**
-
-What the commit contains (reverse-engineered):
-
-- `src/light/drivers/GyroDriver.h` — reads an MPU6050 over I²C and surfaces five read-only telemetry controls (`gyroX`/`gyroY`/`gyroZ` rates in °/s, `pitch`/`roll` tilt angles). Polls the sensor in `loop20ms()` (50 Hz), formats the display strings in `loop1s()`. WHO_AM_I probe + wake on `setup()`, big-endian 14-byte burst parse, `atan2`-based tilt (no fusion filter).
-- A **generic, domain-neutral platform I²C master** (`platform::i2cInit`/`i2cWriteReg`/`i2cReadRegs`, 7-bit addressing) so future sensors reuse it; ESP32 impl on the IDF v6 `i2c_master` driver in a new `platform_esp32_i2c.cpp`, plus an MPU6050-shaped desktop simulation so the UI and host tests see live values without hardware.
-- `unit_GyroDriver.cpp` — WHO_AM_I probe, simulated burst parse, control formatting, time-ramp tracking.
-
-The move: it currently masquerades as an input-only **driver** under the Drivers container (a no-op `setSourceBuffer(Buffer*) override {}` is the tell). It belongs as a **SystemModule Peripheral** child, exactly like [AudioModule](../moonmodules/core/AudioModule.md) — both are sensor peripherals that poll hardware and publish read-only telemetry. On the move, make it consistent with AudioModule (the established sibling pattern):
-
-- **Relocate** `src/light/drivers/GyroDriver.h` → `src/core/` and its spec `docs/moonmodules/light/drivers/GyroDriver.md` → `docs/moonmodules/core/`; change `role()` to `Peripheral`; delete the `setSourceBuffer` no-op; rewrite the doc's "input-only driver under the Drivers container" framing.
-- **Pin controls + rebuild path.** GyroDriver hardcodes SDA/SCL (`static constexpr` 21/22, with its own "Hardcoded until BoardModule exposes I2C pin mapping" comment). AudioModule already shows the pattern: editable `uint16` pin controls + `controlChangeTriggersBuildState` + a `reinit()` on `onBuildState`. Adopting it retires the hardcoded-pins TODO and satisfies the robustness rule (reconfigure in any order).
-- **Lifecycle.** GyroDriver has `setup()` only — no `teardown()`. Add teardown for symmetry with AudioModule's setup/teardown/reinit (the shared I²C bus has little per-instance state to free, so this is consistency, not a leak fix).
-- **Document the cadence difference.** GyroDriver polls in `loop20ms()` (50 Hz is plenty for tilt); AudioModule reads in `loop()` every tick because I²S DMA must be drained promptly or it overflows. Both are correct; add a one-line "why this cadence" comment at each so the two siblings aren't "harmonised" into a bug.
-- **Wire it** in `main.cpp` as a Peripheral child of System under `markWiredByCode`, the same shape as AudioModule.
-
-Already done on this branch (the reverse direction): AudioModule's two live read-outs were switched from `addText`+`setReadOnly` to `addReadOnly` (the display-only type, matching SystemModule and the way GyroDriver already does it correctly) — so the telemetry idiom is consistent before the gyro branch even lands.
-
-### Sensor input on Raspberry Pi 5 — microphone, IMU, line-in (post-1.0, multi-commit)
-
-Audio-reactive lighting (and motion-reactive) is core to what WLED-MM / MoonLight are known for. The Pi 5 is the right host for it: it has the CPU and RAM for real FFT-based audio analysis that the Xtensa ESP32 struggles with, and a full Linux audio + I²C stack. None of this exists today — the codebase has no sensor, audio, or IMU concept, and the Pi currently runs the **desktop** platform backend (there is no `src/platform/rpi/`), which has no hardware access. So this is a domain expansion built on a real platform-backend prerequisite, not a small add.
-
-**Target sensors and their Pi 5 interfaces:**
+### Live scripting — author effects/layouts/modifiers/drivers/sensor logic on-device (multi-commit, design phase)
 
-- **Microphone** — I²S MEMS mic, or a USB audio device read via ALSA. The high-value one: FFT → frequency bands + beat detection drive audio-reactive effects.
-- **Line-in** — the Pi 5 has no native analog input, so this is a USB audio interface / DAC HAT feeding the same audio pipeline as the mic; only the source differs.
-- **IMU / gyro** — an I²C device (MPU-6050 / 9250-class) on the Pi's I²C bus; tilt / motion → effect parameters.
+Run user-authored scripts on a running device: a scripted effect, layout, modifier, driver, or core sensor rule is pushed as text and goes live on the next tick with no reflash/reboot. This is the leap WLED took with ARTI-FX and the heart of the PixelBlaze product. A scripted module **is** a MoonModule (controls, `loop()`, role, generic UI). The engine lives in core and is domain-neutral (it can also "transform sensor data"), while serving the light domain in particular. Targets in order: ESP32 classic + S3 first, then P4/other ESP32, then Teensy, then desktop. Must be blazingly fast (runs in the render hot path at 16K+ lights × 50 FPS), memory-smart (IRAM/PSRAM via `platform::alloc`, compile-once), and synced (Scheduler tick, tick-atomic hot-swap, live reconfig).
 
-**How it fits the architecture (the load-bearing part):**
-
-1. **The module category exists — `ModuleRole::Peripheral`.** Peripherals are user-add/deletable children of SystemModule (a gyro `Peripheral` already lands there via the GyroDriver→core move). What's missing for audio-reactive is the *consumption* side: a sensor reads hardware and *produces* values (audio bands, IMU axes) that effects consume — the producer side of the [producer/consumer data-exchange model](../architecture.md#data-exchange-between-modules) (a sensor produces an `AudioFrame` / `ImuState` the way effects produce a buffer that drivers consume). Define the producer struct domain-neutrally so it isn't audio-specific. Today's peripherals are display-only; wiring them into effects is the new work.
-2. **All hardware access stays behind the platform boundary.** New `platform::` APIs (e.g. `readAudio()` returning PCM/FFT, `readImu()` returning axes) with the ALSA / I²S / I²C implementation in a real `src/platform/rpi/` backend — which is itself the prerequisite that doesn't exist yet (the Pi uses the desktop backend today). No ALSA/I²C include or call outside `src/platform/`.
-3. **Effects consume sensor data the same way they read the layer.** An audio-reactive effect reads the current `AudioFrame` (bands/level/beat) the way `PreviewDriver` reads what `Layer` produces — through a plain data structure wired in `main.cpp`, not a direct hardware call.
-
-**Increments (each a normal domain addition, picked up one at a time):**
-
-1. A real `src/platform/rpi/` hardware backend (GPIO/I²C/I²S/ALSA) — the prerequisite; until it lands, the Pi runs the desktop backend with no sensors.
-2. The producer struct(s) (`AudioFrame` / `ImuState`) + the `platform::read*` APIs. (The `Peripheral` role + SystemModule add/delete already exist.)
-3. The first audio peripheral — **MicrophoneModule** (canonical, highest value: FFT bands + beat).
-4. The first audio-reactive effect(s) consuming it.
-5. IMU and line-in slot into the same source-module + platform-API shape afterwards.
-
-Study the proven audio pipeline in MoonLight / WLED-MM (FFT band layout, AGC, beat detection) to inform our own — reference the approach, don't port their code, per [history](../history/README.md) practice. Specs before code: a `MicrophoneModule.md` (and the source-category contract) get written and reviewed before implementation.
-
----
+The **bottom-up landscape survey** is done — [livescripts-analysis-bottom-up.md](livescripts-analysis-bottom-up.md). It deep-reads the [ESPLiveScript fork](https://github.com/ewowi/ESPLiveScript/tree/fix-warnings) (a from-scratch C-like JIT that emits **native Xtensa** machine code — blazingly fast but **Xtensa-only**, so it covers classic+S3 and *not* P4/Teensy/desktop), surveys the field (PixelBlaze bytecode VM + web editor, WLED ARTI-FX AST-walking interpreter, embedded VMs / WASM / lightweight multi-ISA JITs), and extracts the load-bearing decisions (execution strategy, the IR seam ESPLiveScript lacks, the MoonModule binding, the per-pixel contract, memory placement, sync, sandboxing). Its thesis to validate: a **portable bytecode-VM baseline that runs on every target on day one + an optional native back-end for the hot ISAs behind a shared IR**. **The top-down redesign** is [livescripts-analysis-top-down.md](livescripts-analysis-top-down.md), generated from the prompt at the bottom of the bottom-up doc; it gives the reference architecture + staged spike plan. Implementation is multi-commit and spike-ordered, following the top-down plan. Credits: [history/hpwit-ESPLiveScript.md](../history/hpwit-ESPLiveScript.md).
 
 ## HTTP and OTA
 
@@ -370,46 +255,11 @@ What to build (~4 h):
 
 `HttpServerModule::handleConnection()` serves large embedded files (`app.js`, `style.css`) with the blocking `TcpConnection::write` — a page load can briefly stall `loop20ms`. One-shot per load (lower priority than the per-tick preview issue, which is fixed). Fix: serve large HTTP responses with `writeChunks` (the same non-blocking path used for preview frames).
 
----
-
-## Effects and preview
-
-### Add real z-axis variation to 2D effects (pending)
-
-Only **NoiseEffect**, **PlasmaEffect** and **RipplesEffect** have z-aware math. The other honest-D2 effects use `Layer::extrude` to duplicate the z=0 plane, so every z-slice is identical on 3D layers. Candidates for genuine D3 promotion: Metaballs/GlowParticles (add z to blob coordinates), Plasma palette/Spiral (add z-driven phase term), Fire (z-drift heat grid), Rings/LavaLamp/Checkerboard/Particles (add z to each element). Prioritise after seeing real 3D installations; each promoted effect also needs its `dynamicBytes` budget for the full 3D buffer.
-
-### Full-density interpolated preview for large layouts (backlog)
-
-The preview index-downsamples a large layout to fit the WS send budget (e.g. 128×128 = 16384 lights → ~1639 sent at stride 10), so the UI shows a sparse sample, not every light. To show **all** lights at their real positions with **interpolated** colours for the unsent ones:
-
-- Decouple the `0x03` coordinate-table density from the per-frame `0x02` stride. Positions are static and sent once, so the table can carry **all** light coordinates (16384 × 3 = ~48 KB one-time — acceptable off the per-frame path, possibly chunked) while the per-frame RGB stays strided to protect ArtNet/the link.
-- The browser holds the full position set and, per frame, interpolates each unsent light's colour from its nearest sent neighbours (the sent indices are known from the stride). True positions, guessed colours — better than the removed dense-box block-replicate because positions are exact.
-- Open questions: 48 KB one-time table vs `MAX_WRITE_CHUNKS` / send-buffer (needs chunked send or a raised cap, with the same partial-write care as `writeChunks`' drain); interpolation cost on a 16384-point cloud each frame in JS; whether nearest-neighbour or weighted is worth it.
-
-Not simple — own planning pass. Until then the preview is a faithful strided *sample* (correct shape/colour/motion, not per-pixel). A cheap interim (point-size scaled by stride to fatten samples into their cells) was tried and reverted as not what's wanted — it filled the volume but didn't add real points.
-
-### Self-describing preview frame header (mid term)
-
-The preview wire format is a private opcode protocol: `0x02` per-frame channels, `0x03` coordinate table, each a hand-rolled byte layout, and the colour payload is **always RGB** regardless of the buffer's `channelsPerLight`. Every new data kind (RGBW display, beam direction, …) means inventing another opcode and another fixed layout by hand. The minimal fix that stops that sprawl: a small **typed header** — `[type][format][count][stride]` where `format` enumerates `{RGB, RGBW, …}` — so one message kind carries any per-light channel layout and the browser shader reads `format` to interpret the payload. Do it concrete-first, when RGBW *display* (below) is actually wanted, not speculatively. Prereq for both items below.
-
-### RGBW preview end-to-end (mid term)
-
-The light `Buffer` already holds `channelsPerLight = 4` (RGBW), and the device output drivers handle it, but the **preview only ever sends/draws RGB** — the W channel is invisible in the UI. (The full-res fast path no longer penalises a cpl≥3 buffer — see the short-term fix — but it still drops W on the wire.) Once the self-describing header lands, carry the W channel on the wire and render it in the shader (W as a warm-white tint / brightness lift on the disc). Small, but gated on the header so it isn't another bespoke opcode.
-
-### Fixture model — moving heads, beams (long term)
-
-Today a "light" is a point at a static coordinate with a colour. A **moving head** is a fixture that emits a *beam* in a direction it controls live (pan + tilt), plus colour, beam-width, etc. — per-light **vector** state, not just colour, and a different draw (a cone/ray, not a disc). The static-positions-`0x03` + colour-`0x02` split can't express "this fixture's beam now points here." The industry-standard model is **DMX/GDTF fixtures**: a fixture has a position *and* a set of typed attributes (color, pan, tilt, beam). The preview becomes a fixture renderer (disc for a pixel, cone for a beam); this is also the "make Preview a general-purpose module, not light-specific" goal. A domain-model change (the fixture/attribute model), not just transport. Plan when moving heads are actually on the bench.
-
-### Extract the resumable backpressure transport as a domain-neutral channel (long term)
-
-The preview's transport — resumable cross-tick send from a stable buffer + newest-wins backpressure drop + adaptive graceful degradation (see [architecture.md § graceful degradation under transport backpressure](../architecture.md)) — is **payload-agnostic**: any bulky throttled stream (a future MJPEG/video preview, fixture-state streams, fleet telemetry) could ride it. The *payload* model (count/stride/RGB) is light-specific; the *byte-pump* is not. When a second consumer for this transport appears, promote the pump into a domain-neutral core primitive (a `ThrottledChannel`-style sink) that PreviewDriver becomes *a* producer on, rather than owning the protocol. Concrete-first: extract on the second use, not before — until then the seam stays inside HttpServerModule/PreviewDriver.
-
----
-
 ## Testing
 
 ### Additional test coverage (pending)
 
+- **Memory degradation cascade** — the output-buffer *allocation* decision (no buffer for a lone identity layer; a buffer for ≥2 layers or any LUT layer) is unit-pinned (`unit_Layers_container` "Drivers allocates the output buffer only when…"), and LUT-vs-identity is pinned by `unit_Layer_sparse_mapping`. What's **not** pinned is the *low-heap* half of [architecture.md § Degradation cascade](../architecture.md#degradation-cascade): under heap pressure the LUT + driver buffer are skipped *together* (`lutSkipped()` true, forced 1:1), and below that the layer buffer *reduces dimensions* (halving to an 8×8 floor) rather than failing. The hook exists — `unit_BlendMap` already uses `platform::setTestMaxAllocBlock` to force allocation failure for the paging test — so a test could cap the block size and assert: (1) LUT+output buffer both skip and `lutSkipped()` flips, (2) the layer buffer shrinks to fit and never goes null. Pre-existing gap (predates multi-layer); the *happy-path* allocation contract is covered, only the OOM-degrade branch isn't.
 - **UI page load time** — scenario step measuring HTTP response time for `/`, `/api/state`, `/api/system` via the live runner. Verifies acceptable load time on ESP32.
 - **Module teardown memory** — scenario that tears down all modules and verifies heap returns to pre-setup baseline. Confirms no lifecycle leaks.
 - **JavaScript test harness** — `vitest` + `jsdom` for the browser UI: pure helpers in `install-picker.js` (`isCompatible`, `parseFirmwaresFromAssets`, `relativeTime`) **and `app.js`'s conditional-control DOM logic** (`syncVisibleControls` — reconciles which control rows are rendered when a `hidden` flag flips). The C++/backend half of conditional controls IS unit-tested (`conditional_controls.h` + per-module tests pin the binding + `hidden` flag), but the **UI re-render half is not** — `syncVisibleControls` was the source of a real re-render-loop freeze (Network static-IP toggle) caught only on hardware. A `jsdom` test that builds a card, flips a control's `hidden`, runs the reconcile, and asserts the right rows appear/disappear (and that it converges — the unchanged→no-op fast path) would have caught it. **Attempted and reverted (2026-06-17):** stood up vitest + 13 passing tests for the install-picker pure helpers, but the high-value half (`syncVisibleControls`) needs either an `app.js` module seam or extracting its reconcile logic into a separate served `.js` (6 embed/route wiring edits for a firmware-served file). Judged not worth adding a whole Node/npm toolchain to a C++/Python repo to test ~3 small pure functions; the toolchain earns its place only once the `syncVisibleControls` DOM test (and a real body of JS logic) lands with it. **Do it as its own focused branch**, deciding the app.js seam first (it's already `type="module"`, so extracting `reconcileControlRows` into a served file — wired through `embed_ui.cmake` + the two HttpServerModule routes like the other UI .js — is the clean shape). Pure-helper `_test` exports + the reconcile extraction are the two pieces; both were prototyped in that reverted attempt.
@@ -425,8 +275,6 @@ Run a bare-leaving scenario before a tree-assuming one and the latter fails pre-
 
 Fix options: (a) make every live mutate scenario clear+rebuild its own canvas (consistent with the newer ones) so order never matters; or (b) have the live runner reboot / restore the canonical tree between scenarios. (a) is the cleaner long-term shape. Until then, the in-process suite is the gate; live full-suite runs need a clean boot per scenario, or run scenarios individually.
 
----
-
 ## Housekeeping
 
 ### Socket-pair fixture for HttpServerModule WS-send tests (test infra)
@@ -466,18 +314,62 @@ Rounds 1 (board + Ethernet-only) and 2 (Parlio LED driver) have landed. Remainin
 
   **Dev-loop note — reading the P4's runtime log over USB.** The P4-NANO's primary console is **UART on GPIO 37/38** (`CONFIG_ESP_CONSOLE_UART_DEFAULT`), not the USB port, so `ESP_LOGI` / `mm_net` lines are *not* visible over `/dev/cu.usbmodem*` by default — only the ROM boot banner and `std::printf`-to-stdout (which routes to the **secondary** USB-Serial-JTAG console) come through. Two workarounds when you need the runtime log over USB: (a) temporarily set `CONFIG_ESP_CONSOLE_USB_SERIAL_JTAG=y` (note the JTAG endpoint re-enumerates when the app starts, so a reader must reconnect across the drop — `idf.py monitor` handles it; a plain fixed `pyserial` handle dies); or (b) hang a USB-UART adapter on GPIO 37/38. This cost real time during the P4 no-DHCP hunt; the fastest signal there turned out to be a `printf` of the runtime struct (stdout → secondary JTAG console) plus a `git worktree` bisect (build an old commit, flash, check LAN reachability) to prove code-vs-hardware without needing the log at all.
 
-### Drop the i80 WR/DC sacrificial pins (S3 LcdLedDriver) via direct LCD_CAM
+### WiFi runtime disable (backlog)
+
+Compile-time answer already ships: `--firmware esp32-eth` excludes the WiFi stack. The default `esp32` already *cascades* — `ethInit()` runs first, WiFi only comes up if no PHY responds — so a wired board never associates over WiFi. What's still missing is reclaiming WiFi's **heap**: even when Ethernet wins the cascade, `esp_wifi_init`'s RX buffers stay allocated. This item skips that init entirely once Ethernet is up, freeing ~16 KB. Defer until the heap saving is worth the teardown-ordering risk.
 
-The S3 i80 LED path costs **two GPIOs the LEDs never use**: the IDF `esp_lcd` i80 bus hard-requires a WR (pixel clock) and a DC pin on real GPIOs (`esp_lcd_panel_io_i80.c`: `wr_gpio_num >= 0 && dc_gpio_num >= 0`), even though WS2812 strands ignore both. Today `LcdLedDriver` keeps overridable defaults (clockPin=10, dcPin=11) — peripheral-required, not user-strand wiring, so a default cannot do harm. **Two ways to reclaim the pins, neither trivial:**
-- **Cannot reuse a data pin for WR/DC.** A GPIO carries exactly one peripheral signal (`esp_rom_gpio_connect_out_signal` binds data_sig[i] / wr_sig / dc_sig each to its own pin); routing WR onto a data lane would clock the *clock* waveform onto that strand instead of its colour bytes. WR/DC must be distinct *physical* pins from the 8 data pins. (You CAN already point them at any otherwise-free or unstrapped GPIO via the controls — that's the "reuse a pin you're not using" answer; it's the *spare* pin you avoid, not a data pin.)
-- **Zero WR/DC pins needs bypassing esp_lcd** and driving the LCD_CAM peripheral's registers directly (hpwit's I2SClockless approach — legacy parallel mode has no DC concept and emits WR without a dedicated config pin). That's the only path to 8-pins-total on the S3. Cost: leaving the recognisable IDF `esp_lcd` API for register-banging (a *Common patterns first* hit), re-proving the driver bit-perfect on hardware (the loopback self-test is the proof). Benefit: 2 GPIOs back on a tight S3 board. Its own increment, not a pin-default tweak. Parlio (P4) already needs no extra pins (`clk_out_gpio_num = GPIO_NUM_NC`), so this is S3-i80-only.
 
-### LCD/Parlio DMA frame buffer → PSRAM (free internal SRAM for big frames)
+## UI
 
-For driving **lots of LEDs**, internal SRAM is the scarce resource and the parallel-driver DMA frame buffer is the biggest consumer (8 lanes × lights × outCh × 24 slot-bytes + latch pad). Today both parallel drivers allocate it as `MALLOC_CAP_DMA | MALLOC_CAP_INTERNAL` (`platform_esp32_lcd.cpp`, `platform_esp32_parlio.cpp`) — **internal SRAM only**, so a large frame can exhaust DRAM while PSRAM sits unused. The IDF confirms both peripherals' GDMA **can burst straight from PSRAM** on the S3/P4: `esp_lcd_panel_io_i80.c` sets `access_ext_mem = true` and itself allocates the buffer with `MALLOC_CAP_SPIRAM | MALLOC_CAP_DMA` when asked; `esp_driver_parlio/src/parlio_tx.c:158` sets `access_ext_mem = true  // support transmit PSRAM buffer`. (RMT already does the right thing — its symbol buffer goes through `platform::alloc`, which is PSRAM-first with an internal fallback.)
+Forward-looking companion to the shipped UI spec, [moonmodules/core/ui.md](../moonmodules/core/ui.md). The live spec describes the UI as shipped; this section holds what is **not** in it yet: deferred items, open design questions for 1.0, and the gap analysis against projectMM v1. The backward-looking half (how v1/v2 actually worked, patterns consciously rejected, recorded quirks) lives in [history/v1-inventory.md](../history/v1-inventory.md).
 
-**The change:** allocate the LCD/Parlio buffer `MALLOC_CAP_DMA | MALLOC_CAP_SPIRAM` first, falling back to internal when PSRAM is absent/full, using the **external-memory alignment** the IDF requires (`gdma_get_alignment_constraints` → `ext_mem_align`, typically the cache line — larger than the current 64-byte internal alignment) and keeping the buffer cache-aligned + its size a multiple of that alignment. **Why it's its own increment, not this commit:** it changes the proven hot DMA path, PSRAM DMA has real caveats (cache-line alignment, write-back/coherence on the encode→DMA handoff, and lower PSRAM bandwidth that the IDF guards with a CPU-MAX DFS lock during transmit), and it **must be re-proven on S3 + P4 hardware** (the loopback self-test bit-verifies it, then a real strip). Measure the bandwidth headroom too: a very wide, long frame at speed may want internal SRAM regardless. Scope: the two `heap_caps_aligned_alloc` sites + their `bufferBytes` alignment rounding + the capacity check; no domain-code change (the encode loop already writes through `dmaBuf_`).
+### Deferred to 1.x
 
-### WiFi runtime disable (backlog)
+- Side nav with drag-reorder of root modules (root order is fixed in `main.cpp` today; not painful — and arguably correct, see the gap-analysis note below)
+- Health panel (`<details>` + `GET /api/test`)
+- Log panel (`<details>` + WS `{t:"log",m:"…"}`)
+- Core affinity badge (C0/C1) — only meaningful when core pinning lands
+- Module `category()` field — taxonomy beyond `role()` for the picker (decision: derive from `role()` for now)
 
-Compile-time answer already ships: `--firmware esp32-eth` excludes the WiFi stack. The default `esp32` already *cascades* — `ethInit()` runs first, WiFi only comes up if no PHY responds — so a wired board never associates over WiFi. What's still missing is reclaiming WiFi's **heap**: even when Ethernet wins the cascade, `esp_wifi_init`'s RX buffers stay allocated. This item skips that init entirely once Ethernet is up, freeing ~16 KB. Defer until the heap saving is worth the teardown-ordering risk.
+### Open design questions
+
+These don't block the shipped baseline but should be answered before 1.0:
+
+- **Multi-layer UI** — [architecture.md](../architecture.md) plans for N layers blended into one Drivers. The current card layout shows one Layer. Likely needs a tab/accordion to switch layers, or a per-layer column.
+- **Modifier chain visualization** — show the modifier order visually. Today they're a flat list, and only the **first enabled** modifier actually applies (the `children[]` order is *not* yet an apply order — see [Composed modifiers](backlog-mixed.md#composed-modifiers--chain-the-whole-modifier-stack-not-just-the-first-planned-multi-commit)). This viz item only becomes meaningful *after* composed modifiers land; until then a chain UI would imply a stacking the engine doesn't do.
+- **Presets** — save/load named bundles of control values. Persistence already stores them; needs a UI surface.
+- **Canvas/node-graph view** — v2 attempted this. Powerful for complex setups but doubles the UI surface. A reasonable v3 follow-up gated on user demand.
+
+### Gap analysis — v1 features not yet in v3
+
+Inventory of v1 frontend behaviours v3 lacks, with a recommendation each. Items already shipped (control types, dragTs, two-timescale inputs, type picker, theme, scroll-shrink preview, status bar, reset-to-default, fps/ms toggle, drag reorder, side nav + drawer + footer) are not repeated.
+
+Legend: **Adopt-1.0** (small, high value) · **Defer-1.x** (needs engine work or a feature we lack) · **Drop** (not needed).
+
+### Per-card features
+
+| v1 feature | v3 today | Recommendation |
+|---|---|---|
+| Header: setup-dot before name | name only | **Defer-1.x** — needs `setupOk()` + `health()` on MoonModule with a real failure mode. Today both would always be `true` / `""`. |
+| Module ID shown separately from name | name only | **Defer-1.x** — add when instances need disambiguating (e.g. two effects of the same type under one Layer). |
+| Category emoji badge on the card header | role emoji in the picker, not on the card | **Defer-1.x** — `ROLE_EMOJI` already exists in `app.js`; showing it per-card is a small step if card scannability needs it. |
+| Core affinity badge (C0/C1) | core pinning not implemented | **Drop** until core pinning is a real engine feature. |
+| Memory split heap vs PSRAM | `static+dynamic` shown on the card | **Defer-1.x** — splitting `dynamicBytes` further needs `platform::isPsramPointer(p)` or per-alloc tracking, neither of which exists yet. |
+
+### WebSocket / panels
+
+| v1 feature | v3 today | Recommendation |
+|---|---|---|
+| Drag-to-reorder *root* modules (`POST /api/modules/reorder`) | not supported | **Drop** — root order is fixed in `main.cpp` and that's correct: Layouts/Layers/Drivers + system modules are mandatory and ordered. Children reorder via drag already. |
+| Log channel `{t:"log",m:"…"}` pushed by server | no server log push | **Defer-1.x** — needs an engine-side log producer. Gate: when boot/network/persistence logs become interesting to non-developers. |
+| Schema channel `{t:"schema",modules:[…]}` for tree-shape changes | full `/api/state` push every update | **Drop** — keep the full-tree push; re-evaluate only if WS bandwidth becomes a problem with large trees. |
+| System health panel (polls `GET /api/test`, pass/fail table) | none | **Defer-1.x** — needs a runtime `/api/test` that runs the doctest suite; `ctest` covers this for now. |
+| Log panel (ring buffer, severity colouring, stick-to-bottom, `GET /api/log` backfill) | none | **Defer-1.x** — pairs with the log WS channel; both arrive together. |
+
+### Cost / decision table
+
+| Cost class | Items |
+|---|---|
+| Tiny (< 30 lines, no backend) | category emoji badge on the card header |
+| Medium (minor backend change) | help-link mapping (needs docs site); richer `category()` than role()-derived |
+| Large (separate plan) | health panel + `/api/test`; log panel + WS log channel; OTA + GitHub-update badge; full multi-layer UI; presets UI |
diff --git a/docs/backlog/backlog-light.md b/docs/backlog/backlog-light.md
new file mode 100644
index 0000000..fc3d128
--- /dev/null
+++ b/docs/backlog/backlog-light.md
@@ -0,0 +1,137 @@
+# Backlog — light domain
+
+Forward-looking to-build items for the **light domain** (`src/light/`: drivers, effects, layouts, modifiers, preview) and its sensors. The core/infrastructure counterpart is [backlog-core.md](backlog-core.md); cross-domain items are in [backlog-mixed.md](backlog-mixed.md). Index + overview: [README.md](README.md). Completed items are removed.
+
+## Drivers
+
+### Extract shared lane-driver scaffolding when the 3rd parallel backend lands (deferred)
+
+The LcdLedDriver (S3 LCD_CAM i80) and ParlioLedDriver (P4 Parlio) share ~245 of 362 lines, and their platform-side loopback capture+verify is ~100 lines byte-for-byte identical (`platform_esp32_parlio.cpp` even notes "The RX capture half is byte-for-byte identical" to the LCD one). The status-string lifecycle (`failBuf_` / `configErr_` / `clearFailBuf` / `clearConfigErr`) is triplicated across all three LED drivers (RMT/LCD/Parlio), ~60 lines. The branch deliberately extracted the *encoders* (`LcdSlots.h` shared by i80+Parlio, `RmtSymbol.h`, `PinList.h`) on the "extract when the second user lands" rule, but stopped at the lifecycle/loopback scaffolding. **Accepted for this merge** (the reviewer agreed driver-level extraction can wait): the duplication is in mechanical lifecycle/test scaffolding, not domain logic, and a DriverBase-level refactor touching three drivers is riskier than the duplication it removes. **Do it when the third parallel backend arrives** (16-lane widening, or Teensy FlexIO), at which point the pattern is proven three ways: (a) a `detail::` platform helper for capture+verify (the only per-peripheral difference is the transmit call, so pass it in as a callback; the helper sits beside the already-shared `loopbackJumperOk`), and (b) a small owned-status helper or DriverBase members for the fail/config strings. Until then the cost is line count, not correctness.
+
+### 1..8-pin LCD output (future) — would let S3 default to LCD
+
+`LcdLedDriver` requires **all 8** i80 data lanes (`kExactLaneCount = true`, `LcdLedDriver.h`): the ESP-IDF `esp_lcd` i80 bus configures every data line of the bus width and rejects a partial set, so even a few WS2812 strands claim 8 GPIOs. That's why **S3 boards default to `RmtLedDriver`** in `deviceModels.json` (RMT runs one channel per pin, 1..N) rather than LCD — a board with fewer than 8 strips can't sensibly use the LCD driver, and the 8-lane LCD bench wiring (`1,2,4,5,6,7,8,9`) collides with common peripheral pins (e.g. the mic on 4/5/6). A **1..8-pin LCD mode** (drive only the lanes named in `pins`, leave the rest unclaimed — matching Parlio's flexibility) would let the parallel S3 path run any lane count, at which point an S3 board entry could choose LCD vs RMT by intent. Parlio already does this (`kExactLaneCount = false`, 1..8 lanes), so the P4 default *is* the parallel driver. Until LCD gains the same flexibility, S3 stays on RMT by default. Low priority — RMT covers the few-strip S3 case today.
+
+### Classic ESP32 I2S 16-lane parallel LED driver (future) — beyond RMT's 8 channels
+
+The **classic ESP32 has 8 RMT TX channels** (`platform_config.h`: "8 on classic ESP32, 4 on the S3 and P4"), so RMT covers up to 8 parallel outputs on classic ESP32 — e.g. the 8-output QuinLED Dig-Octa runs fine on `RmtLedDriver`. For **more than 8 lanes on classic ESP32**, the established trick drives the **I2S peripheral in LCD/parallel mode** (the hpwit [I2SClocklessLedDriver](https://github.com/hpwit/I2SClocklessLedDriver) / FastLED I2S lineage), clocking out up to **16 lanes** from one autonomous DMA transfer. This is the classic ESP32's high-lane-count path, distinct from the S3 (LCD_CAM → `LcdLedDriver`, plus the [1..8-pin LCD item](#18-pin-lcd-output-future--would-let-s3-default-to-lcd) above) and the P4 (Parlio). No catalog board needs it today (none exceeds 8 outputs), so no board's `planned` list points at it yet; it's the marker for a future ≥9-output classic-ESP32 board. Studied under *Industry standards, our own code* — carry the idea, write our own against the project architecture (host-testable encoder in `src/light/`, peripheral seam in `src/platform/esp32/`). **When it lands**, follow the per-chip driver-gating pattern now in `main.cpp` (each LED driver's `#include` + `registerType` is wrapped in `#if defined(CONFIG_SOC_<PERIPHERAL>_SUPPORTED)`, keyed off the SOC capability macro that backs its `platform_config.h` lane-count flag): the I2S driver gates on the relevant I2S/LCD SOC macro so it compiles + registers on classic ESP32 only, and adds an `i2sLanes` capability flag beside `rmtTxChannels`/`lcdLanes`/`parlioLanes`. Prior art: hpwit's I2SClockless lineage and FastLED's I2S driver; the same parallel-DMA lineage is already credited in [LcdLedDriver.md § Prior art](../moonmodules/light/drivers/LcdLedDriver.md#prior-art).
+
+## Sensors and audio-reactive input
+
+### Audio-reactive follow-ups
+
+The manual level + 16-band FFT spectrum has shipped ([AudioModule](../moonmodules/core/AudioModule.md); what landed and why is in [decisions.md](../history/decisions.md)). These are the deferred follow-ups, each its own increment:
+
+- **Per-band noise-floor (kill a steady single-frequency hum)** — the bench mic picks up a constant ~258 Hz tone (a mains harmonic via the mic/supply) that lights one band even in silence. A high-pass can't remove it (it's well above the ~40 Hz DC-blocker cutoff) without also killing real bass; the clean fix is a per-band adaptive floor that learns each band's idle baseline and subtracts it, so a constant tone in one band gates to dark while the others stay sensitive. Minimal version ≈ 16 floats of state + ~16 ops/frame. This is the next concrete audio step.
+- **Adaptive conditioning** — auto noise-floor / auto-gain / smoothing so the display self-calibrates to a room ("sound off → dark, sound on → vivid") instead of being tuned by hand. A self-calibrating version was prototyped and removed; the manual `floor`/`gain` is the shipped baseline. Reinvent from scratch when wanted, and **tune it in a quiet room** — a noisy environment (a strong, varying low-frequency ambient) is the adversarial case that made the prototype hard to settle. (The per-band floor above is the first piece of this.)
+- **Adaptive noise gate** — replace the borrowed `squelch`/`floor`-as-gate with a real noise gate: asymmetric bang-bang timing (open fast, close slow), a relative "detect silence" test (thresholds as factors of a learned floor, not absolute sample counts), keying off the RMS envelope we already compute, GEQ/FFT bands left untouched. A softhack007 concept; analysed and judged in full (good idea, industry-standard, but tight on the <30ms budget; decompose into steps rather than overhaul) in [AudioModule.md § Adaptive noise gate](../moonmodules/core/AudioModule.md#adaptive-noise-gate-forward-looking). The recommended sequencing: the per-band floor above is step 1 (its complementary frequency-domain half), the relative-threshold-over-RMS is the cheap high-value cherry-pick as step 2, hysteresis/timing step 3, log-domain + soft-gate optional. Eventually retires the manual squelch.
+- **Pin auto-scan** — detect the mic's `sdPin` with `wsPin`/`sckPin` fixed (a noise-prompt + confirm convenience); ships today with explicit pin controls.
+- **Beat / onset detection** beyond the raw peak; more audio effects (2D / palette-driven frequency-reactive).
+
+### GyroDriver → core Peripheral move + AudioModule-consistency pass (branched, not merged)
+
+A working **GyroDriver** (MPU6050 IMU over I²C) exists on an unmerged branch (commit `11f8eb7`, "Add GyroDriver (MPU6050) + generic platform I2C layer"); it is not in this branch's tree. This entry reverse-engineers that commit so the move is tracked now. **Verify against the real implementation when the branch merges, then delete this entry.**
+
+What the commit contains (reverse-engineered):
+
+- `src/light/drivers/GyroDriver.h` — reads an MPU6050 over I²C and surfaces five read-only telemetry controls (`gyroX`/`gyroY`/`gyroZ` rates in °/s, `pitch`/`roll` tilt angles). Polls the sensor in `loop20ms()` (50 Hz), formats the display strings in `loop1s()`. WHO_AM_I probe + wake on `setup()`, big-endian 14-byte burst parse, `atan2`-based tilt (no fusion filter).
+- A **generic, domain-neutral platform I²C master** (`platform::i2cInit`/`i2cWriteReg`/`i2cReadRegs`, 7-bit addressing) so future sensors reuse it; ESP32 impl on the IDF v6 `i2c_master` driver in a new `platform_esp32_i2c.cpp`, plus an MPU6050-shaped desktop simulation so the UI and host tests see live values without hardware.
+- `unit_GyroDriver.cpp` — WHO_AM_I probe, simulated burst parse, control formatting, time-ramp tracking.
+
+The move: it currently masquerades as an input-only **driver** under the Drivers container (a no-op `setSourceBuffer(Buffer*) override {}` is the tell). It belongs as a **SystemModule Peripheral** child, exactly like [AudioModule](../moonmodules/core/AudioModule.md) — both are sensor peripherals that poll hardware and publish read-only telemetry. On the move, make it consistent with AudioModule (the established sibling pattern):
+
+- **Relocate** `src/light/drivers/GyroDriver.h` → `src/core/` and its spec `docs/moonmodules/light/drivers/GyroDriver.md` → `docs/moonmodules/core/`; change `role()` to `Peripheral`; delete the `setSourceBuffer` no-op; rewrite the doc's "input-only driver under the Drivers container" framing.
+- **Pin controls + rebuild path.** GyroDriver hardcodes SDA/SCL (`static constexpr` 21/22, with its own "Hardcoded until BoardModule exposes I2C pin mapping" comment). AudioModule already shows the pattern: editable `uint16` pin controls + `controlChangeTriggersBuildState` + a `reinit()` on `onBuildState`. Adopting it retires the hardcoded-pins TODO and satisfies the robustness rule (reconfigure in any order).
+- **Lifecycle.** GyroDriver has `setup()` only — no `teardown()`. Add teardown for symmetry with AudioModule's setup/teardown/reinit (the shared I²C bus has little per-instance state to free, so this is consistency, not a leak fix).
+- **Document the cadence difference.** GyroDriver polls in `loop20ms()` (50 Hz is plenty for tilt); AudioModule reads in `loop()` every tick because I²S DMA must be drained promptly or it overflows. Both are correct; add a one-line "why this cadence" comment at each so the two siblings aren't "harmonised" into a bug.
+- **Wire it** in `main.cpp` as a Peripheral child of System under `markWiredByCode`, the same shape as AudioModule.
+
+Already done on this branch (the reverse direction): AudioModule's two live read-outs were switched from `addText`+`setReadOnly` to `addReadOnly` (the display-only type, matching SystemModule and the way GyroDriver already does it correctly) — so the telemetry idiom is consistent before the gyro branch even lands.
+
+### Sensor input on Raspberry Pi 5 — microphone, IMU, line-in (post-1.0, multi-commit)
+
+Audio-reactive (and motion-reactive) lighting is core to what WLED-MM / MoonLight are known for. The Pi 5 is the right host for it: it has the CPU and RAM for real FFT-based audio analysis that the Xtensa ESP32 struggles with, and a full Linux audio + I²C stack. None of this exists on the Pi today — the sensor work so far ([AudioModule](../moonmodules/core/AudioModule.md), the branched GyroDriver) does not reach Pi hardware, because the Pi currently runs the **desktop** platform backend (there is no `src/platform/rpi/`), which has no hardware access. So this is a domain expansion built on a real platform-backend prerequisite, not a small add.
+
+**Target sensors and their Pi 5 interfaces:**
+
+- **Microphone** — I²S MEMS mic, or a USB audio device read via ALSA. The high-value one: FFT → frequency bands + beat detection drive audio-reactive effects.
+- **Line-in** — the Pi 5 has no native analog input, so this is a USB audio interface / DAC HAT feeding the same audio pipeline as the mic; only the source differs.
+- **IMU / gyro** — an I²C device (MPU-6050 / 9250-class) on the Pi's I²C bus; tilt / motion → effect parameters.
+
+**How it fits the architecture (the load-bearing part):**
+
+1. **The module category exists — `ModuleRole::Peripheral`.** Peripherals are user-add/deletable children of SystemModule (a gyro `Peripheral` is planned to land there via the GyroDriver→core move). What's missing for audio-reactive is the *consumption* side: today a peripheral reads hardware and only displays its values, whereas effects need to consume them. That makes the sensor the producer in the [producer/consumer data-exchange model](../architecture.md#data-exchange-between-modules): it *produces* values (audio bands, IMU axes) as an `AudioFrame` / `ImuState`, the way effects produce a buffer that drivers consume. Define the producer struct domain-neutrally so it isn't audio-specific. Today's peripherals are display-only; wiring them into effects is the new work.
+2. **All hardware access stays behind the platform boundary.** New `platform::` APIs (e.g. `readAudio()` returning PCM/FFT, `readImu()` returning axes) with the ALSA / I²S / I²C implementation in a real `src/platform/rpi/` backend — which is itself the prerequisite that doesn't exist yet (the Pi uses the desktop backend today). No ALSA/I²C include or call outside `src/platform/`.
+3. **Effects consume sensor data the same way they read the layer.** An audio-reactive effect reads the current `AudioFrame` (bands/level/beat) the way `PreviewDriver` reads what `Layer` produces — through a plain data structure wired in `main.cpp`, not a direct hardware call.
+
+**Increments (each a normal domain addition, picked up one at a time):**
+
+1. A real `src/platform/rpi/` hardware backend (GPIO/I²C/I²S/ALSA) — the prerequisite; until it lands, the Pi runs the desktop backend with no sensors.
+2. The producer struct(s) (`AudioFrame` / `ImuState`) + the `platform::read*` APIs. (The `Peripheral` role + SystemModule add/delete already exist.)
+3. The first audio peripheral — **MicrophoneModule** (canonical, highest value: FFT bands + beat).
+4. The first audio-reactive effect(s) consuming it.
+5. IMU and line-in slot into the same source-module + platform-API shape afterwards.
+
+Study the proven audio pipeline in MoonLight / WLED-MM (FFT band layout, AGC, beat detection) to inform our own — reference the approach, don't port their code, per [history](../history/README.md) practice. Specs before code: a `MicrophoneModule.md` (and the source-category contract) get written and reviewed before implementation.
+
+## Effects and preview
+
+### Add real z-axis variation to 2D effects (pending)
+
+Only **NoiseEffect**, **PlasmaEffect** and **RipplesEffect** have z-aware math. The other honest-D2 effects use `Layer::extrude` to duplicate the z=0 plane, so every z-slice is identical on 3D layers. Candidates for genuine D3 promotion: Metaballs/GlowParticles (add z to blob coordinates), Plasma palette/Spiral (add z-driven phase term), Fire (z-drift heat grid), Rings/LavaLamp/Checkerboard/Particles (add z to each element). Prioritise after seeing real 3D installations; each promoted effect also needs its `dynamicBytes` budget for the full 3D buffer.
+
+### Full-density interpolated preview for large layouts (backlog)
+
+The preview index-downsamples a large layout to fit the WS send budget (e.g. 128×128 = 16384 lights → ~1639 sent at stride 10), so the UI shows a sparse sample, not every light. To show **all** lights at their real positions with **interpolated** colours for the unsent ones:
+
+- Decouple the `0x03` coordinate-table density from the per-frame `0x02` stride. Positions are static and sent once, so the table can carry **all** light coordinates (16384 × 3 = ~48 KB one-time — acceptable off the per-frame path, possibly chunked) while the per-frame RGB stays strided to protect ArtNet/the link.
+- The browser holds the full position set and, per frame, interpolates each unsent light's colour from its nearest sent neighbours (the sent indices are known from the stride). True positions, guessed colours — better than the removed dense-box block-replicate because positions are exact.
+- Open questions: 48 KB one-time table vs `MAX_WRITE_CHUNKS` / send-buffer (needs chunked send or a raised cap, with the same partial-write care as `writeChunks`' drain); interpolation cost on a 16384-point cloud each frame in JS; whether nearest-neighbour or weighted is worth it.
+
+Not simple — own planning pass. Until then the preview is a faithful strided *sample* (correct shape/colour/motion, not per-pixel). A cheap interim (point-size scaled by stride to fatten samples into their cells) was tried and reverted as not what's wanted — it filled the volume but didn't add real points.
+
+### Self-describing preview frame header (mid term)
+
+The preview wire format is a private opcode protocol: `0x02` per-frame channels, `0x03` coordinate table, each a hand-rolled byte layout, and the colour payload is **always RGB** regardless of the buffer's `channelsPerLight`. Every new data kind (RGBW display, beam direction, …) means inventing another opcode and another fixed layout by hand. The minimal fix that stops that sprawl: a small **typed header** — `[type][format][count][stride]` where `format` enumerates `{RGB, RGBW, …}` — so one message kind carries any per-light channel layout and the browser shader reads `format` to interpret the payload. Do it concrete-first, when RGBW *display* (below) is actually wanted, not speculatively. Prereq for the RGBW-preview and fixture-model items below.
+
+### RGBW preview end-to-end (mid term)
+
+The light `Buffer` already holds `channelsPerLight = 4` (RGBW), and the device output drivers handle it, but the **preview only ever sends/draws RGB** — the W channel is invisible in the UI. (The full-res fast path no longer penalises a cpl≥3 buffer — see the short-term fix — but it still drops W on the wire.) Once the self-describing header lands, carry the W channel on the wire and render it in the shader (W as a warm-white tint / brightness lift on the disc). Small, but gated on the header so it isn't another bespoke opcode.
+
+### Fixture model — moving heads, beams (long term)
+
+Today a "light" is a point at a static coordinate with a colour. A **moving head** is a fixture that emits a *beam* in a direction it controls live (pan + tilt), plus colour, beam-width, etc. — per-light **vector** state, not just colour, and a different draw (a cone/ray, not a disc). The static-positions-`0x03` + colour-`0x02` split can't express "this fixture's beam now points here." The industry-standard model is **DMX/GDTF fixtures**: a fixture has a position *and* a set of typed attributes (color, pan, tilt, beam). The preview becomes a fixture renderer (disc for a pixel, cone for a beam); this is also the "make Preview a general-purpose module, not light-specific" goal. A domain-model change (the fixture/attribute model), not just transport. Plan when moving heads are actually on the bench.
+
+### Extract the resumable backpressure transport as a domain-neutral channel (long term)
+
+The preview's transport — resumable cross-tick send from a stable buffer + newest-wins backpressure drop + adaptive graceful degradation (see [architecture.md § graceful degradation under transport backpressure](../architecture.md)) — is **payload-agnostic**: any bulky throttled stream (a future MJPEG/video preview, fixture-state streams, fleet telemetry) could ride it. The *payload* model (count/stride/RGB) is light-specific; the *byte-pump* is not. When a second consumer for this transport appears, promote the pump into a domain-neutral core primitive (a `ThrottledChannel`-style sink) that PreviewDriver becomes *a* producer on, rather than owning the protocol. Concrete-first: extract on the second use, not before — until then the seam stays inside HttpServerModule/PreviewDriver.
+
+## LCD / DMA driver work
+
+### Drop the i80 WR/DC sacrificial pins (S3 LcdLedDriver) via direct LCD_CAM
+
+The S3 i80 LED path costs **two GPIOs the LEDs never use**: the IDF `esp_lcd` i80 bus hard-requires a WR (pixel clock) and a DC pin on real GPIOs (`esp_lcd_panel_io_i80.c`: `wr_gpio_num >= 0 && dc_gpio_num >= 0`), even though WS2812 strands ignore both. Today `LcdLedDriver` keeps overridable defaults (clockPin=10, dcPin=11) — peripheral-required, not user-strand wiring, so a default cannot do harm. **Two ideas for reclaiming the pins — the first is impossible, the second is a substantial rewrite:**
+- **Cannot reuse a data pin for WR/DC.** A GPIO carries exactly one peripheral signal (`esp_rom_gpio_connect_out_signal` binds data_sig[i] / wr_sig / dc_sig each to its own pin); routing WR onto a data lane would clock the *clock* waveform onto that strand instead of its colour bytes. WR/DC must be distinct *physical* pins from the 8 data pins. (You CAN already point them at any otherwise-free or unstrapped GPIO via the controls — that's the "reuse a pin you're not using" answer; it's the *spare* pin you avoid, not a data pin.)
+- **Zero WR/DC pins needs bypassing esp_lcd** and driving the LCD_CAM peripheral's registers directly (hpwit's I2SClockless approach — legacy parallel mode has no DC concept and emits WR without a dedicated config pin). That's the only path to 8-pins-total on the S3. Cost: leaving the recognisable IDF `esp_lcd` API for register-banging (a *Common patterns first* hit), re-proving the driver bit-perfect on hardware (the loopback self-test is the proof). Benefit: 2 GPIOs back on a tight S3 board. Its own increment, not a pin-default tweak. Parlio (P4) already needs no extra pins (`clk_out_gpio_num = GPIO_NUM_NC`), so this is S3-i80-only.
+
+### LCD/Parlio DMA frame buffer → PSRAM (free internal SRAM for big frames)
+
+For driving **lots of LEDs**, internal SRAM is the scarce resource and the parallel-driver DMA frame buffer is the biggest consumer (8 lanes × lights × outCh × 24 slot-bytes + latch pad). Today both parallel drivers allocate it as `MALLOC_CAP_DMA | MALLOC_CAP_INTERNAL` (`platform_esp32_lcd.cpp`, `platform_esp32_parlio.cpp`) — **internal SRAM only**, so a large frame can exhaust DRAM while PSRAM sits unused. The IDF confirms both peripherals' GDMA **can burst straight from PSRAM** on the S3/P4: `esp_lcd_panel_io_i80.c` sets `access_ext_mem = true` and itself allocates the buffer with `MALLOC_CAP_SPIRAM | MALLOC_CAP_DMA` when asked; `esp_driver_parlio/src/parlio_tx.c:158` sets `access_ext_mem = true  // support transmit PSRAM buffer`. (RMT already does the right thing — its symbol buffer goes through `platform::alloc`, which is PSRAM-first with an internal fallback.)
+
+**The change:** allocate the LCD/Parlio buffer `MALLOC_CAP_DMA | MALLOC_CAP_SPIRAM` first, falling back to internal when PSRAM is absent/full, using the **external-memory alignment** the IDF requires (`gdma_get_alignment_constraints` → `ext_mem_align`, typically the cache line — larger than the current 64-byte internal alignment) and keeping the buffer cache-aligned + its size a multiple of that alignment. **Why it's its own increment, not this commit:** it changes the proven hot DMA path, PSRAM DMA has real caveats (cache-line alignment, write-back/coherence on the encode→DMA handoff, and lower PSRAM bandwidth that the IDF guards with a CPU-MAX DFS lock during transmit), and it **must be re-proven on S3 + P4 hardware** (the loopback self-test bit-verifies it, then a real strip). Measure the bandwidth headroom too: a very wide, long frame at speed may want internal SRAM regardless. Scope: the two `heap_caps_aligned_alloc` sites + their `bufferBytes` alignment rounding + the capacity check; no domain-code change (the encode loop already writes through `dmaBuf_`).
+
+
+## LED drivers — deferred
+
+The LED-driver increments **shipped**: increment 1 (RMT/WS2812B single-strand on classic ESP32 — [`RmtLedDriver.h`](../../src/light/drivers/RmtLedDriver.h), `RmtSymbol.h`, `platform_esp32_rmt.cpp`) and increment 2 (2a multi-pin RMT, 2b parallel LCD_CAM on the S3 — [`LcdLedDriver.h`](../../src/light/drivers/LcdLedDriver.h) via [`ParallelLedDriver.h`](../../src/light/drivers/ParallelLedDriver.h), `platform_esp32_lcd.cpp`), all with host + on-board-loopback tests, hardware-proven. The locked decisions, file-by-file phases, the WiFi-flicker test-rig analysis, and the bench deviations (8-GPIO i80 bus, 2.67 MHz slot clock, SOC-macro gate, real-frame loopback) are in [decisions.md](../history/decisions.md), the [driver docs](../moonmodules/light/drivers/RmtLedDriver.md), and the [analysis docs](leddriver-analysis-top-down.md). What remains here is only the work that has **not** shipped and is tracked nowhere else.
+
+- **sigrok/fx2lafw cross-check + MoonDeck "LED driver test" Python script** — the independent-clock proof and the run-from-MoonDeck flow ([analysis §5.3](leddriver-analysis-top-down.md)). The on-board RMT-RX loopback (shipped) is the cheap CI correctness gate but a *compromised witness* for WiFi-induced flicker — the RX capture runs on the same ESP32 whose WiFi causes the glitch. The real flicker test is a **sustained capture (seconds) with WiFi associated + a packet flood**, decoding every frame for a byte-slip or reset-gap deviation; it belongs with the core-1 driver-task work below, since that task pinning is the *fix* it validates. A DSLogic Plus (100 MS/s) upgrade is reactive — only if a flicker reproduces that 24 MS/s can't resolve.
+- **Dedicated core-1 driver task + per-module core-affinity control** ([analysis §7.2](leddriver-analysis-top-down.md)) — the WiFi-glitch mitigation, shared across all the LED drivers. (See also [backlog-core § Task core-pinning](backlog-core.md#task-core-pinning-backlog) for the general task-pinning question.)
+- **`rmtWs2812Show` fuller error handling** (deferred from PR #17 / 🐇 CodeRabbit). The shipped path has a finite `rmt_tx_wait_all_done` timeout (1 s) so a wedged DMA can't hang the render tick forever, and a dropped frame self-heals (the driver re-encodes the whole frame next tick). The fuller version — `rmt_transmit` return check, `rmt_tx_stop` to cancel an in-flight transfer on timeout, `show()` returning failure so `loop()` won't reuse `symbols_` mid-transmit — belongs with the **core-1 driver-task** work, since that task owns the buffer lifetime and in-flight state the cancel logic needs.
+- **Per-driver buffer window** — `start`/`count` controls on each physical driver, so different slices of the light buffer can go to different outputs (e.g. "some lights to ArtNet, others to LED pins"). Additive on `DriverBase` consumers when it lands — no change to the Drivers container or the buffer-passing contract; the multi-pin RMT slicing would then subdivide the driver's window instead of the whole buffer.
+
+  **This is the model for light distribution — distribution is *explicit*, not derived from driver order.** Worth stating because it's a common expectation otherwise: every driver reads the **same shared source buffer** ([`Drivers::passBufferToDrivers`](../../src/light/drivers/Drivers.h) hands the same `Buffer*` to every child) and selects *its* lights from *its own* controls — `NetworkSendDriver` via `universe_start` + `light_count` ("0 = whole buffer, >0 = the first N"), the LED drivers via their `pins` / `ledsPerPin`. There is **no running offset across driver siblings**, so **reordering drivers via drag-and-drop does not change which lights each driver outputs** — it only changes tick order and the persisted file order. A "split the buffer across drivers by sibling order" model (some controllers do this) is explicitly *not* what projectMM does; this `start`/`count` window is the deliberate alternative — the user says which slice goes where, order-independently. **Estimate: small — 1–2 commits.** Add `start` (alongside the existing `light_count` as `count`) to `DriverBase`'s windowing, clamp to the source buffer, apply in each driver's read loop, plus a unit test (two drivers, non-overlapping windows, assert each emits its slice) and a doc line. The wire/output loops already read a sub-range, so this is mostly lifting `light_count`'s "first N" into a "[start, start+count)" window on the shared base.
+- **Auto-derived DMA buffer count** (7 / 30 / 75 per [analysis §7.4](leddriver-analysis-top-down.md)), **16-bit pipeline + dither** ([§7.3](leddriver-analysis-top-down.md)), **shift-register expander stubs** ([§7.5](leddriver-analysis-top-down.md)).
+- **Moving-head preview = peer interpreter.** When moving heads land, the previewer must interpret channel semantics (pan/tilt/RGBW-at-arbitrary-indices) to render a moving fixture — the same light-preset model physical drivers use, interpreted to screen. This is *why* the increments named the abstraction "interpret the preset" rather than "apply correction / opt out": so Preview becomes a full peer here without a rename. Its own design plan when moving-head support starts.
+
+(The shared lane-driver scaffolding extraction — when a 3rd parallel backend lands — is tracked separately under [§ Extract shared lane-driver scaffolding](#extract-shared-lane-driver-scaffolding-when-the-3rd-parallel-backend-lands-deferred) above.)
diff --git a/docs/backlog/backlog-mixed.md b/docs/backlog/backlog-mixed.md
new file mode 100644
index 0000000..a9e5b4d
--- /dev/null
+++ b/docs/backlog/backlog-mixed.md
@@ -0,0 +1,53 @@
+# Backlog — mixed (core + light)
+
+Forward-looking items whose work genuinely spans **both** the core and light domains — a core mechanism interacting with a light driver/effect/modifier, where assigning it to one side would misrepresent it. Core-only items are in [backlog-core.md](backlog-core.md), light-only in [backlog-light.md](backlog-light.md). Index + overview: [README.md](README.md).
+
+## Cross-domain
+
+### MultiplyModifier mapping-LUT memory at large grids (investigation, re-verify on classic)
+
+`scenario_perf_full` on the S3 (2026-06-17) measured the MultiplyModifier's cost across grid sizes. The finding, stated correctly: the modifier **reduces compute** (with the default 2×2 kaleidoscope the effect renders only the ¼-size logical quadrant — Noise+Multiply at 16K is 29,647µs vs 50,555µs for Noise alone), and its real cost is **memory** — the 1:N fan-out mapping LUT. Measured modifier heap cost on the S3: 16²→1.7KB, 32²→10.8KB, 64²→23.5KB, **128²(16K)→93KB** (the LUT destinations array; `nrOfLightsType` is `uint32_t` on a PSRAM board). On the S3's 8MB PSRAM this is trivial. [Composed modifiers](#composed-modifiers--chain-the-whole-modifier-stack-not-just-the-first-planned-multi-commit) would multiply this memory cost by the chain depth — size it there.
+
+**This is NOT a no-PSRAM blocker** — 16K Noise + Multiply has run on a classic ESP32 (no PSRAM, 320KB internal) before at **10–20 FPS** (WiFi vs Ethernet), sending frames out over **ArtNet to a display, not physical LED drivers**. It works there because classic's `nrOfLightsType` is `uint16_t` (half the LUT size) and the modifier shrinks the logical render grid. So the action is **re-verify the working classic setup when a classic board is connected** (find the config — grid, mirror, ArtNet target — that reproduces the historical 10–20 FPS), not "fix an impossibility." Worth investigating only if that re-verification shows the LUT memory has regressed since then: the destinations array is the obvious lever (it stores a `nrOfLightsType` per physical destination; a 2× kaleidoscope is 1:1 in *count* so the LUT need not store fan-out > the physical count — confirm it isn't over-allocating to `maxMultiplier()` when the effective fan-out is 1). Capture the classic numbers into performance.md's multi-board table first.
+
+### Composed modifiers — chain the whole modifier stack, not just the first (planned, multi-commit)
+
+**Confirmed scope, not an open question:** multiple modifiers per Layer applied as a stack was always the plan, and it ships in **MoonLight** (Mirror, Rotate, Transpose, Kaleidoscope, … all composable on one layer — see [moonlight-inventory.md](../history/moonlight-inventory.md)). projectMM's single-modifier behaviour is the not-yet-finished state, not a design choice.
+
+Today a Layer applies **only the first enabled modifier**. `Layer::rebuildLUT()` finds the first enabled `Modifier` child and `break`s ([Layer.h](../../src/light/layers/Layer.h) `rebuildLUT`), and `Layer::loop()` ticks only that one (with an explicit comment that ticking a later one would desync the LUT, since a dynamic modifier's `loop()` can drive a rebuild the LUT must reflect). So with two modifiers on a Layer the second is dead weight — dragging it above the first is the only way to make it the active one. The intended behaviour is **modifier order = apply order**: a stack where each modifier reshapes the result of the one below ("modifiers on modifiers"), e.g. Multiply (kaleidoscope) *then* Rotate the kaleidoscoped result. The [modifier-chain-viz UI item](backlog-core.md#open-design-questions) is the surface for it and only becomes meaningful once this lands.
+
+**Mechanism — follow MoonLight's proven model, our own code** ([*Industry standards, our own code*](../../CLAUDE.md#principles)). MoonLight composes by streaming the layout's coordinates through each modifier's `modifyLayout`/`modifyLight` in order while the mapping table is built, so the *final* table already encodes the whole chain — the per-frame hot path stays a single lookup. We do the same with our pieces: `rebuildLUT()` walks the layout's coordinate stream (`Layouts::forEachCoord`) and passes each coordinate through modifier 1, then 2, …, then *n* before recording the destination, so the built `MappingLUT` is the composition `Mₙ ∘ … ∘ M₂ ∘ M₁` (modifier 1 applied first) collapsed to one `logical→driver` table. Composition is a **cold-path, build-time** concern; modifiers stay simple (each still answers `logicalDimensions()` + its own per-coordinate transform), so the complexity lives in the core per *[Complexity lives in core](../../CLAUDE.md#principles)*. Worth studying MoonLight's `PhysMap` 1:0/1:1/1:N packing (inventory §1) when sizing the table — a deep chain with fan-out is exactly where the per-entry byte cost matters.
+
+Why it's not a one-liner:
+
+- **Build path** — `rebuildLUT()` must iterate *all* enabled modifiers bottom-up, threading each stage's logical dimensions into the next, and fold the per-stage transforms into one final LUT. The single-modifier `maxDest` / fan-out ceiling math (the `maxMultiplier()` clamp that fixed the multiplyZ overflow) has to generalise to a **product** of multipliers across the chain — the dominant new correctness risk (and the memory blow-up noted in the MultiplyModifier-LUT item above: a 2-deep 2× chain is up to 4× the destinations).
+- **Tick path** — a dynamic modifier (RandomMapModifier, RotateModifier) calls back into `Layer::onBuildState()` on its timer to rebuild the LUT. With a chain, *any* dynamic stage rebuilding must recompose the *whole* chain, and `loop()` must tick every enabled modifier (not `break` after the first) in the right order, after the effect pass.
+- **Degrade path** — the per-stage OOM degrade (`degradeIdentity`) must decide what "degrade" means mid-chain (drop the offending stage? collapse to identity?) without leaving a stale partial LUT.
+- **Tests** — `unit_Layers_container` / the modifier unit tests pin single-modifier behaviour; composed-order needs new cases (A∘B ≠ B∘A, a disabled middle stage is skipped not collapsed, the fan-out product ceiling holds at no-PSRAM `uint16_t`), plus a scenario that reorders a 2-modifier stack and asserts the composite changes.
+
+**Estimate: medium — roughly 4–6 commits.** (1) design note pinning the coordinate-stream composition model + the fan-out-product ceiling rule (reference the MoonLight inventory); (2) `MappingLUT` compose/fold primitive + unit tests in isolation; (3) `rebuildLUT()` chain iteration + `loop()` tick-all-in-order, behind the existing single-modifier tests staying green; (4) degrade-path decision + tests; (5) reorder scenario + `performance.md` memory capture at depth 2–3; (6) UI follow-up (the modifier-chain-viz item — see the correction noted there). Gate the depth: most setups are 1 modifier, so the chain path must cost nothing when `n == 1` (the current fast path stays the `n == 1` branch).
+
+### Intermittent ~0.5 s LED pauses with the RMT driver (pending investigation)
+
+Observed on the bench (2026-06): LED output running on the RMT driver occasionally freezes for about half a second. Postponed by the product owner until more observations exist. Ranked suspects from the initial analysis, each with a cheap experiment:
+
+1. **WiFi modem power-save never disabled** — nothing in `src/` calls `esp_wifi_set_ps(WIFI_PS_NONE)`, so the IDF default `WIFI_PS_MIN_MODEM` is active; the radio's DTIM sleep causes exactly this class of intermittent multi-hundred-ms stall. WLED and the v1/v2 lineage disable sleep. Experiment: one line in the ESP32 platform code after association.
+2. **NetworkSendDriver sending synchronously every tick to an absent destination** (default `192.168.1.70`) — lwIP keeps re-ARPing a dead address while the send sits in the render tick. Data point (2026-06-10): the bench esp32-16mb had NetworkSend *disabled* in its persisted config, consistent with the pauses being annoying enough to switch the sender off. Experiment: point the ArtNet IP at a live host (or disable the driver) and see if the pauses stop.
+3. **`rmt_tx_wait_all_done` 1 s timeout** — a wedged transmission blocks the tick up to a full second (multi-pin: up to N×1 s). Least likely (~1 s, not ~0.5 s) but it's the only hard block in the driver itself.
+
+If pauses correlate with UI control changes, also consider the 2 s-debounced SPIFFS save stalling flash-resident code. The per-tick KPI log around a pause discriminates between these immediately.
+
+### NoiseEffect simplex cost on ESP32 (investigation)
+
+With mirror XY at 128×128, NoiseEffect renders the 64×64 logical quadrant in **~11 ms/tick** on the Olimex (measured) — the simplex math dominates, since the Xtensa LX6 has no FPU and float math is software-emulated. (RainbowEffect on the same pipeline is much cheaper.) This is correct, non-degraded behaviour; it's only worth revisiting if a deployment needs Noise faster than ~11 ms at this grid.
+
+Worth investigating if so:
+
+- **Q16 fixed-point simplex** instead of float (kills the software-float emulation cost).
+- **Lower-precision hash** — current simplex uses a 256-entry permutation lookup; a smaller / SIMD-friendly hash may be faster on Xtensa.
+- **Strided sampling + interpolation** — render at 32×32, bilinear up to 64×64. Visual quality cost; needs A/B comparison.
+- **Inline / unroll the inner per-pixel loop** to keep the simplex state in registers.
+
+None of these are obviously free, and a fixed-point port may shift the visual signature. Defer until there's a real use case — on the no-PSRAM Olimex at large grids the tick is dominated by the synchronous ArtNet send (~35 ms), not Noise, so the effect is rarely the bottleneck there.
+
+**S3 render-only data point (2026-06-17, `scenario_perf_full`):** on the PSRAM S3 with **no output driver**, Noise is the dominant cost at every grid and there's no ArtNet floor to hide it: 16²→738µs, 32²→2,831µs, 64²→11,235µs, **128²(16K)→50,555µs (~20 FPS)** — clean ~linear-in-pixels (67×), so no fragmentation/realloc pathology, just raw simplex compute. The lightweight effect (Checkerboard) on the same sweep is 6–11× faster (16K→7,949µs, ~128 FPS). So on a PSRAM board the heavy effect IS the 16K bottleneck (whereas on the Olimex it was the network send). This is the strongest case for the fixed-point/strided-sampling ideas above, since a PSRAM board can run 16K grids that the network-bound Olimex never reaches. The S3 has a real FPU (LX7), so the win is less about software-float emulation and more about per-pixel simplex work; profile before committing.
diff --git a/docs/backlog/leddriver-deferred.md b/docs/backlog/leddriver-deferred.md
deleted file mode 100644
index 6b78ece..0000000
--- a/docs/backlog/leddriver-deferred.md
+++ /dev/null
@@ -1,14 +0,0 @@
-# LED driver — remaining deferred items
-
-The LED-driver increments **shipped**: increment 1 (RMT/WS2812B single-strand on classic ESP32 — [`RmtLedDriver.h`](../../src/light/drivers/RmtLedDriver.h), `RmtSymbol.h`, `platform_esp32_rmt.cpp`) and increment 2 (2a multi-pin RMT, 2b parallel LCD_CAM on the S3 — [`LcdLedDriver.h`](../../src/light/drivers/LcdLedDriver.h) via [`ParallelLedDriver.h`](../../src/light/drivers/ParallelLedDriver.h), `platform_esp32_lcd.cpp`), all with host + on-board-loopback tests, hardware-proven. The locked decisions, file-by-file phases, the WiFi-flicker test-rig analysis, and the bench deviations (8-GPIO i80 bus, 2.67 MHz slot clock, SOC-macro gate, real-frame loopback) are in [decisions.md](../history/decisions.md), the [driver docs](../moonmodules/light/drivers/RmtLedDriver.md), and the [analysis docs](leddriver-analysis-top-down.md). What remains here is only the work that has **not** shipped and is tracked nowhere else.
-
-## Deferred
-
-- **sigrok/fx2lafw cross-check + MoonDeck "LED driver test" Python script** — the independent-clock proof and the run-from-MoonDeck flow ([analysis §5.3](leddriver-analysis-top-down.md)). The on-board RMT-RX loopback (shipped) is the cheap CI correctness gate but a *compromised witness* for WiFi-induced flicker — the RX capture runs on the same ESP32 whose WiFi causes the glitch. The real flicker test is a **sustained capture (seconds) with WiFi associated + a packet flood**, decoding every frame for a byte-slip or reset-gap deviation; it belongs with the core-1 driver-task work below, since that task pinning is the *fix* it validates. A DSLogic Plus (100 MS/s) upgrade is reactive — only if a flicker reproduces that 24 MS/s can't resolve.
-- **Dedicated core-1 driver task + per-module core-affinity control** ([analysis §7.2](leddriver-analysis-top-down.md)) — the WiFi-glitch mitigation, shared across all the LED drivers. (See also backlog [§ Task core-pinning](backlog.md#task-core-pinning-backlog) for the general task-pinning question.)
-- **`rmtWs2812Show` fuller error handling** (deferred from PR #17 / 🐇 CodeRabbit). The shipped path has a finite `rmt_tx_wait_all_done` timeout (1 s) so a wedged DMA can't hang the render tick forever, and a dropped frame self-heals (the driver re-encodes the whole frame next tick). The fuller version — `rmt_transmit` return check, `rmt_tx_stop` to cancel an in-flight transfer on timeout, `show()` returning failure so `loop()` won't reuse `symbols_` mid-transmit — belongs with the **core-1 driver-task** work, since that task owns the buffer lifetime and in-flight state the cancel logic needs.
-- **Per-driver buffer window** — `start`/`count` controls on each physical driver, so different slices of the light buffer can go to different outputs (e.g. "some lights to ArtNet, others to LED pins"). Additive on `DriverBase` consumers when it lands — no change to the Drivers container or the buffer-passing contract; the multi-pin RMT slicing would then subdivide the driver's window instead of the whole buffer.
-- **Auto-derived DMA buffer count** (7 / 30 / 75 per [analysis §7.4](leddriver-analysis-top-down.md)), **16-bit pipeline + dither** ([§7.3](leddriver-analysis-top-down.md)), **shift-register expander stubs** ([§7.5](leddriver-analysis-top-down.md)).
-- **Moving-head preview = peer interpreter.** When moving heads land, the previewer must interpret channel semantics (pan/tilt/RGBW-at-arbitrary-indices) to render a moving fixture — the same light-preset model physical drivers use, interpreted to screen. This is *why* the increments named the abstraction "interpret the preset" rather than "apply correction / opt out": so Preview becomes a full peer here without a rename. Its own design plan when moving-head support starts.
-
-(The shared lane-driver scaffolding extraction — when a 3rd parallel backend lands — is tracked separately in [backlog § Extract shared lane-driver scaffolding](backlog.md#extract-shared-lane-driver-scaffolding-when-the-3rd-parallel-backend-lands-deferred).)
diff --git a/docs/backlog/livescripts-analysis-bottom-up.md b/docs/backlog/livescripts-analysis-bottom-up.md
new file mode 100644
index 0000000..0add6d8
--- /dev/null
+++ b/docs/backlog/livescripts-analysis-bottom-up.md
@@ -0,0 +1,236 @@
+# MoonLive — live-script engine landscape analysis
+
+> **Forward-looking research document — exception to CLAUDE.md present-tense rule.** This is a Stage-1 bottom-up survey of *live scripting* for projectMM: running user-authored scripts (LED effects, layouts, modifiers, drivers, sensor logic) on a running device without a recompile-and-flash cycle. It deep-reads one reference implementation — the [ewowi/ESPLiveScript `fix-warnings` fork](https://github.com/ewowi/ESPLiveScript/tree/fix-warnings) of [hpwit/ESPLiveScript](https://github.com/hpwit/ESPLiveScript) — at HEAD on **2026-06-25**, surveys the comparable field (WLED ARTI-FX, embedded VMs, WASM), and extracts the architectural primitives a clean projectMM redesign must decide. Companion to the monthly digest [history/hpwit-ESPLiveScript.md](../history/hpwit-ESPLiveScript.md) (credits + activity log). The **top-down** redesign document ([livescripts-analysis-top-down.md](livescripts-analysis-top-down.md)) expands the decisions recorded here into the build spec. Source citations use `file:line` against the cloned fork; inferred claims are marked *(inferred)*. Modelled on [leddriver-analysis-bottom-up.md](leddriver-analysis-bottom-up.md).
+
+## TL;DR
+
+- **What live scripting is, and why projectMM wants it.** The same itch that produced WLED ARTI-FX and ESPLiveScript: author an effect (or layout, modifier, driver, sensor rule) *as text*, push it to a running device, see it run **on the next tick** — no toolchain, no flash, no reboot. It turns projectMM from "the effects we compiled in" into "any effect a user can write," and it's the natural home for a web-based pattern editor.
+- **The design space has three corners, set by *how* a script becomes execution.** (1) **AST-walking interpreter** — parse to a tree, walk it every frame (WLED **ARTI-FX**: everything stored as `double`, flexible, slow). (2) **Bytecode VM** — compile to a compact opcode stream, run a dispatch loop (**PixelBlaze**, most embedded Lua/JS). (3) **Native JIT** — emit real machine code, call it as a function (**ESPLiveScript**). Speed climbs (1)→(3); portability and simplicity fall (1)→(3). projectMM's "blazingly fast like ESPLiveScript" requirement points at (3), but (3) is exactly where portability dies — see below.
+- **ESPLiveScript is a from-scratch C-like compiler that JIT-emits native Xtensa machine code** (confirmed, not bytecode): `tokenizer.h` → `asm_parser.h` (AST of `NodeToken`) → visitor methods emit Xtensa assembly *strings* → `asm_parser_LMbin.h` encodes them to 32-bit opcodes → the binary is copied to executable RAM (`heap_caps_malloc(..., MALLOC_CAP_EXEC)`) and **called as a function pointer** via inline `callx8` (`execute_asm.h:386-399`). That direct-call, no-dispatch-loop design is the entire "85 fps C++ vs 10 fps Gravity vs 3 fps Lua" speed story from its README.
+- **The portability finding that reshapes everything: ESPLiveScript is Xtensa-only.** The agent deep-read confirmed **no RISC-V backend** — all codegen is Tensilica Xtensa LX (`asm_parser_LMbin.h`, the inline-asm executor). This matters enormously for projectMM's target order: classic ESP32 + S3 are Xtensa (✅ ESPLiveScript runs), but **ESP32-P4 is RISC-V** (❌), as are Teensy 4.x (ARM Cortex-M7) and desktop (x86-64 / ARM64). So ESPLiveScript as-is covers exactly the *first two* targets on projectMM's list and **none** of the rest. A native-codegen engine needs **one backend per ISA** (Xtensa, RISC-V, ARM Thumb-2, x86-64, ARM64) — that's the real cost of "blazingly fast everywhere."
+- **The front-end is portable; the back-end is not.** Tokenizer + parser + AST (`NodeToken`) are CPU-agnostic; only the *visitor → opcode* tier and the *load-and-execute* tier are ISA-bound. But today they're **deeply interleaved** — visitor methods emit Xtensa strings inline, there is **no intermediate representation (IR)** between AST and machine code. A clean redesign's load-bearing decision is whether to introduce that IR seam so one front-end feeds many back-ends (the LLVM shape, scaled down).
+- **The "compatible with MoonModule" requirement is the projectMM-specific value-add.** ESPLiveScript binds to the host via `addExternalFunction(name, ret, sig, fnptr)` / `addExternalVariable(name, type, _, ptr)` (`asm_external.h`) — a flat C-pointer registry. projectMM needs scripts to read/write **controls**, consume the **producer/consumer data structures** (a `Buffer`, an `AudioFrame`), and slot into the **module tree** as a scripted effect/layout/modifier/driver/peripheral. That binding layer — script ⇄ MoonModule — is ours to design; no surveyed engine has it.
+- **Memory + sync are already partly modelled in ESPLiveScript** and align with projectMM's constraints: compiled code lands in IRAM/PSRAM by target (`execute.h:10-15` gates PSRAM stack on S3/P4), a **save/load compiled-binary path** exists (`savebinary`/`executebinary` examples → compile once, ship the binary, skip re-compile on boot), and a `sync()` primitive coordinates concurrent script tasks. These are the right *ideas*; the redesign carries them forward against our `platform::` seam and `Scheduler`.
+- **Code-quality reality (for the redesign).** Header-only, ~18K lines across 11 headers, **pervasive global state** (`string signature; Token __t;` and dozens of file-scope compiler counters), no IR, no unit tests, a 4,100-line `Parser` and a 5,824-line `NodeToken`. It works and it's fast, but it is **not** a base to extend in place — it's the reference to learn from and rewrite against our architecture (exactly the *Industry standards, our own code* method we used for LED drivers).
+- **Recommendation: build our own native engine, Xtensa-first, behind an IR seam — start small, start beautiful, no dead-ends.** Take the ESPLiveScript *approach* (native machine-code execution, near-100% speed — the standout, never-done-before-in-this-space when bound to a module system) and add the one thing our multi-target goal needs that a single-ISA engine doesn't: put an **IR seam** between a platform-independent front-end (tokenizer→parser→AST) and the code generator. **Ship one backend first — Xtensa (classic ESP32 + S3)** — exactly where ESPLiveScript already proves native speed; that's the small, beautiful, blazingly-fast first deliverable. The IR seam is the **no-dead-end guarantee**: adding RISC-V (P4), ARM (Teensy), or x86/ARM64 (desktop) later is "write another backend behind the same IR," never "go back to the drawing board." ESPLiveScript's real dead-end isn't *Xtensa-first* — it's *Xtensa-welded-in, no IR*; we start at the same fast place but with the seam it lacks. **WASM/WAMR is the named fallback, per target**: a target without a native backend yet can run the portable path through the same IR, so we're never blocked — but the *flagship* experience is native. (Detail + why-this-over-WASM-wholesale in [§ Recommendation](#recommendation--native-engine-xtensa-first-behind-an-ir-seam).)
+- **Safety the same way — climb the tiers, don't pay upfront.** A user-facing script editor means a bad script must degrade, not brick. Start with the **cheap** safety (array **bounds-checking** = a compare-branch per indexed access, low single-digit %, and removable in a trusted/fast mode; **watchdog / instruction budget** to kill a runaway loop = near-free, the task WDT already does most of it) — these catch the common bad-script cases at low cost (the kind the `fix-warnings` null-deref was). The **expensive** tier — a true memory sandbox where a script *cannot* touch memory outside its arena — is exactly what WASM gives for free and native can't cheaply; leave it as a tier we *can* climb via the IR→WASM fallback if field experience demands it, not a wall we hit. So safety is staged, not a foregone full-sandbox cost.
+- **Ruled out (with reasons, so the top-down doesn't relitigate).** **FastLED's WASM** is browser *preview* (Emscripten-compiled FastLED in a Web Worker), not on-device scripting — adjacent, not it. **MicroPython/Python** is the right *edit* ergonomics but far too slow for the hot path (the Lua/Gravity wall that birthed ESPLiveScript). **Rust/TinyGo** are near-native but **AOT-compiled-and-flashed** — they remove no edit loop. **Adopting WASM/WAMR *wholesale* as the only engine** is the considered alternative, not a dead end — it wins portability + free sandbox but tops out at ~50% native (WAMR-AOT) and carries a 200KB+ runtime; we keep it as the per-target fallback rather than the flagship, because *native speed is the differentiator we're chasing*.
+- **Out of scope for Stage 1.** Final VM-vs-JIT decision; IR design; the web editor; benchmarking on real hardware; the language grammar spec. All Stage 2 (top-down).
+
+## Why this document exists
+
+projectMM compiles its effects, layouts, modifiers, and drivers into the firmware. Adding one means writing C++, building, and flashing. **Live scripting removes that loop**: a user writes an effect as text in a browser, the device compiles/loads it, and it runs as a first-class module on the next tick — the same leap WLED took with ARTI-FX.
+
+The product owner's requirements (verbatim intent):
+
+- **General in core, specific in light.** Scripts must work for domain-neutral core jobs (e.g. read/transform sensor data) *and* the light domain: a scripted **layout** (coordinate iterator), **effect** (writes the buffer), **modifier** (remaps positions), **driver** (consumes the buffer). One engine, many module roles.
+- **Target order.** ESP32 classic + S3 **first**; then P4 and other ESP32 flavours; then Teensy; then macOS / Linux / Windows.
+- **Blazingly fast, like ESPLiveScript** — near-native per-pixel throughput, because a script runs in the render hot path at up to 16K+ lights × 50 FPS.
+- **Smart memory management** — IRAM/PSRAM-aware, no hot-path allocation, compile-once/run-many.
+- **Infinitely scalable** — run *as many* live scripts concurrently as memory allows, exploiting PSRAM (each script is an independent compiled unit; the only ceiling is free heap, not a fixed slot count). Many small scripted modules — several effects across layers, a scripted modifier, a couple of core sensor rules — coexist; the device hosts what fits and degrades gracefully when it doesn't, the same way the light pipeline already scales to available memory.
+- **Sync with the rest of the system** — live reconfig (no reboot), `Scheduler`-driven, robust to add/delete/replace in any order, controls and producer/consumer data wired in.
+- **Compatible with the MoonModule class** — a scripted module is a MoonModule: it has controls, a `loop()`, a role, and renders generically in the UI with zero per-script UI code.
+
+This document characterises the one reference that already hits "blazingly fast" (ESPLiveScript), maps it against the field, and surfaces every decision the redesign must make. It does **not** pick the design — that's the top-down doc.
+
+## ESP32 — primary depth: ESPLiveScript (the reference)
+
+Read at `ewowi/ESPLiveScript@fix-warnings`, cloned 2026-06-25. ~18,358 lines across 11 header-only files in `src/`.
+
+### What it is, in one sentence
+
+A hand-written **C-like language with a from-scratch tokenizer → parser → AST → native-Xtensa code generator**, where the compiled script is loaded into executable RAM and **called directly as a function** — a JIT compiler, not an interpreter. Yves Bazin (hpwit) built it because Lua (3 fps) and Gravity (10 fps) couldn't drive his 12,288-LED panel where hand-written C++ hit 85 fps (README intro).
+
+### The pipeline (the load-bearing structure)
+
+Source text flows through five stages; the data structure between them is `Token` → `NodeToken` (the AST node) → assembly text → binary:
+
+1. **Tokenize** — `src/tokenizer.h` (2,394 lines). Lexes source into `Token`s with a `tokenType` enum. Also owns the user-defined-type registry (`_userDefinedTypes`, global).
+2. **Parse → AST** — `src/asm_parser.h` (1,929 lines) builds a tree of `NodeToken` (`src/NodeToken.h`, 5,824 lines). `NodeToken`'s `nodeType` enum has ~47 kinds (`binOpNode`, `defFunctionNode`, `forNode`, `ifNode`, `callFunctionNode`, `returnNode`, `defAsmFunctionNode`, …). A for-loop becomes a `forNode` with init/cond/incr/body children.
+3. **Generate code (visitor)** — `NodeToken::visitNode()` (`NodeToken.h:818-1001`) dispatches to `_visitbinOpNode()`, `_visitcallFunctionNode()`, etc., each of which **emits Xtensa assembly strings** into output buffers (e.g. `NodeToken.h:1858` emits `movi a%d,%d`). There is **no IR** — visitors know Xtensa directly.
+4. **Encode to binary** — `src/asm_parser_LMbin.h` (592 lines) turns assembly text into 32-bit Xtensa opcodes (`bin_add`, `bin_l32i`, `bin_movi`; e.g. `bin_add` at `:97-100` emits `0x800000 | …`).
+5. **Load + execute** — `src/execute_asm.h` (876 lines). `_createExcutablefromBinary()` (`:224-275`) copies the binary into executable RAM with `heap_caps_malloc(size, MALLOC_CAP_EXEC)` (`:232`), patches external references (relocation, `:44-223`), and `executeBinaryAsm()` (`:386-399`) runs it via inline asm: `l32i a15,%0,0 ; callx8 a15` — **a direct indirect call to the generated code.** No dispatch loop. That is the speed.
+
+### Why it's blazingly fast (confirmed)
+
+It is **native machine code called as a function** — the CPU fetches the script's own instructions from IRAM, exactly like a compiled C function. There is no per-opcode interpreter overhead (the cost a bytecode VM or AST-walker pays every operation). The README's benchmark (85 fps C++ ≈ ESPLiveScript ≫ 10 fps Gravity ≫ 3 fps Lua) is the direct consequence. Scripts can even drop to **inline Xtensa** for the hottest paths (`__ASM__ uint32_t millis() { "entry a1,32" … "retw.n" }`, `sc_examples/animwle.sc`).
+
+### What ties it to ESP32 — the portability barrier
+
+The agent's deep-read is unambiguous: **Xtensa-only, ESP-IDF-coupled.**
+
+- **Codegen is 100% Xtensa LX** (`asm_parser_LMbin.h`, all visitor emission). **No RISC-V, no ARM, no x86 backend exists.** Only ~1 arch `#ifdef` in the codegen — and it's a *memory-caps* choice (S3/P4 PSRAM stack vs classic internal, `execute.h:10-15`), not a second ISA. (Note the irony: that one `#ifdef` *mentions* ESP32-P4, but only for stack allocation — P4 is RISC-V, so the **generated code wouldn't run on it.** *(inferred from "Xtensa-only codegen" + P4 being RISC-V)*.)
+- **Execution is ESP-IDF-specific**: `MALLOC_CAP_EXEC` IRAM allocation, inline `callx8`, `rsr a14,234` cycle-counter reads, `xTaskCreatePinnedToCoreWithCaps` (`execute.h:590`).
+- **Front-end is portable, back-end is not**: tokenizer + parser + AST are CPU-agnostic; pipeline stages 3-5 (visit→opcode, encode, load-execute) are ISA/platform-bound and **interleaved** with no seam between them.
+
+So on projectMM's target list, ESPLiveScript as-is runs on **classic ESP32 + S3** and stops there. P4 (RISC-V), Teensy (ARM), and desktop (x86-64/ARM64) each need a *new code generator* — 2-3K lines per ISA *(inferred, agent estimate)* — or a different execution strategy entirely.
+
+### Host integration — the binding model
+
+A host C++ program drives it through `class Parser` (`ESPLiveScript.h:79`):
+
+- **Compile + run**: `parseScript(&str)` → `Executable`; `Executable::execute("fn", args)` runs a function; `executeAsTask("fn", core, args)` runs it pinned to a FreeRTOS core; `suspend()/restart()/kill()/free()` manage its lifetime (`execute.h:352+`).
+- **Expose a C function to scripts**: `addExternalFunction("calc","float","int",(void*)calcul)` → script calls `float h = calc(52);` (`asm_external.h`, README example).
+- **Expose a C variable**: `addExternalVariable("value","int","",(void*)&v)` and `("array","int *","",(void*)arr)` → script does `value = value + 2; array[i] = 10;`.
+- **Arguments**: `int` and `float` only (`ESPLivescriptRuntime.h:150-176`).
+- **JSON path** (`__JSON__OPTION__`): scripts exchange JSON with the host (`execute_asm.h:400-471`) — the `enjoy json` feature from the digest; the bridge a web editor would lean on.
+- **Precompiled binaries**: `parseScriptBinary()` → `saveBinary()/loadBinary()` → `createExecutableFromBinary()` (`execute_asm.h:276-384`). Compile once (on a desktop or web service), persist the `ESPLiveScript1.0.1`-format binary, load it on the device — but **external pointers are not serialized**, they re-bind at load (README). This is the seed of a smart compile-once memory strategy.
+
+This binding is a **flat C-pointer registry** — exactly what projectMM must *replace* with a MoonModule-aware layer (controls, producer/consumer structs, the module tree).
+
+### Memory model
+
+- Generated code → executable RAM via `MALLOC_CAP_EXEC` (IRAM on classic; PSRAM-capable on S3/P4 via `__LS_STACK_CAPS`, `execute.h:10-15`).
+- Script globals → a malloc'd `data` buffer; locals → the Xtensa ABI stack frame (`entry a1, size`); params → registers a2-a7.
+- Precompiled-binary persistence (above) = compile-once.
+- `Executable::free()` releases both code and data.
+- No PSRAM is *forced* for the data section; that's a knob the redesign would make policy.
+
+### The language (what a user writes)
+
+C-like, LED-oriented. From `sc_examples/*.sc` + README:
+
+- **Types**: `int`/`s_int` (32/16-bit), `uint8_t..uint32_t`, `float`, `char`, `bool`, plus **`CRGB`/`CRGBW`** (LED colour) as first-class; user `struct`s with fields, methods, constructors; multi-dimensional arrays (`int g[z][y][x]`).
+- **Control flow**: `if/else`, ternary, `while`, C-style `for`, `break`/`continue`, `return`; recursion (`sc_examples/fibonacci.sc`).
+- **Built-ins**: `printf`/`printfln` (int only), `millis()`, `rand`/`copy`/`memset`/`fill` (inline-asm in `functionlib.h`), `hsv()` and FastLED math when `USE_FASTLED` is set.
+- **Escape hatch**: `__ASM__ … @` blocks for hand-written Xtensa.
+- **Preprocessor**: `#define TOKEN value` (substitution only).
+- **Flavour example** — `sc_examples/animwle.sc` is a **Mandelbrot effect ported from an existing pattern** (`#define width 128`, float `cR/cI`, nested grid loops, inline-asm `millis()`), which tells you the target audience: people porting effects from other LED-scripting environments.
+
+### What the `fix-warnings` fork changed
+
+Despite the branch name, the fork's substantive change is **one commit (`4871509`, 2026-04-02): a null-pointer crash fix**, not a `-Wall` cleanup. `findMaxArgumentSize()` in `NodeToken.h` dereferenced `getChildAtPos(1)`/`(2)` unconditionally; a **nested external-function argument** (`setRGB(random16(NUM_LEDS), CRGB(0,0,255))`) produces a node without those children → `LoadProhibited` crash on device. The fix adds null guards (return 0 — a scalar needs no pre-call stack spill). *Relevance to projectMM*: this is precisely the class of bug a from-scratch hand-written parser breeds (no test harness caught it), and a data point for "rewrite with tests" over "extend in place."
+
+### Structural observations (what a multi-target rewrite must account for — not a verdict on the original)
+
+These are the differences between ESPLiveScript's design (one author, one ISA, maximum speed) and what projectMM's *different* goals (multi-target, module-bound, tested) need. They are reasons to write our own against our architecture, not faults — ESPLiveScript meets its own goals well.
+
+- **Header-only**, ~18K lines, 11 files; the two biggest (`NodeToken.h` 5,824, `ESPLiveScript.h` 4,100) carry several jobs each (tree + metadata + 47 visitors + asm emission). Fine for a single-include library; we'd split for testability.
+- **File-scope state**: `string signature; Token __t;` (`ESPLiveScript.h:29-30`), plus global register-allocation stacks, output buffers, compiler counters. A consequence: one compilation at a time. Acceptable on a device that compiles one script; we'd encapsulate it.
+- **No IR** between AST and Xtensa — the one structural thing that makes multi-target hard, and the single highest-leverage change our redesign makes. (ESPLiveScript didn't need it — it targets one ISA.)
+- **`.ino` integration examples, no unit suite** — natural for an Arduino library; we'd add unit + scenario tests because robustness is pinned by tests here.
+
+The lesson is the LED-driver lesson: **study it hard, credit it (see § Prior art & credits), write our own against our architecture and goals.**
+
+## The comparable field (what else to learn from)
+
+projectMM's "industry standards" rule says: name the prior art, take the textbook approach. The live-scripting field has three established design points; ESPLiveScript is the extreme of one.
+
+### WLED ARTI-FX — the AST-walking interpreter (our sibling project)
+
+[ARTI-FX](https://mm.kno.wled.ge/moonmodules/arti-fx/) (MoonModules, by ewowi — the author of this analysis — built on the **ARTI** runtime, a PEG-grammar-driven interpreter) parses a script and **walks the AST every frame**. Every value is stored as a **`double`**, converted to int when needed; scripts define `renderFrame` (per-frame) + `renderLed` (per-LED) callbacks and call `setPixelColor`/`setRange`/`fill`. Host binding is `arti_external_function` / `arti_set/get_external_variable` (the same flat-registry shape as ESPLiveScript). **What it contributes:** it proved live scripting works end-to-end in this ecosystem, and its design is maximally flexible and portable — pure C++ tree-walking, runs anywhere unchanged. The `double`-everything per-LED walk trades per-frame speed for that flexibility, which is the trade projectMM's 16K hot path can't take (and exactly the gap ESPLiveScript's native path closes). So the two are complementary baselines: ARTI-FX is the **reach** baseline (runs everywhere, the product shape proven), ESPLiveScript is the **speed** baseline (native, Xtensa) — and projectMM wants both, which is why neither alone is the answer.
+
+### WASM on ESP32 — the strongest off-the-shelf portable-runtime candidate (answering "is WASM what we want?")
+
+WebAssembly is a portable **bytecode standard** with mature small runtimes that **already run on the ESP32**, which makes it the most serious "don't build the engine, adopt one" option for the multi-target problem ESPLiveScript can't solve. Two runtimes matter:
+
+- **wasm3** — an ultra-light **interpreter** in C (~64 KB code, ~10 KB RAM) that runs on Arduino-class MCUs and up. Pure interpretation, so *slower* (the per-opcode dispatch cost, same class as a bytecode VM) — fine for control logic, questionable for a 16K-pixel inner loop.
+- **WAMR (WebAssembly Micro Runtime)** — supports interpreter **and AOT/JIT**; in **AOT mode WAMR reaches ~50% of native speed**, "quite acceptable" for embedded use, at a larger footprint. Rule of thumb from the field: **RAM < 256 KB → wasm3, > 256 KB → WAMR**; the classic ESP32's 320 KB+ puts it in WAMR's range. ([arXiv survey](https://arxiv.org/html/2512.00035v1), [WAMR-ESP32](https://registry.platformio.org/libraries/mlaass/WAMR-ESP32))
+
+**Why this is genuinely relevant to projectMM**, and arguably *the* answer to "runs everywhere":
+
+- **One artifact, every target.** A script compiled to `.wasm` runs on classic/S3/P4/Teensy/desktop through the same runtime — no per-ISA backend, which is exactly ESPLiveScript's missing piece. WASM **is** the portable IR + VM, off the shelf.
+- **WAMR-AOT is the "blazingly fast" bridge.** AOT-compiling the `.wasm` to native on the device (or on a host) gets ~50% of native — between a naive bytecode VM and ESPLiveScript's near-100%. That's the same "portable baseline + native acceleration" shape the bottom-up proposes, but **already built and multi-ISA** (WAMR's AOT backends cover Xtensa, RISC-V, ARM, x86).
+- **Sandboxed by design.** WASM is memory-safe and bounds-checked — a runaway/bad script traps instead of bricking the device (the safety story ESPLiveScript's native code lacks; recall the `fix-warnings` null-deref).
+- **Mature toolchain + editor path.** Any language that targets WASM (C/C++, Rust, AssemblyScript ≈ TypeScript) becomes a script source; the browser already runs WASM natively, so a web editor could compile *and preview* the exact artifact the device runs.
+
+**The costs / open questions** (the top-down must weigh): the runtime is **heavier** than a hand-rolled VM (WAMR is 200 KB+; wasm3 is light but interpreter-only); the **host-binding** for WASM (imports/exports, linear-memory marshalling of a `Buffer`/`AudioFrame`) is more ceremony than ESPLiveScript's flat pointer registry and must be designed against the MoonModule data model; the **toolchain** (a WASM compiler in the editor path) is a real dependency; and **whether WAMR-AOT actually holds 16K×50FPS** on an S3 is the load-bearing benchmark. But as a way to get *every target on day one with sandboxing for free*, WASM is the candidate to beat — the top-down should evaluate "WAMR as the engine" head-to-head against "our own VM+IR."
+
+### FastLED's WASM — adjacent but **not** what we want
+
+FastLED's `master` WASM support (`src/platforms/wasm/`) compiles **FastLED itself to WebAssembly via Emscripten to run in a *browser*** — a **simulation/preview** of effects, not a runtime that runs user scripts *on the ESP32*. It runs FastLED in a Web Worker (`PROXY_TO_PTHREAD`), bridges C++↔JS via `EMSCRIPTEN_KEEPALIVE` exports (`js_bindings.cpp`), and exports frame/strip/UI data as JSON for the page to draw. FastLED's `FxEngine` is likewise a *compiled* effect manager (switch/transition between C++ effects), not an on-device scripting language. So FastLED gives projectMM **two adjacent ideas, neither the live-script engine**: (1) "compile your effect library to WASM to **preview it in the browser**" — a preview technique that sits next to projectMM's own 3D WebGL preview, not the scripting engine; (2) precedent that the WASM toolchain is production-ready. It does **not** answer the on-device live-scripting need. ([FastLED wasm platform](https://github.com/FastLED/FastLED/tree/master/src/platforms/wasm))
+
+### Compiled languages (Rust / TinyGo) and interpreted Python — why neither is the answer (answering the Rust/Python question)
+
+- **Python / MicroPython is too slow for the hot path** — the benchmark literature is consistent: MicroPython is *"many times slower"* than C/Rust/TinyGo on ESP32 ([MDPI study](https://www.mdpi.com/2079-9292/12/1/143)). It's the same wall hpwit hit (Lua 3 fps, Gravity 10 fps) that *caused* ESPLiveScript. So "Python is an interpreter, so live-editing is easy" is true for the *edit loop* but fails the *speed* requirement at 16K×50FPS. Its real value is the **REPL/editor UX** reference, not the engine. (For non-hot-path *core* scripts — a slow sensor rule at 1 Hz — an interpreter's speed is irrelevant and Python-class ergonomics would be fine; this argues again for a **tiered** answer: cheap interpreter acceptable off the hot path, fast path needs VM/native.)
+- **Rust / TinyGo are fast but *compiled*, not interpreted** — Rust-on-ESP32 (`esp-hal`, `no_std`) and TinyGo land near C speed, but they are **AOT-compiled and flashed** — they need a toolchain and a reflash, which is *exactly the loop live scripting exists to remove*. They give no live-edit story on their own. (Rust *does* become relevant via WASM: Rust → `.wasm` → WAMR is a legitimate script-authoring path, but then the engine is WASM, not Rust-on-device.)
+- **Net:** interpreted-Python solves edit-speed but not run-speed; compiled-Rust solves run-speed but not edit-speed. The only options that give **both** live edit *and* hot-path speed are (a) a custom VM/native engine (ESPLiveScript's path, our redesign) or (b) **WASM+WAMR-AOT** (portable, sandboxed, ~50% native). Those two are the real finalists.
+
+### Other embedded VMs / JIT libraries (textbook back-ends)
+
+- **Lua / eLua / Luau** — the canonical embeddable scripting VM (register-based bytecode); the reference for a clean host C API and a GC'd value model. Too slow per-pixel raw (hpwit measured 3 fps), but the *architecture* (compile → bytecode → register VM) is the textbook.
+- **Espruino** — JS on MCUs; full-language, GC-paused; an editor/REPL UX reference, the "too much" end for a per-pixel hot path.
+- **LLVM / MIR / GNU lightning** — real JIT libraries with multi-ISA back-ends. LLVM is far too big for an MCU; **MIR** and **GNU lightning** are lightweight JITs that *do* target multiple ISAs and are the closest prior art to "one front-end, many native back-ends" if we go the custom-native-multi-target route (the alternative to adopting WASM).
+
+### The design-space map
+
+| Approach | Example | Speed (per-pixel) | Portability | Runtime size | Sandbox | Editor-friendliness |
+|---|---|---|---|---|---|---|
+| AST-walk interpreter | WLED **ARTI-FX** | Low (double-everything) | **Highest** (pure C++) | Small | Easy | High |
+| Bytecode VM | Lua, PixelBlaze | Medium-High | **High** (one VM, any CPU) | Small-Medium | Easy | High |
+| **WASM interpreter** | **wasm3** | Medium | **Highest** (standard) | ~64 KB | **Built-in** | High (any→wasm) |
+| **WASM AOT/JIT** | **WAMR** | **~50% native** | **Highest** (standard, multi-ISA) | 200 KB+ | **Built-in** | High (any→wasm) |
+| Native JIT (custom) | **ESPLiveScript** | **Highest** (native) | **Lowest** (one backend/ISA) | Medium | None (can crash) | Medium |
+
+projectMM wants ESPLiveScript's **speed** *and* ARTI-FX's **reach** — no single *custom* corner gives both, which is why one redesign path is a **layered custom** engine (portable VM baseline + optional native back-end behind a shared IR). But **WASM+WAMR-AOT collapses that table into one row**: portable to every target *and* ~50% native *and* sandboxed, off the shelf. The two real finalists for the top-down are therefore **(A) build our own VM+IR (+ optional native backend)** vs **(B) adopt WASM/WAMR as the engine** — weighed on hot-path speed (does WAMR-AOT hold 16K×50FPS?), runtime footprint, and how cleanly each binds to the MoonModule data model.
+
+## Architectural primitives observed (the decisions the redesign must make)
+
+Distilled across all four references, these are the load-bearing choices a clean engine faces — the *questions* the survey raises. Each is **decided and designed in the top-down**; listed here so the survey names what's at stake.
+
+1. **Execution strategy** — AST-walk vs bytecode-VM vs native-JIT (or a tier ladder). *The* decision; everything follows. ([top-down §2](livescripts-analysis-top-down.md#2-why-native-and-why-our-own-expanding-decision-1))
+2. **The IR seam** — ESPLiveScript emits Xtensa directly (right for one ISA); a multi-target redesign adds a representation between AST and execution so one front-end feeds many backends. The highest-leverage structural change. ([§3.2](livescripts-analysis-top-down.md#32-the-three-tiers-where-the-ir-seam-lives))
+3. **Host-binding model** — the surveyed engines bind to the host through a flat name→pointer registry (ESPLiveScript's `addExternalFunction`, ARTI-FX's `arti_*`) or, for WASM, through imports/exports with linear-memory marshalling; projectMM's value-add is a MoonModule binding (controls, producer/consumer structs, module role) with no prior art to copy. ([§3.4](livescripts-analysis-top-down.md#34-the-host-binding--script--moonmodule-decision-7-the-value-add))
+4. **Per-frame contract** — script writes its own `loop()` vs an engine-called `renderLed()`; determines the hot-loop shape and where per-pixel dispatch lands. ([§3.4](livescripts-analysis-top-down.md#34-the-host-binding--script--moonmodule-decision-7-the-value-add))
+5. **Compile-once / persist** — a saved artifact skips device-side recompile; portable (one artifact) with a VM/WASM, per-ISA with native. ([§3.7](livescripts-analysis-top-down.md#37-memory-placement--infinite-scalability-routed-through-platform-decisions-smart-memory-infinitely-scalable))
+6. **Memory placement** — code IRAM/PSRAM, data internal/PSRAM, per-target; routed through `platform::` as one policy. ([§3.7](livescripts-analysis-top-down.md#37-memory-placement--infinite-scalability-routed-through-platform-decisions-smart-memory-infinitely-scalable))
+7. **Concurrency + sync** — in-tick vs a pinned task; the threading contract against the scheduler + no-blocking-hot-path rule. ([§3.8](livescripts-analysis-top-down.md#38-execution-model--inline-by-default-task-as-the-exception-decision-sync))
+8. **Live reconfig + robustness** — a re-pushed script swaps in tick-atomically, old freed, no reboot, no mid-render crash. ([§3.6](livescripts-analysis-top-down.md#36-live-reconfig--tick-atomic-hot-swap-decision-sync))
+9. **Safety / sandboxing** — native can crash, a VM can bound; a user-facing editor raises the stakes. Coupled to the execution-strategy choice. ([§4](livescripts-analysis-top-down.md#4-safety--staged-decision-6))
+
+## Mapping to projectMM's requirements
+
+| Requirement | ESPLiveScript today | What the redesign must add |
+|---|---|---|
+| Blazingly fast | ✅ native Xtensa | Keep native speed *where the ISA has a backend*; VM elsewhere |
+| Core (sensor data) + light (layout/effect/modifier/driver) | ⚠️ generic funcs only; no module roles | The MoonModule binding + per-role entry-point contracts |
+| ESP32 classic + S3 first | ✅ (both Xtensa) | Carry forward (native backend) |
+| P4 + other ESP32 | ❌ P4 is RISC-V | RISC-V backend *or* VM fallback |
+| Teensy | ❌ ARM | ARM backend *or* VM |
+| macOS/Linux/Windows | ❌ x86/ARM + no IRAM | Desktop backend *or* VM (VM is the obvious win here) |
+| Smart memory | ⚠️ one `#ifdef`, IRAM/PSRAM | Route through `platform::alloc`; compile-once artifact |
+| Infinitely scalable (N scripts) | ❌ examples run one script | Independent `MoonLive` per module; code+data arenas PSRAM-first; ceiling = free heap, not a fixed count |
+| Sync with system | ⚠️ FreeRTOS tasks + `sync()` | `Scheduler` tick contract; tick-atomic hot-swap; live reconfig |
+| MoonModule-compatible | ❌ flat C registry | Scripted module = MoonModule (controls, loop, role, generic UI) |
+
+The pattern is clear: **ESPLiveScript nails speed on two chips and nothing else on this list.** Every other requirement is new work, and the multi-target + MoonModule-binding pieces are the bulk of it.
+
+## Recommendation — native engine, Xtensa-first, behind an IR seam
+
+The survey lands on a clear direction (mirroring the LED-driver bottom-up's "walk Scenario B" call, not an open fork): **build our own native-codegen engine, ship the Xtensa backend first, put an IR seam between the front-end and the code generator from day one — start small, start beautiful, extend with no dead-ends.** Native speed (near-100%) is the differentiator; the IR seam is the no-dead-end guarantee that makes "Xtensa-first" safe (RISC-V/ARM/desktop are each a new backend behind the unchanged IR); WASM/WAMR is the per-target fallback, never the rival; safety is staged (cheap bounds+watchdog first, true sandbox deferred to the WASM fallback).
+
+The full reasoning — why native over WASM-wholesale, why Xtensa-first isn't a corner, the cost accepted, the load-bearing spike — **is expanded in the top-down** ([§2 Why native](livescripts-analysis-top-down.md#2-why-native-and-why-our-own-expanding-decision-1), [§9 Staged plan](livescripts-analysis-top-down.md#9-staged-plan--the-moonlight-tutorial-ladder-as-the-spine)), and the decisions it rests on are recorded verbatim in [§ Answers — product-owner direction](#answers--product-owner-direction-2026-06-25) below. This section is the survey's conclusion; the build spec is the top-down.
+
+## Prior art & credits
+
+Per *Industry standards, our own code*: study the prior art, credit it by name, write our own. This redesign rests on work others did first.
+
+- **ESPLiveScript — Yves Bazin (hpwit).** The native-codegen approach the recommendation builds on is his. A from-scratch C-like compiler — tokenizer, parser, register allocator, Xtensa code generator, save/load compiled-binary path, header-only — that runs a script at near hand-written-C++ speed on an ESP32 (85 fps on a 12,288-LED panel where Lua managed 3 and Gravity 10). That is the result that makes "go native, not interpreted" the right call, and the reason this document exists. The structural notes below (global state, no IR, large files) are what a *rewrite toward a different goal* — multi-target, module-bound — has to account for; they are not a verdict on the original, which does its job and does it fast. We carry the idea forward and add the IR seam + the MoonModule binding.
+- **ARTI-FX / ARTI — ewowi.** The prior projectMM-family answer to the same problem, written by this analysis's author: the interpreted-effects runtime in WLED MoonModules, on the PEG-grammar ARTI interpreter. It proved the live-scripting idea works end-to-end in this ecosystem (load a script, run it live), and it is the source of lessons carried straight into this design — the `renderFrame`/`renderLed` split, the host-binding shape, and, by being the AST-walking design, the clearest demonstration of *why* a 16K hot path wants native or VM execution over tree-walking. The redesign trades its interpreter for native speed; it keeps its product shape and its lessons.
+- **MoonLight — MoonModules** (the [effects tutorial](https://moonmodules.org/MoonLight/moonlight/effects-tutorial/), the staging spine and the host-binding surface model). See the per-engine sections above for what each contributes.
+
+Activity + credits also in the digest [history/hpwit-ESPLiveScript.md](../history/hpwit-ESPLiveScript.md).
+
+## Risks and unknowns
+
+The open questions the survey surfaced are **resolved in the top-down**, each in its own section: the load-bearing speed unknown — can native-with-safety hold 16K×50FPS, else fall back to WASM — is the first spike ([top-down §9.2](livescripts-analysis-top-down.md#92-the-ladder)); IR design ([§3.2](livescripts-analysis-top-down.md#32-the-three-tiers-where-the-ir-seam-lives)); the per-pixel-vs-per-frame contract ([§3.4](livescripts-analysis-top-down.md#34-the-host-binding--script--moonmodule-decision-7-the-value-add)); the MoonModule-binding mechanics ([§3.3–3.4](livescripts-analysis-top-down.md#33-a-scripted-module-is-a-moonmodule-decision-7)); safety depth ([§4](livescripts-analysis-top-down.md#4-safety--staged-decision-6)); editor + persistence ([§9.2](livescripts-analysis-top-down.md#92-the-ladder), stage 10). The single load-bearing one to flag here: **whether native codegen holds the frame budget on a real S3** — if it doesn't, the IR seam makes the WASM fallback a backend swap, not a restart.
+
+## Answers — product-owner direction (2026-06-25)
+
+Decisions from the design discussion that produced this survey. These are *direction*, terse on purpose; the top-down expands each into full reasoning, an API/architecture, and a staged plan. (Mirrors the LED-driver bottom-up's product-owner-direction section.)
+
+1. **Execution = native, the standout.** Build our own **native-codegen** engine (ESPLiveScript-class speed, near-100%) — the differentiator; projectMM should stand out with something not done before (a native live-compiler bound to a real module system). *Not* a slow interpreter, *not* WASM-as-flagship.
+2. **No dead-ends, start small + beautiful (the LED-driver method).** Ship **one ISA backend first — Xtensa (classic ESP32 + S3)** — as a complete, blazing first increment, then grow. The **IR seam** (front-end → typed IR → per-ISA backend) is the no-dead-end guarantee: RISC-V (P4), ARM (Teensy), x86/ARM64 (desktop) each become a *new backend behind the unchanged IR*, never a rewrite. WASM/WAMR is the **per-target fallback** so no target is ever blocked.
+3. **The IR must NOT cost speed (hard constraint).** It is a *compile-time* representation that lowers to the *same* native instructions ESPLiveScript hand-emits — **zero per-pixel runtime overhead**, no interpreted layer. Equally fast as hpwit on Xtensa is non-negotiable; prove it by diffing generated instructions for a hot loop against hand-written Xtensa, and keep an `__asm__` escape hatch for the very hottest paths (as ESPLiveScript has).
+4. **Source language = a C-subset, "as close as possible" to the precompiled effect, with pragmatic simplifications.** The effect *body* (types like `uint8_t`/`uint32_t`/`lengthType`, nested `for`, integer + 64-bit math, `static_cast`, `RGB`, `hsvToRgb`, buffer writes) ports **near-verbatim** from a file like `RipplesEffect.h` (our reference effect — it exercises the hard cases: `float` trig `std::sqrt`/`std::sin`/`std::floor`, `std::memset`, 3D with `depth()`, two controls). The C++ *file/class ceremony* that buys nothing in a script (`#pragma`/`#include`/`namespace`, and — accepted as a pragmatic simplification — `class : public EffectBase`/`override`/the `controls_.addUint8` host-object dance) is **dropped or lightened**: the engine supplies the module scaffolding around the script. Target: porting an existing effect is the loop body verbatim + a handful of lines changed, *not* a rewrite, and *not* implementing a full C++ object model (inheritance/vtables/host-method binding) in the engine. **Not** a JS-subset (the ARTI-FX surface): JS's double-everything number model is the slow path *and* further from our C++ codebase, so it's worse on both speed and portability of existing effects.
+5. **Controls = minimal ceremony.** A scripted control is a near-plain top-level variable (e.g. `uint8_t speed = 60;` with a range annotation); the engine derives the MoonModule control + UI + persistence. Lighter than today's explicit `controls_.addUint8(...)`, copy-paste-friendly. (Exact annotation syntax is the top-down's call.)
+6. **Safety = staged, climb the tiers, don't pay upfront.** Ship the **cheap** tier first — array **bounds-checking** (a compare-branch per indexed access, low single-digit %, removable in a trusted/fast mode) + **watchdog / instruction budget** (kill a runaway loop, near-free). The **expensive** true-memory-sandbox tier (a script physically can't touch memory outside its arena — what WASM gives free, native can't cheaply) is **deferred**, reachable via the IR→WASM fallback only if a public script editor in the field shows the cheap tier isn't enough. Decided this way because the price of full sandboxing upfront isn't worth paying before evidence demands it.
+7. **MoonModule-first.** A scripted module **is** a MoonModule (role, controls, `loop()`, generic UI, lifecycle, robustness, live-reconfig). The script ⇄ MoonModule binding (reach the `Buffer`/`AudioFrame`/LUT via the producer/consumer pull pattern, no copy) is the projectMM value-add to design — no prior art copies cleanly.
+8. **General in core + specific in light.** One engine serves a domain-neutral core script (e.g. transform sensor data) *and* a scripted layout / effect / modifier / driver. **Effect is the first role.** `RipplesEffect.h` is the *reference* effect for the language design (it stresses float trig + 3D + memset), but it is **too complex for the hello-world spike** — the first running script must be trivial (e.g. fill the buffer one colour, or a single moving dot), proving the engine end-to-end before any real effect. Ripples is the *graduation* target, not the spike. For how an effect is structured for a newcomer, the [MoonLight effects tutorial](https://moonmodules.org/MoonLight/moonlight/effects-tutorial/) is a good read (a sibling project's step-by-step). The simple→Ripples progression is itself the start-small-grow staging applied to the demo.
+9. **Infinitely scalable.** Run *as many* live scripts concurrently as memory allows, exploiting PSRAM — each script is an independent compiled unit, the ceiling is free heap, not a fixed slot count. Many small scripted modules coexist; the device hosts what fits and degrades gracefully when it doesn't (the same scaling-to-available-memory contract the light pipeline already honours).
+10. **Inline execution by default; task is the exception.** A scripted effect/layout/modifier/driver runs *inline in the `Scheduler` tick*, called exactly like a compiled effect's `loop()` — one mental model, no cross-thread sync to reach the buffer/`AudioFrame`, and it runs on the render task's *internal-RAM* stack (fast). Task-per-script isn't blocked on memory (a task stack can live in PSRAM), but it pays two costs inline doesn't: per-task **scheduling overhead** (a context switch per task per frame — hundreds of tasks thrash the scheduler, a ceiling independent of memory), and a **PSRAM-backed stack is hot-path-slow** (PSRAM latency on every per-pixel local access, ~12 vs ~80 MB/s). So inline keeps the per-script stack fast and free, and PSRAM is spent on script *code + data* (decision 9) rather than per-script stacks. A pinned task is the narrow, documented opt-in *only* for a long/blocking *core* script (e.g. slow sensor I/O) that must not share the render tick — never the default, never for a pipeline script.
+11. **Sequencing: hybrid (depth-first to hello-world, then prove the seam on a 2nd ISA early).** Build the full vertical slice on Xtensa just far enough to run hello-world native (classic/S3), then *immediately* prove a minimal second-ISA backend (P4/RISC-V, or desktop x86-64) on that same slice — before deepening to controls/math/2D/3D. This retires the project's biggest risk (does the IR seam genuinely decouple front-end from backend?) at hello-world cost, when fixing it is cheap, rather than discovering a leak after six stages. Then deepen, primarily on Xtensa; the full second backend follows later.
+12. **Domain-neutral engine core, thin binding.** The engine (front-end + IR + backends) is domain-neutral core — it never depends on projectMM; the binding (`MoonLiveHost`/`MoonLiveEffect`) depends on the engine, one-directionally, through the engine's public API + a tiny injectable platform seam (`allocExec`/`alloc`). This clean layering is adopted *because it is what makes projectMM-as-a-library optimal* (the [*Domain-neutral core*](../../CLAUDE.md) principle applied), and is **never compromised** for any separability — if a separation would cost projectMM's speed/simplicity/hot-path/principles, it isn't done.
+## Out of scope for Stage 1
+
+Final VM-vs-JIT decision; the IR design; the language grammar spec; the web editor; per-engine benchmarking on real hardware; the MoonModule-binding mechanics; the sandboxing depth. All belong to the top-down document the prompt above generates.
diff --git a/docs/backlog/livescripts-analysis-top-down.md b/docs/backlog/livescripts-analysis-top-down.md
new file mode 100644
index 0000000..e729070
--- /dev/null
+++ b/docs/backlog/livescripts-analysis-top-down.md
@@ -0,0 +1,432 @@
+# MoonLive — live-script engine, top-down redesign
+
+> **Forward-looking research document — exception to CLAUDE.md present-tense rule.** **MoonLive** is projectMM's live-script engine (the Moon family: MoonLight, MoonDeck, MoonLive — author an effect as text, see it live). Stage-2 companion to [livescripts-analysis-bottom-up.md](livescripts-analysis-bottom-up.md) (read first: it deep-reads the ESPLiveScript fork, surveys WLED ARTI-FX, the embedded-VM field, and a portable WASM fallback, and ends with the product-owner-direction decisions this document expands). It reasons from projectMM's end goal — *author a script as text, run it on a running device on the next tick* — down to a reference architecture, a concrete API, a performance budget, and a staged spike plan. Modelled on [leddriver-analysis-top-down.md](leddriver-analysis-top-down.md). This expands the twelve product-owner decisions already made; it does not re-open them. All design is written fresh against projectMM's architecture — prior art (ESPLiveScript, ARTI-FX, MoonLight) is credited, not traced.
+
+## TL;DR
+
+- **MoonLive is our native-codegen engine** — a real compiler (lex → parse → AST → **IR** → native machine code), executed by direct function-pointer call, so a scripted effect runs at **near-100% native speed** in the render hot path. That speed, bound to a real module system, is projectMM's standout.
+- **One narrow boundary, three tiers.** The seam is `MoonLive::run()` (the analog of `LedDriver::push()`). Above it: a **platform-independent front-end** (tokenizer → parser → typed AST). Below it: a **typed IR** (the seam that lets one front-end feed many backends) → a **per-ISA backend** (Xtensa first). The IR is compile-time only — **zero per-pixel runtime cost**; it lowers to the same native instructions a hand-written backend would emit.
+- **Xtensa first, no dead-ends.** Ship the Xtensa backend (classic ESP32 + S3 — projectMM's first targets, the bench hardware) as a complete, blazing first increment. RISC-V (P4), ARM (Teensy), x86-64/ARM64 (desktop) are each *a new backend behind the unchanged IR* later — additive, never a rewrite. **WASM/WAMR is the per-target fallback** (IR→WASM is one more backend), so no target is ever blocked and a true sandbox stays reachable.
+- **Source language: a C-subset, "as close as possible" to a precompiled effect, with pragmatic simplifications.** The effect *body* ports near-verbatim from a `.h` (types, `for`, integer + float math, `static_cast`, `RGB`, `hsvToRgb`, buffer writes). The C++ *file/class ceremony* that buys nothing in a script (`#pragma`/`#include`/`namespace`; lightened: `class : public EffectBase`/`override`/the `controls_`-dance) is supplied by the engine. **Not** JS (doubles = slow + further from our code); **not** full C++ (object model = build + hot-path cost for zero-value boilerplate).
+- **Minimal-ceremony controls.** A control is a near-plain top-level variable with a range annotation; the engine derives the MoonModule control + UI + persistence.
+- **MoonModule-first.** A scripted module **is** a `MoonModule` (role, controls, `loop()`, generic UI, lifecycle, robustness, live-reconfig). The script ⇄ host binding reaches the `Buffer` / `AudioFrame` / LUT through the producer/consumer pull pattern — no copy. This is the projectMM value-add with no prior art to trace.
+- **Safety staged.** Ship cheap first — array **bounds-checking** (a compare-branch per indexed access, low single-digit %, switchable off) + a **watchdog / instruction budget** (kill a runaway loop, near-free). The expensive **true memory sandbox** (WASM gives it free; native can't cheaply) is deferred, reachable via the IR→WASM fallback only if a public editor in the field demands it.
+- **Staging spine = the [MoonLight effects tutorial](https://moonmodules.org/MoonLight/moonlight/effects-tutorial/) ladder.** Each tutorial rung (random pixel → control → trails → oscillators → 2D → 3D → audio) is one engine-capability spike with a concrete acceptance bar. **RipplesEffect.h is the language-fidelity *graduation test*** (does the C-subset handle float trig + 3D + `memset` near-verbatim?) — the hard case, not the hello-world.
+- **Load-bearing spike:** a minimal native Xtensa engine running the tutorial's hello-world (`setRGB(random16(N), blue)`) live on an ESP32-S3, hitting the frame budget *and* surviving a deliberately-bad script via cheap safety. If native-with-cheap-safety can't hold 16K×50FPS, the fallback is demote-to-WASM/WAMR — a backend swap behind the IR, not a restart.
+- **Cost, eyes open.** A real compiler is more work than adopting an off-the-shelf VM — weeks to the first beautiful Xtensa increment, each ISA backend its own increment later. The deliberate trade for native speed + a differentiator, mitigated exactly as the LED drivers were: spike-ordered, one complete increment at a time, the hard multi-target part deferred behind a seam that keeps it reachable.
+
+## 1. The goal, in detail
+
+A user writes a script — an effect, layout, modifier, driver, or a domain-neutral core rule (transform sensor data) — in a text box in the browser. The device compiles it and runs it as a first-class `MoonModule` **on the next tick**: no toolchain, no flash, no reboot. The same leap WLED took with ARTI-FX. The hard requirements (from the bottom-up):
+
+- **Blazingly fast** — the script runs in the render hot path at up to 16K+ lights × 50 FPS, so a slow per-pixel path is fatal. This is *the* constraint that picks native over interpreted.
+- **General in core + specific in light** — one engine, many `MoonModule` roles.
+- **Target order** — ESP32 classic + S3, then P4 + other ESP32, then Teensy, then desktop.
+- **Smart memory** — IRAM/PSRAM-aware via `platform::alloc`, no hot-path allocation, compile-once.
+- **Infinitely scalable** — run *as many* live scripts concurrently as memory allows, exploiting PSRAM. No fixed slot count; each script is an independent compiled unit and the only ceiling is free heap. A device hosts as many scripted modules (effects across layers, modifiers, core sensor rules) as fit, and degrades gracefully when they don't — the same scaling-to-available-memory contract the light pipeline already honours.
+- **Synced** — `Scheduler`-tick, live reconfig (no reboot), tick-atomic hot-swap, robust to add/delete/replace in any order.
+- **MoonModule-compatible** — controls, `loop()`, role, generic UI with zero per-script UI code.
+
+## 2. Why native, and why our own (expanding decision 1)
+
+The design space runs from interpreted to native, and the choice is driven by the hot-path requirement:
+
+- **AST-walk** (ARTI-FX): stores values as `double` and walks the tree per frame — which buys maximum flexibility and runs on any platform unchanged, at the cost of per-frame speed. That speed cost is what rules it out *for the 16K×50FPS hot path specifically* — not a flaw, a different trade than projectMM needs here. (For a slow core script off the hot path, that trade would be fine.)
+- **A bytecode VM is the middle ground** — a compact opcode stream run by a dispatch loop, far faster than tree-walking but paying a per-opcode dispatch tax every operation; at 16K×50FPS = 800K px/s that tax is the open question, not a given.
+- **Native JIT is the only thing that reaches ~100%** (ESPLiveScript's 85 fps ≈ hand-written C++ — hpwit's result). The differentiator we're after is the *combination*: native speed **and** multi-target **and** bound to a real module system. Each prior engine has part of it — ESPLiveScript has the native speed (Xtensa); ARTI-FX has the live-scripting product shape and runs anywhere (interpreted). Neither combines all three; that combination is the open space.
+- **WASM/WAMR** gets portability + a free sandbox but tops out at ~50% of native speed (WAMR-AOT) with a 200KB+ runtime — kept as the fallback, not the flagship, because native speed is what we're chasing.
+
+**Why our own, not "adopt WAMR":** *Industry standards, our own code.* We take the textbook compiler *shape* (lex → parse → AST → IR → native — the LLVM structure scaled to an MCU) and textbook *names*, written fresh against our architecture. An off-the-shelf runtime would make the engine someone else's and cap us at half speed; building means the language, the MoonModule binding, and the hot path are ours to make beautiful. The cost (a real compiler) is accepted and staged.
+
+**What would flip it to WASM-wholesale:** if the load-bearing spike shows native-with-cheap-safety *cannot* hold 16K×50FPS on an S3 (native machine code makes this unlikely), or if a public script editor proves to demand a true sandbox we can't afford natively. The IR seam makes either flip a backend swap, not a restart.
+
+## 3. Reference architecture
+
+### 3.1 The one narrow boundary
+
+Everything hangs off a single tiny seam — the analog of the LED doc's `LedDriver::push(std::span<...>)`:
+
+```cpp
+// A compiled script, ready to run. The host calls run() once per tick.
+class MoonLive {
+public:
+    bool ok() const;                 // compiled cleanly
+    const char* error() const;       // human-readable compile/runtime error, "" if none
+    void run();                      // execute the script's loop() — the hot path
+    void bind(MoonLiveHost& host);     // wire controls + host data (§3.4)
+    // lifecycle: free() releases code + data; recompile swaps tick-atomically (§3.6)
+};
+```
+
+Above the line is the portable front-end; below it the IR and the per-ISA backend. The host (a `MoonLiveModule`, §3.3) owns a `MoonLive` and calls `run()` from its `loop()`.
+
+### 3.2 The three tiers (where the IR seam lives)
+
+```
+   source text
+        │   ┌─────────────── platform-independent (one implementation, all targets)
+   tokenizer (lexer)
+        │
+   parser → typed AST
+        │
+   ┌────┴──────────── IR SEAM ──────────────┐   ← one front-end, many backends
+        │
+   typed IR  (SSA-ish, register/temp model, types resolved, bounds-check nodes inserted)
+        │   ┌─────────────── platform-bound (one backend per ISA)
+   backend: lower IR → native instructions
+        │       Xtensa first; RISC-V / ARM / x86-64 / ARM64 later; WASM as the fallback backend
+   encode → executable memory (platform::allocExec) → call as function pointer
+```
+
+- **Front-end (portable):** tokenizer + parser + AST live in `src/core/moonlive/` (domain-neutral). They know the *language*, never a CPU. One implementation serves every target.
+- **IR (the seam):** a small typed intermediate representation — the AST lowered to a flat list of typed operations with explicit temporaries, types resolved, and **bounds-check / safety nodes inserted here** (so every backend inherits safety for free). This is a *compile-time data structure*; it does not exist at run time.
+- **Backend (per-ISA):** lowers the IR to native instructions for one ISA. `src/platform/<target>/moonlive_backend_*.{h,cpp}` — the only place CPU-specific codegen lives, behind the platform boundary. A WASM backend (lower IR → `.wasm`, run by WAMR) is one such backend, the portable fallback.
+
+**Critical: the IR costs nothing at run time (decision 3).** It is consumed during compilation and discarded. The CPU executes only the final native instructions — identical in kind to hand-written assembly. *Matching native speed on Xtensa is non-negotiable.* The Xtensa backend must lower a hot loop to instructions that match hand-written Xtensa; the spike's acceptance bar **diffs generated instructions for the Ripples inner loop against a hand-emitted reference**, and an `__asm__` escape hatch covers the very hottest paths. If the IR ever costs hot-path speed, that's a backend bug to fix, not a tax to accept.
+
+### 3.3 A scripted module IS a MoonModule (decision 7)
+
+The one deliberate class hierarchy in the codebase is the module tree; a scripted module joins it like any other. `MoonLiveEffect` is a normal `EffectBase` whose `loop()` delegates to the compiled `MoonLive`:
+
+```cpp
+// src/light/moonlive/MoonLiveEffect.h  — a scripted effect is a first-class EffectBase
+class MoonLiveEffect : public EffectBase {
+public:
+    ModuleRole role() const override { return ModuleRole::Effect; }
+    const char* tags() const override { return "📝"; }   // scripted
+    Dim dimensions() const override { return engine_.declaredDim(); }  // from the script
+
+    void setup() override {                                // acquire the engine
+        engine_.bind(host_);                               // wire the host data (§3.4)
+    }
+
+    void onBuildControls() override {                      // DYNAMIC controls — re-runs when the script changes
+        controls_.addText("source", source_, kMaxSource);  // the script text (persisted, editable)
+        // The engine declares its controls as NEUTRAL data; the binding translates to controls_.
+        for (auto& c : engine_.declaredControls())         // {name,type,min,max,default} — no projectMM type
+            controls_.add(c.name, c.type, c.min, c.max);   // binding maps neutral → projectMM control (§3.5)
+    }
+
+    // onBuildState is the rebuild sweep: it fires on a source edit (recompile) AND on a
+    // grid/size change (the engine re-sizes its script buffers for the new dimensions).
+    // projectMM has no separate onSizeChanged — resize routes through onBuildState, so the
+    // dynamic-memory re-allocation rides the same hook every config change already uses.
+    void onBuildState() override {
+        engine_.compile(source_);                          // recompile if source changed
+        if (!engine_.ok()) { setStatus(engine_.error(), Severity::Error); return; }
+        engine_.allocForSize(width(), height(), depth());  // (re)alloc script data for the current size
+    }
+
+    void onUpdate(const char* name) override {             // cheap per-control reaction, no full rebuild
+        engine_.onControlChanged(name);                    // poke a running script's bound control
+    }
+
+    void loop() override {
+        if (engine_.ok()) engine_.run();                   // the hot path: native code over our buffer
+    }
+
+    void teardown() override {                             // release: free compiled code + script data
+        engine_.free();                                    // the "destructor" role — arenas returned to the heap
+    }
+};
+```
+
+The same shape gives `MoonLiveLayout` (role `Layout`, emits coordinates), `MoonLiveModifier` (role `Modifier`, remaps positions), `MoonLiveDriver` (role `Driver`, consumes the buffer), and a core `MoonLiveModule` (domain-neutral, e.g. a sensor rule). One engine, many roles — each a thin `MoonModule` subclass whose `loop()` is `engine_.run()`. The UI renders them generically (the `source` text control + the script-declared controls) with **zero per-script UI code** — exactly the module-tree payoff.
+
+**A scripted module implements the whole `MoonModule` lifecycle, not just `loop()`** — that's what makes it a first-class module and what answers dynamic controls / dynamic memory / cleanup:
+
+- **`onBuildControls()` — dynamic controls.** Re-runs whenever the module rebuilds, so a script that declares different controls (a new `@control` var) gets a different control set in the UI + persistence, live. The controls are *the script's*, not a fixed list.
+- **`onBuildState()` — dynamic memory on size change.** projectMM routes a grid/size change through `onBuildState` (the same rebuild sweep that applies every config change without a reboot), so MoonLive re-allocates its per-size script buffers here (`allocForSize`, PSRAM-first per §3.7). There is no bespoke `onSizeChanged` — using the existing hook means a scripted module resizes exactly like a compiled one, and inherits the no-reboot + robustness contracts for free.
+- **`setup()` / `teardown()` — acquire / release (the destructor role).** `teardown` frees the compiled code block + the script's data arena back to the heap, so deleting a scripted module returns all its memory — the lifecycle that makes "as many scripts as memory allows" (§3.7) safe to add *and remove* in any order.
+- **`onUpdate(name)` — cheap per-control reaction.** A control edit pokes the running script's bound variable without a full recompile (the fast path for a slider drag); only a *source* edit triggers the heavier `onBuildState` recompile.
+
+So the binding overrides the same hooks any compiled module does; the only difference is that each one delegates to the compiled `MoonLive` instead of hand-written C++.
+
+**Crucially, all of these lifecycle methods live in the *binding* (`MoonLiveEffect`, `src/light/moonlive/`), not in the engine.** `onBuildControls`/`onBuildState`/`onUpdate`/`teardown`, `EffectBase`, `ModuleRole`, `controls_` — every projectMM type — sit on the binding side of the §3.9 seam. The engine (`MoonLive`, `src/core/moonlive/`) sees none of them; the binding reaches it only through a **neutral public API**: `compile(source)`, `run()`, `free()`, `declaredControls()` → a plain list of `{name, type, min, max, default}` structs the engine owns, and `allocForSize(w, h, d)` → plain ints. The binding *translates* — it reads the engine's neutral `declaredControls()` and calls projectMM's `controls_.addUint8(...)`; it maps a grid resize to `allocForSize`. **The engine never takes a `ControlList`, a `Buffer`, or any projectMM type** — so the rich MoonModule lifecycle is entirely a property of the binding, and the engine stays the domain-neutral core §3.9 describes. (This is the seam working as intended: a different host writes its own binding with its own lifecycle against the same neutral engine API.)
+
+### 3.4 The host binding — script ⇄ MoonModule (decision 7, the value-add)
+
+Rather than a flat name→pointer registry (the host-binding shape surveyed engines share), projectMM uses a **MoonModule-aware `MoonLiveHost`** that exposes the producer/consumer data the script needs, by reference, no copy — the same pull pattern effects already use (`EffectBase::buffer()/width()/elapsed()`, [Layer.h:499-504](../../src/light/layers/Layer.h)):
+
+- **Buffer + geometry** — `width()`, `height()`, `depth()`, `channelsPerLight()`, `nrOfLights()`, `elapsed()`, and pixel writers `setRGB(i,c)` / `setRGBXY(x,y,c)` / `setRGBXYZ(x,y,z,c)` (the MoonLight tutorial's exact surface). These compile to direct loads/stores against `layer_->buffer()` — the **identity-mapping fast path** preserved (the script writes the real buffer, no intermediate copy).
+- **Controls** — the script's declared variables (§3.5) bind by reference so a UI control edit updates the running script live.
+- **Producer structs** — a core or audio script reads `AudioFrame` (level + 16-band spectrum) / sensor structs through the same `const`-pointer pull the C++ effects use (`AudioModule::latestFrame()`), so add/remove in any order returns a live or silent-default frame, never null (robustness).
+- **Built-ins** — `hsvToRgb`/`hsv`, `random16`, `sin`/`cos`/`sqrt`/`floor` (the trig Ripples needs), `millis`/`elapsed`, `fill`/`memset`. A small, fixed, recognizable library (FastLED-flavoured — the vocabulary effect authors already know), implemented once in the host and callable from any backend.
+
+The binding is generated *around* the script body — the script never writes `#include`, never reaches a raw pointer it shouldn't, and the host decides what's in scope per role (an effect sees the buffer; a core sensor script sees the sensor struct, not the LED buffer).
+
+### 3.5 Controls — minimal ceremony (decision 5)
+
+A control is a near-plain top-level variable with a range annotation; the engine derives the `MoonModule` control + UI + persistence:
+
+```c
+uint8_t speed = 50;      // @control 0..99      → controls_.addUint8("speed", …, 0, 99)
+uint8_t interval = 128;  // @control 1..254
+```
+
+The front-end collects annotated top-level vars during parsing and the engine exposes them as a neutral `declaredControls()` list (`{name, type, min, max, default}` — no projectMM type); the *binding* reads that list and calls the normal `controls_.add(...)` the rest of projectMM uses (§3.3) — so a scripted control is indistinguishable from a compiled one in the UI, persistence, and the live-reconfig sweep, while the engine stays projectMM-agnostic. Lighter than today's explicit `onBuildControls` + `addUint8` (the engine writes that for you), and copy-paste-friendly: the `uint8_t speed = 50;` line is *already* how RipplesEffect.h declares it. (Exact annotation syntax — `@control`, a trailing comment convention, or a `slider(0,99)` initializer — is settled in the spike; the principle is "declare the var, get the control".)
+
+### 3.6 Live reconfig + tick-atomic hot-swap (decision: sync)
+
+A re-pushed script must swap in on the next tick with the old one freed, no reboot, no crash mid-render — the no-reboot + robustness principles applied to *code*. The mechanism rides the existing `onBuildState()` rebuild sweep (the same one that makes every config change live): a `source` edit marks the module dirty; the next `onBuildState()` compiles the new source into a *second* `MoonLive`, and only on success swaps the active pointer (the old `MoonLive` freed after the swap), so a failed compile leaves the running effect untouched and surfaces the error in the module's status. `run()` reads the active pointer once per tick — the swap is a single pointer store between ticks, never mid-`loop()`.
+
+### 3.7 Memory placement + infinite scalability, routed through `platform::` (decisions: smart memory, infinitely scalable)
+
+Memory placement routes through the existing `platform::` seam, so it's one policy, not scattered per-target branches:
+
+- **Compiled code** → `platform::allocExec(size)` (a new seam: `MALLOC_CAP_EXEC` IRAM on ESP32; `mmap(PROT_EXEC)` on desktop; the platform decides, the engine doesn't know). PSRAM-capable on S3/P4 where the chip allows executable PSRAM.
+- **Script data** (globals, stack arena) → `platform::alloc` (PSRAM-first with internal fallback — already the project's policy).
+- **Compile-once** → a portable compiled-artifact format persisted to LittleFS, so a known-good script skips device-side recompile on boot. The native artifact is per-ISA; the portable fallback artifact is one file for all targets.
+
+**Infinite scalability — as many scripts as memory allows.** Each `MoonLive` (§3.1) is a **self-contained compiled unit**: its own code block (from `allocExec`) and its own data arena (from `alloc`), owned by the binding module that holds it (`MoonLiveEffect`, the core `MoonLiveModule`, …), freed when that module is deleted. Nothing is shared or fixed-slot — so running N scripts is just N independent `MoonLive`s, and **the only ceiling is free heap**, not an arbitrary limit. This falls out of the architecture for free:
+
+- **The module tree already hosts N modules.** A scripted module is a `MoonModule` (§3.3); the tree puts no cap on how many effects a Layer holds or how many peripherals System hosts. Ten scripted effects across layers + a scripted modifier + two core sensor rules are just twelve modules — the UI, persistence, and `Scheduler` handle them like any other.
+- **PSRAM is where it scales.** On an S3/P4 (8 MB PSRAM) the compiled code + data arenas live in PSRAM (`alloc` is PSRAM-first), so the device holds *far* more scripts than internal RAM alone would allow — exploiting PSRAM is exactly what lifts the ceiling from "a handful" to "as many as the script sizes sum to under PSRAM." A non-PSRAM classic ESP32 holds fewer (internal heap only) — correct and honest, the same internal-vs-PSRAM split the rest of the system has.
+- **Graceful degradation when full.** When the next script won't fit, the device does what the light pipeline already does at the memory edge ([architecture.md § scaling to available memory](../architecture.md#scaling-to-available-memory)): the compile/bind fails cleanly, the module reports a "not enough memory" status, and everything already running keeps running — no crash, no reboot (the robustness + no-reboot principles). The cap is reached by *degrading*, never by bricking.
+- **The hot-path cost is per-*running* script, not per-*loaded* script.** Memory scales with how many scripts are loaded; tick time scales with how many are *enabled and rendering*. A device can hold a large library of scripts in PSRAM and run only the active ones, so "infinitely scalable in memory" doesn't mean "infinitely slow" — a disabled scripted module costs RAM but no tick time (and the disable-releases-resources backlog item, when it lands, lets it cost neither).
+
+### 3.8 Execution model — inline by default, task as the exception (decision: sync)
+
+**A script runs inline in the `Scheduler` tick by default — not in its own task.** A scripted effect's `loop()` is called exactly like a compiled effect's `loop()`, on the render task, each tick. The task-per-script model some engines use fits when a script *is* the top-level loop and owns the device; in projectMM a scripted module is one `MoonModule` among many, called from the same single-threaded render loop as every compiled module, so inline is the consistent shape. Three reasons make inline the default, not just a choice:
+
+- **Consistency.** A scripted effect behaves identically to a compiled one — same call site, same hot-path rules, same `Scheduler`. One mental model, and the UI/persistence/lifecycle treat it like any other module.
+- **It sidesteps two costs task-per-script can't.** Task stacks *can* live in PSRAM (`xTaskCreateWithCaps`, `MALLOC_CAP_SPIRAM`), so task-per-script is not blocked on *internal* RAM — but it pays two costs inline doesn't: (a) **scheduling overhead** — each task is a TCB + scheduler bookkeeping + a context switch; hundreds of tasks all wanting to run each frame thrash the scheduler instead of rendering, a ceiling that has nothing to do with memory; and (b) **a PSRAM-backed task stack is hot-path-slow** — a per-pixel inner loop touching locals on a PSRAM stack pays the PSRAM access penalty (~12 MB/s vs internal ~80 MB/s throughput) on every access, exactly what a 16K×50FPS loop can't afford. An inline script runs on the render task's *internal-RAM* stack, fast, with no per-task scheduler cost. So PSRAM scales the script's *code + data* (§3.7), and inline keeps the per-script *stack* fast and free — the two pull together, where task-per-script would put them in tension.
+- **No cross-thread sync.** An inline script reads `buffer()` / `elapsed()` / `AudioFrame` from the thread that owns them — no locks, no race, no memory barriers. A task touching the shared buffer while the render task reads it is exactly the data race the single-threaded hot path avoids by design.
+
+An inline script obeys the no-blocking-hot-path rule (it can't `delay`); a runaway loop is caught by the instruction-budget watchdog (§4), so a bad inline script degrades, it doesn't wedge the tick.
+
+**The exception — a pinned task — is narrow and opt-in.** A *core* script that genuinely blocks or runs at its own cadence and must **not** share the render tick (e.g. a slow I²C sensor transaction, or a rule that ticks at 1 Hz independent of render) may opt into its own task, pinned opposite the render core. This is a per-module, documented exception for off-hot-path core work — never the default, and never for a script in the render pipeline (effect/layout/modifier/driver), which is always inline. Two execution paths exist, but the inline one is the default and the task one earns its place case by case.
+
+### 3.9 Layering — a domain-neutral engine core, a thin binding (decision: domain-neutral core)
+
+The tiers above already separate cleanly along projectMM's own *Domain-neutral core* principle, and the layering is held to it deliberately:
+
+- **The engine core (MoonLive) is domain-neutral.** "MoonLive" is the engine's *name*, not a coupling — the front-end (`src/core/moonlive/`) and the IR + backends (`src/platform/<target>/moonlive_backend_*`) know the *language* and the *ISA*, never `Buffer`, `EffectBase`, the module tree, or anything light- or projectMM-specific. The core's only outward contract is a tiny injectable platform seam (`platform::allocExec` / `alloc` / `millis`) — a handful of functions, not a reach into projectMM's full platform layer.
+- **The binding is the only projectMM-coupled layer**, and it is *thin*. `MoonLiveHost` + `MoonLiveEffect`/`MoonLiveLayout`/… (`src/light/moonlive/`, with a core `MoonLiveModule` for sensor rules) sit **on top of** the engine's public API and consume it; they never reach into engine internals.
+- **Dependency direction is one-way:** the binding depends on the engine; the engine never depends on the binding (or on projectMM). The engine does not `#include` projectMM; projectMM `#include`s the engine.
+
+Why this matters concretely: **it is what makes projectMM-as-a-library optimal.** A clean library needs exactly this — a domain-neutral core with a one-directional dependency and a thin, replaceable binding, so the whole stack composes without circular dependencies or hidden coupling. So this layering is not extra structure for its own sake; it is the *Domain-neutral core* + *Complexity lives in core, domain modules stay simple* principles applied, and it is the same boundary projectMM needs to be a well-formed library.
+
+A true property of that boundary, worth stating: because the core (MoonLive) knows only the *language* and the *ISA* — never LEDs, buffers, or projectMM — the same front-end + IR + backends would serve a **wholly different host**: a different output device, or a different application entirely (a script that drives a display, reads a keypad, computes a result). Such a host writes its own thin binding against the same public API + platform seam; nothing in the core changes. The IR seam is what makes that portable, too — the host targets whatever chip it likes by writing one backend behind the unchanged IR. This is a *consequence* of building the core domain-neutral for projectMM, not a goal we design toward — but it is real, and it is the mark of a well-factored core: it doesn't care what you point it at.
+
+**Hard constraint: the layering is justified entirely by projectMM's optimality — and that optimality is never compromised for the layering.** The clean engine/binding split is adopted only because it makes projectMM architecturally sound, fast, and CLAUDE.md/architecture.md-compliant (domain-neutral core, data-over-objects on the hot path, the platform boundary). If any separability would cost projectMM's optimality — a slower hot path, a heavier binding, an abstraction the engine doesn't need — it is **not** done. The binding stays thin and the core stays neutral *because that is the optimal projectMM design*, full stop; nothing in the layering is bent toward a use beyond projectMM.
+
+## 4. Safety — staged (decision 6)
+
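+A user-facing editor means a bad script must degrade, not brick. There are two distinct failure surfaces — compile time and run time — and they need different defenses; the runtime defense is itself staged into a cheap tier (shipped first) and an expensive tier (deferred):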
+
+- **Compile-time (parser / analysis).** A malformed script must be *rejected cleanly at parse*, never crash the compiler. The `fix-warnings` fork's null-deref is exactly this class: a nested external-call argument produced an AST node missing its children, and the compiler dereferenced them unconditionally. The defense is **AST/analysis validation** — the parser checks node shape (children present, types resolved) and emits a diagnostic instead of dereferencing a null, backed by a **regression test** per malformed input (the `fix-warnings` case is the first such test). This is a correctness property of the front-end, not a runtime cost.
+- **Runtime — cheap, ship first.** Once a script *compiles*, a bad *value* at run time must degrade, not brick: (a) **Array bounds-checking** — the IR inserts a compare-branch before each indexed access (a clamp or skip on out-of-range), e.g. a `setRGB(i, …)` with `i` past the buffer. Low single-digit % overhead, inserted at the IR so every backend gets it, and **switchable off** in a trusted/fast mode for vetted built-in scripts. (b) **Watchdog / instruction budget** — a per-tick instruction or time budget that aborts a runaway `while(1)` (near-free; the task WDT already does most of it). Together these catch the common *runtime* failures — out-of-range index, infinite loop — at low cost.
+- **Expensive, deferred.** A *true* memory sandbox (the script physically cannot touch memory outside its arena) is what native can't cheaply provide. Don't build it first — it's reachable via the IR→WASM fallback (suspect scripts compiled to the sandboxed backend) only if a public editor in the field shows the cheap tier isn't enough. Safety is a ladder climbed on evidence, not a wall built before any script runs.
+
+## 5. The language — a C-subset as close as possible (decision 4)
+
+### 5.1 The model
+
+A C-subset, not full C++, not JS. The type model is exactly what real effects use: `uint8_t`/`uint16_t`/`uint32_t`/`int`/`lengthType`/`nrOfLightsType` integers (with 64-bit where overflow matters — Rainbow's `uint64_t` phase), `float` (Ripples' trig), `bool`, `char`, a `RGB`/`CRGB` struct, and arrays (incl. multi-dim). Control flow: `if/else`, ternary, `while`, C-style `for`, `break`/`continue`, `return`; user functions; `static_cast` (or C casts). Grammar: **hand-written recursive-descent** — the recognizable textbook default, what most embedded script languages use; a PEG is the alternative but recursive-descent is simpler to make fast and to emit good errors from. Built-ins: the fixed host library (§3.4).
+
+### 5.2 What's dropped vs lightened (the pragmatic simplifications)
+
+- **Dropped** (file ceremony, zero value in a script): `#pragma once`, `#include`, `namespace`. The engine supplies the surrounding module.
+- **Lightened** (the C++ object model): no `class : public EffectBase`, no `override`, no `controls_.addUint8(...)` host-object dance. The engine synthesizes the `MoonLiveEffect` wrapper (§3.3) around the script body; the role/`dimensions`/controls come from light annotations (§3.5) and the script's `loop()`.
+- **Kept verbatim** (the part you iterate on): types, the `loop()` body, all the math, `static_cast`, `RGB c = hsvToRgb(...)`, the loops.
+
+**Why not full C++:** supporting `class`/inheritance/`override`/host-method-binding means implementing a C++ object model (vtables, member-reference binding) in the engine — build cost up front, and the object machinery is the very "object graph in the hot path" the architecture forbids. The wrapper has no runtime value; let the engine write it.
+
+**Why not JS** (the ARTI-FX surface): JS's number model is doubles-everywhere — the per-pixel cost that makes ARTI-FX flexible-but-not-fast — *and* it's further from our C++ effects, so porting an existing effect is harder, not easier. A C-subset is both faster and closer to the source.
+
+### 5.3 RipplesEffect.h → scripted form (the language-fidelity test)
+
+`RipplesEffect.h` is the **graduation test** for the language (float trig + 3D + `memset` + two controls — the hard case, deliberately not the hello-world). The body must port near-verbatim:
+
+**Today (`src/light/effects/RipplesEffect.h`, the C++):**
+
+```cpp
+class RipplesEffect : public EffectBase {              // ← dropped (engine supplies)
+    const char* tags() const override { return "💫🟦🦅"; }   // ← lightened → annotation
+    Dim dimensions() const override { return Dim::D3; } // ← lightened → annotation
+    uint8_t speed = 50;                                 // ← kept (becomes a control)
+    uint8_t interval = 128;
+    void onBuildControls() override {                   // ← dropped (derived from the vars)
+        controls_.addUint8("speed", speed, 0, 99);
+        controls_.addUint8("interval", interval, 1, 254);
+    }
+    void loop() override {                              // ← KEPT VERBATIM (the body)
+        uint8_t* buf = buffer(); … std::memset(buf, 0, nrOfLights()*cpl);
+        const float rippleInterval = 1.3f * … * std::sqrt((float)h);
+        for (lengthType z=0; z<d; z++) for (lengthType x=0; x<w; x++) {
+            const float dist = std::sqrt(dx*dx+dz*dz)/9.899f*(float)h;
+            const lengthType y = (lengthType)std::floor((float)h/2*(1+std::sin(phase)));
+            const RGB c = hsvToRgb(hue,255,255);
+            … px[0]=c.r; px[1]=c.g; px[2]=c.b;
+        }
+    }
+};
+```
+
+**Scripted (the target — body unchanged, ceremony gone):**
+
+```c
+// @effect dim=3D                          // role + dimensions, one line
+uint8_t speed = 50;       // @control 0..99
+uint8_t interval = 128;   // @control 1..254
+
+void loop() {                              // ← the C++ loop body, near-verbatim
+    uint8_t* buf = buffer();
+    lengthType w = width(), h = height(), d = depth();
+    uint8_t cpl = channelsPerLight();
+    if (w<=0 || h<=0 || d<=0) return;
+    memset(buf, 0, nrOfLights()*cpl);
+    float rippleInterval = 1.3 * ((255.0-interval)/128.0) * sqrt((float)h);
+    if (rippleInterval < 0.01) return;
+    float timeInterval = (float)elapsed() / (100.0-speed) / 6.4;
+    float cx = (float)(w-1)/2, cz = (float)(d-1)/2;
+    nrOfLightsType wh = (nrOfLightsType)w*h;
+    for (lengthType z=0; z<d; z++)
+      for (lengthType x=0; x<w; x++) {
+        float dx=(float)x-cx, dz=(float)z-cz;
+        float dist = sqrt(dx*dx+dz*dz)/9.899495 * (float)h;
+        float phase = dist/rippleInterval + timeInterval;
+        lengthType y = (lengthType)floor((float)h/2 * (1+sin(phase)));
+        if (y<0 || y>=h) continue;
+        uint8_t hue = elapsed()/50 + x*3 + z*7;
+        RGB c = hsvToRgb(hue,255,255);
+        setRGBXYZ(x, y, z, c);              // replaces manual idx + px[0..2]
+      }
+}
+```
+
+The diff is exactly the ceremony: gone are `class`/`override`/`onBuildControls`/`#include`/`namespace`/`std::`-qualification and the manual buffer-index arithmetic (→ `setRGBXYZ`). The math, the trig, the loops, the types — verbatim. **If the engine can compile this at native speed, the C-subset decision is proven.** (Float-trig native codegen is the part to validate — see the perf budget.)
+
+## 6. Testing — the engine's biggest structural advantage
+
+A live-script engine is one of the **most testable things projectMM can build**, and projectMM's two-tier test framework ([testing.md](../testing.md): doctest unit tests + JSON scenarios, each run in-process *and* live) maps onto it almost perfectly. This is a genuine edge: the bottom-up's structural note that ESPLiveScript ships `.ino` examples and no unit suite isn't a knock on it — it's the gap our framework closes. **Every live-script feature gets pinned by a test, back to back**, because two properties make a compiler exceptionally test-friendly:
+
+1. **Every compiler stage is a pure input→output function.** Lex, parse, IR-lower, codegen each take a known input and produce a deterministic output — the easiest thing in the world to unit-test, with no hardware and no flakiness.
+2. **A script's *result* is deterministic and exactly assertable.** A known script over a known grid at a known `elapsed()` produces an exact buffer — byte-for-byte checkable. There is no "looks about right"; there is a golden buffer.
+
+### 6.1 Unit tests (`test/unit/core/unit_moonlive_*.cpp`, doctest)
+
+The compiler front-end and IR are domain-neutral core (§3.9), so they unit-test on the desktop with zero hardware:
+
+- **Tokenizer / parser** — source string → expected token list / AST shape; every language construct (types, `for`/`if`/ternary, functions, arrays, `static_cast`, struct access) and every *error* (unterminated string, type mismatch, undeclared var) pinned to an expected diagnostic. The fuzz-class bug the `fix-warnings` fork fixed (a nested external-call arg) is exactly a parser unit test — the regression that would have caught it for free.
+- **IR** — AST → expected IR for representative snippets; the bounds-check / safety nodes (§4) asserted present where the IR should insert them.
+- **Codegen (host backend)** — the **desktop/x86-64 backend** is itself a test asset: it runs in-process, so a compiled script *executes during a unit test* and its output buffer is asserted directly. A script that fills blue → assert every pixel is `(0,0,255)`; Ripples at a fixed `elapsed()` → assert the exact lit-column pattern. No device needed to test *the language*; the device tests only *the native ISA backend*.
+- **Determinism harness** — the existing `setTestNowMs` clock-override seam (the same one scenarios use) lets a time-dependent script be tested at a fixed tick, so an animated effect is a deterministic assertion, not a guess.
+
+### 6.2 Scenario tests (`test/scenarios/{core,light}/scenario_moonlive_*.json`)
+
+Scenarios exercise a scripted module *as a wired `MoonModule`* — the integration layer unit tests don't reach:
+
+- **The MoonModule binding** — `add_module MoonLiveEffect`, `set_control source=<script>`, `set_control speed=…`, `measure` → assert the module renders, the control edits live, the buffer is non-zero. A scripted effect is tested the same way a compiled effect is, through the same runner.
+- **Live reconfig + tick-atomic hot-swap (§3.6)** — a scenario pushes a new `source` mid-run and asserts the swap is clean (old freed, new rendering, no crash). Push a *broken* script → assert the prior effect keeps running and the status reports the compile error (the robustness contract).
+- **Robustness (the hard rule)** — add/delete/replace a scripted module in any order, at any grid size, including 0×0×0; a scripted effect alongside compiled ones; ten scripts at once (the scalability claim, §3.7, becomes a measured scenario, not a hope). A discovered crash drives a new scenario that pins the fix — the same regression rule the rest of projectMM follows.
+- **Performance bounds** — a scenario carries `"bounds": {"fps": …}`, so script-Ripples-vs-compiled-Ripples (§7's headline number) is an *enforced* bound that fails CI on regression, not a one-off measurement. The perf budget becomes a guardrail.
+- **Two tiers for free** — every scenario runs in-process (desktop backend, the CI workhorse) *and* live against a real S3/P4 over REST (the native backend). The same JSON pins the language on desktop and the ISA backend on hardware — the cross-check the LED-driver doc gets from a logic analyzer, we get from running the *same* script on two backends and asserting the *same* buffer.
+
+### 6.3 Why this compounds the staged plan
+
+Each staging rung (§9.2) lands with its tests: the hello-world spike ships its parser + codegen + render-output unit tests and a "scripted random-pixel" scenario; the controls rung ships a control-binding scenario; Ripples graduation ships the golden-buffer assertion + the perf bound. So "test all live-script features back to back" isn't a phase bolted on at the end — **every increment is a tested increment**, and the suite grows rung by rung. By the time the engine is complete, every language feature, every binding, every role, and the scalability + hot-swap + robustness contracts are each pinned by a unit test or scenario that runs on every commit. That body of tests is also what lets the worker-bee agents implement against a pinned spec (the *Industry standards, our own code* method) — the behaviour is fixed by tests first, so the implementation is independent by construction.
+
+## 7. Performance budget (16K LEDs × 50 FPS, ESP32-S3)
+
+The frame budget at 50 FPS is **20 ms/tick** for everything (render + drivers + network + system). A 16K effect like Ripples touches each lit column once; Rainbow touches all 16K pixels. Reference points from `scenario_perf_full` (in [performance.md](../performance.md)): the *compiled* heavy effect (Noise) is ~50 ms at 16K on the S3 (≈20 FPS — already the bottleneck), the light effect (Checkerboard) ~8 ms (≈128 FPS). So:
+
+- **Native script ≈ compiled.** A native-codegen script must land within ~10% of the equivalent compiled effect (the acceptance bar below) — that's the whole point of native, and the spike's headline measurement (script-Ripples µs/tick vs compiled-Ripples µs/tick, same grid).
+- **Float trig is the watch-item.** Ripples' per-column `sqrt`/`sin` dominate its cost; the S3 (LX7) has an FPU, so native float is real hardware ops — but the codegen must emit FPU instructions, not a soft-float call. The spike measures this directly.
+- **Bytecode-VM comparison (the fallback's ceiling).** A VM pays per-opcode dispatch; at 800K px/s (16K×50) for an all-pixels effect that tax is the question the bottom-up flagged. The spike measures a VM path too (even a throwaway one) so the native-vs-fallback gap is a number, not a guess. If native holds and VM doesn't, native is vindicated; if both hold, the fallback is comfortable.
+
+**Acceptance bar:** native script-Ripples within ~10% of compiled Ripples at 16K on the S3, float trig on the FPU, bounds-checking on, inside the 20 ms budget with headroom for drivers. Miss it → investigate codegen quality (the `__asm__` escape hatch + IR-lowering fixes) before falling back.
+
+## 8. Hot-path do / don't checklist
+
+**Don't** (in the generated code / the `run()` path):
+- No heap allocation during `run()` — the script's data arena is allocated at compile/bind, reused every tick.
+- No per-pixel function-call dispatch into the host for the common writers — `setRGBXY` lowers to inline loads/stores against the buffer, not a `call`.
+- No soft-float where the FPU exists — emit FPU ops on S3/P4; integer-preferred for per-light colour work (the project rule), float only for the wavefront math, exactly as the compiled effects do.
+- No blocking — a script can't `delay`; a runaway loop hits the instruction budget.
+
+**Do:**
+- Bind the buffer pointer + geometry once per tick, then loop in native code (the identity-mapping fast path — the script writes `layer_->buffer()` directly).
+- Insert bounds-checks at the IR so they're uniform and removable as one switch.
+- Keep the host built-in library small, fixed, and inlinable.
+- Provide the `__asm__` escape hatch for the hottest inner loop, so a power user is never capped by codegen quality.
+
+## 9. Staged plan — the MoonLight tutorial ladder as the spine
+
+### 9.1 Sequencing: depth-first vs broad-first → a hybrid
+
+The first sequencing question is **depth-first** (build the whole engine on Xtensa through a real effect, *then* add the second ISA) vs **broad-first** (a trivial example on Xtensa *and* RISC-V early, then deepen both). Each retires a different risk:
+
+- **Depth-first** is the fastest path to a visible bench result, but it defers the project's single biggest unknown — *does the IR seam genuinely decouple the front-end from the backend, or did it quietly leak Xtensa assumptions?* — until a second ISA is built, late. That is exactly the "back to the drawing board" dead-end the IR seam exists to prevent; validating it last is backwards.
+- **Broad-first** over-corrects: it stands up the hardest part (a second codegen backend) before the language is even proven pleasant to write effects in — a lot of compiler plumbing before anything user-visible, and P4 is only the third target.
+
+**The hybrid takes broad-first's one real insight without its cost.** Build a *complete vertical slice* on Xtensa just far enough to run the hello-world native (front-end → IR → Xtensa backend → `allocExec` → call), then **immediately prove a minimal second-ISA backend on that same slice** — *before* deepening to controls/math/2D/3D. A hello-world exercises only a sliver of the IR, so a second backend for *just that* is cheap, and it tests the load-bearing claim (the seam decouples) when fixing it is still cheap. Every later stage then rests on a seam that's been *demonstrated* to decouple, not trusted to. (Pragmatic note: the second ISA for this proof is **P4/RISC-V** if a P4 is on the bench, else the **desktop x86-64 backend** — a different ISA than Xtensa either way, so it validates the seam, and the desktop backend is useful anyway for host tests. P4 is the most on-target; desktop is the most convenient.)
+
+### 9.2 The ladder
+
+The [MoonLight effects tutorial](https://moonmodules.org/MoonLight/moonlight/effects-tutorial/) is a ready-made *start-small-grow* curriculum (random pixel → control → trails → oscillators → 2D → 3D → audio → Cosmic Noise). Each rung is **one engine-capability spike** with a concrete acceptance bar. **RipplesEffect.h is the graduation test** (the hard real effect, after the 3D rung). Each step is a normal small commit; the multi-target part is sequenced per §9.1 — the *seam* is proven on a second ISA at Stage 0.5, but the *full* second backend (all stages) comes later, opportunistically.
+
+| Stage | Capability proven | Acceptance bar (the spike) |
+|---|---|---|
+| **0. Load-bearing spike (Xtensa)** | Front-end → IR → **Xtensa** backend → `allocExec` → call. The hello-world: `setRGB(random16(N), blue)`. | Runs live on an **ESP32-S3**, lights a random pixel each tick, inside the frame budget; a deliberately-bad script degrades via cheap safety, no crash. **If this can't hit native speed, fall back to WASM/WAMR — a backend swap behind the IR.** |
+| **0.5. Seam-proof (2nd ISA, early)** | The IR genuinely decouples: a *minimal* **RISC-V (P4)** backend — or the **desktop x86-64** backend — runs the *same* hello-world behind the *same* IR. | The same script through the same front-end/IR path renders **equivalent output on both backends** (same lit pixel each tick), and **the second backend is added without changing a line of the front-end or IR** — only new backend code. That "front-end + IR untouched" is the no-dead-end proof, paid for at hello-world cost. If the seam leaked (the IR needed backend-specific edits), fix it now — cheap, before anything is built on it. |
+| **1. Controls** | Minimal-ceremony control binding (annotated var → `MoonModule` control + UI + persistence + live edit). | A `speed` slider appears, edits the running script live, persists across reboot. |
+| **2. Buffer read-modify-write** | Trails / fade — read the buffer, fade, write. | The tutorial's trail effect runs; a moving dot with a fading tail. |
+| **3. Math + time** | `float`/fixed math, `elapsed()`, oscillators (`beatsin`/`sin`). FPU codegen on S3. | A smooth oscillator effect; float trig measured on the FPU, within budget. |
+| **4. 2D** | `width/height`, `setRGBXY`, 2D addressing. | A 2D tutorial effect at the real grid size. |
+| **5. 3D** | `depth`, `setRGBXYZ`, 3D addressing. | A 3D tutorial effect. |
+| **6. Graduation: RipplesEffect** | The full C-subset on a real hard effect — `sqrt`/`sin`/`floor`, `memset`, 3D, two controls — ported **near-verbatim** (§5.3). | Script-Ripples within ~10% of compiled Ripples at 16K on the S3. **Proves the language decision.** |
+| **7. Full 2nd backend** | Deepen the second ISA from Stage 0.5's minimal proof to the full Stage 1–6 surface (Ripples on **P4**). | A tutorial step + Ripples run on the **ESP32-P4** via the RISC-V backend; front-end/IR untouched. |
+| **8. WASM fallback backend** | IR → `.wasm` → WAMR. | A target with no native backend yet runs the same script through WAMR; one artifact, sandboxed. Validates the fallback is real. |
+| **9. More roles** | `MoonLiveLayout`, `MoonLiveModifier`, `MoonLiveDriver`, core `MoonLiveModule` (sensor). | A scripted layout emits coordinates; a scripted modifier remaps; a core script transforms an `AudioFrame`. One engine, many roles. |
+| **10. Editor + delivery** | Scripts in LittleFS, pushed via REST/WS, compile-on-device (and optionally compile-on-host/web for the portable artifact). | Author a script in the browser, push, see it live — the live-edit loop, projectMM-native. |
+| **Later targets** | ARM (Teensy), x86-64/ARM64 (desktop) full backends. | Each a new backend behind the IR, when the target is in scope. |
+
+**Acceptance bar for every step:** runs on real hardware at the target grid, within the frame budget, surviving a bad script; the front-end + IR stay unchanged across backends (the no-dead-end invariant, *proven* at Stage 0.5); a compiled-vs-scripted timing is recorded. The fallback at any speed-failure is demote-to-WASM, never redesign.
+
+## 10. Product-owner decisions (carried from the bottom-up, expanded here)
+
+Settled (bottom-up § *Answers — product-owner direction*), expanded in the sections above:
+
+1. **Native engine, our own** — §2. The standout; WAMR is fallback, not flagship.
+2. **Xtensa-first, IR seam, no dead-ends** — §3.2, §9. Start small + beautiful; multi-target stays reachable.
+3. **IR costs zero at run time** — §3.2. Matching hpwit's speed on Xtensa is non-negotiable; proven by instruction-diff + `__asm__` escape.
+4. **C-subset, as close as possible, pragmatic simplifications** — §5. Body verbatim; ceremony supplied by the engine; not JS, not full C++.
+5. **Minimal-ceremony controls** — §3.5. Declare the var, get the control.
+6. **Staged safety** — §4. Cheap bounds+watchdog first; true sandbox deferred to the WASM fallback.
+7. **MoonModule-first** — §3.3, §3.4. A scripted module is a `MoonModule`; the binding is the value-add.
+8. **General core + specific light, effect first** — §3.3, §9. Tutorial hello-world is the spike; Ripples is the graduation test; other roles follow.
+9. **Infinitely scalable** — §3.7. As many scripts as memory allows, PSRAM-exploiting; each `MoonLive` self-contained, ceiling = free heap.
+10. **Inline execution by default, task the exception** — §3.8. A scripted effect runs in the `Scheduler` tick like a compiled one (consistent, near-zero overhead — what makes scalability real, no cross-thread sync); a pinned task is the narrow opt-in for a long/blocking core script.
+11. **Sequencing: hybrid** — §9.1. Full Xtensa vertical slice to hello-world, then prove the IR seam on a second ISA *early* (Stage 0.5) before deepening.
+12. **Domain-neutral engine core, thin binding** — §3.9. Engine never depends on projectMM; the clean layering is what makes projectMM-as-a-library optimal, and is never compromised for any separability.
+
+## 11. Prior art & credits
+
+This design stands on work others did first; per *Industry standards, our own code*, we study it, credit it by name, and write our own.
+
+- **ESPLiveScript — Yves Bazin (hpwit).** The native-codegen approach this whole redesign builds on is his. ESPLiveScript demonstrates the thing that matters most here: a from-scratch C-like compiler — a complete tokenizer, parser, register allocator, Xtensa code generator, and a save/load compiled-binary path, header-only — that JIT-emits native Xtensa and runs a script at near the speed of hand-written C++ on an ESP32 (85 fps on a 12,288-LED panel where Lua managed 3 and Gravity 10). Our redesign's central choice — go native, not interpreted — is taken directly from that result; what we add is the IR seam (so the same approach reaches RISC-V/ARM/desktop) and the MoonModule binding. Where the bottom-up notes structural costs (global state, no IR, large files), those are observations a *rewrite for a different goal* must make, not a verdict on the original — ESPLiveScript does its job, fast, and is the reference precisely because it works.
+- **ARTI-FX / ARTI — ewowi.** The author of this analysis also wrote ARTI-FX (the interpreted-effects runtime in WLED MoonModules, on the PEG-grammar ARTI interpreter). It is the prior projectMM-family answer to the same problem and the source of hard-won lessons carried here: the `renderFrame`/`renderLed` per-frame/per-LED split, the host-binding shape (`arti_external_function` / `arti_*_variable`), and — by being the AST-walking, double-everything design — the concrete demonstration of *why* the hot path wants native or VM execution rather than tree-walking. ARTI-FX proved the live-scripting *idea* works end-to-end in this ecosystem (load a script, run it, edit live); this redesign trades its interpreter for native speed, but inherits its product shape and its lessons.
+- **MoonLight — MoonModules.** The [effects tutorial](https://moonmodules.org/MoonLight/moonlight/effects-tutorial/) is the staging spine of §9, and its `setRGB`/`setRGBXY`/`setRGBXYZ` + `addControl` surface is the model for the host binding (§3.4–3.5).
+
+Credits also live in the bottom-up's *Prior art & credits* and the digest [history/hpwit-ESPLiveScript.md](../history/hpwit-ESPLiveScript.md).
+
+### Public credit — to lift into `docs/moonmodules/core/MoonLive.md` when the module spec is written
+
+The credits above are the analysis's internal record. The block below is the **user-facing** version for the eventual `MoonLive.md` "Prior art" section. Drop it in when MoonLive ships; it matches the house style of the other modules' Prior-art sections (e.g. [AudioModule.md](../moonmodules/core/AudioModule.md), [LcdLedDriver.md](../moonmodules/light/drivers/LcdLedDriver.md)).
+
+> MoonLive's native-codegen approach — compile a small C-like language straight to machine code and call it as a function, so a live-authored effect runs at near hand-written speed — was pioneered by **Yves Bazin (hpwit)** in **[ESPLiveScript](https://github.com/hpwit/ESPLiveScript)**: a from-scratch tokenizer, parser, and Xtensa code generator that drives a 12,288-LED panel at ~85 fps where interpreted languages (Lua, Gravity) managed 3–10. That result is what makes "go native, not interpreted" the right call, and ESPLiveScript is the reference MoonLive is built against — studied closely, credited, and written fresh against projectMM's architecture, never copied, per [*Industry standards, our own code*](../../CLAUDE.md#principles). MoonLive carries the idea forward where ESPLiveScript stops: a multi-ISA backend behind an IR seam (Xtensa, then RISC-V / ARM / desktop) and a binding that makes a script a first-class MoonModule.
+>
+> The live-scripting idea in this ecosystem also descends from **ARTI-FX / ARTI** (the interpreted-effects runtime in WLED MoonModules), which proved the load-a-script-and-run-it-live loop end-to-end and contributed the `renderFrame`/`renderLed` shape and the host-binding model MoonLive learns from.
+
+
+## 12. Reconciliation with the bottom-up
+
+- **Strong agreement.** The bottom-up's recommendation (native, Xtensa-first, IR seam, WASM fallback, staged safety, C-subset) is carried whole — this doc is its expansion into an architecture + plan, not a revision.
+- **What this doc adds.** The concrete `MoonLive`/`MoonLiveHost`/`MoonLiveEffect` API; the three-tier diagram with the IR seam placed; the host-binding surface mapped to the real `EffectBase`/`Layer` accessors; the perf budget against `scenario_perf_full` numbers; the RipplesEffect side-by-side; and — the key staging insight — **the MoonLight tutorial ladder as the spike spine**, with Ripples demoted from "first demo" to "graduation test."
+- **One refinement vs the bottom-up.** The bottom-up implied Ripples as the first scripted-effect demo; this doc corrects that — Ripples is too complex for hello-world. The tutorial's `setRGB(random16, blue)` is the **spike** (the first thing the engine runs end-to-end); Ripples is the **language-fidelity exam** after the 3D rung. (Separately: that same `setRGB(random16, blue)` line is, by coincidence, also the input the `fix-warnings` fork crashed on — so it doubles as the first compile-time **regression case** for parser validation, §4. Two roles, one line: the spike proves the happy path runs; the regression test proves the malformed-AST path is caught.)
+
+## Out of scope (deferred to implementation)
+
+The exact annotation syntax for controls/role; the compiled-artifact binary format; the web-editor UI; the per-target benchmark numbers (produced by the spikes, not predicted here); the precise instruction-budget tuning; the choice of which built-ins ship in the first library. These are settled in the spikes, concrete-first, not up front.
diff --git a/docs/backlog/ui-deferred.md b/docs/backlog/ui-deferred.md
deleted file mode 100644
index cc0ee51..0000000
--- a/docs/backlog/ui-deferred.md
+++ /dev/null
@@ -1,56 +0,0 @@
-# UI — deferred items & open questions
-
-Forward-looking companion to the shipped UI spec, [moonmodules/core/ui.md](../moonmodules/core/ui.md). The live spec describes the UI as shipped; this file holds what is **not** in it yet: deferred items, open design questions for 1.0, and the gap analysis against projectMM v1. The backward-looking half (how v1/v2 actually worked, patterns consciously rejected, recorded quirks) lives in [history/v1-inventory.md](../history/v1-inventory.md).
-
-Promote items from here into the live spec as they ship. Delete the file when empty.
-
-## Deferred to 1.x
-
-- Side nav with drag-reorder of root modules (root order is fixed in `main.cpp` today; not painful — and arguably correct, see the gap-analysis note below)
-- Health panel (`<details>` + `GET /api/test`)
-- Log panel (`<details>` + WS `{t:"log",m:"…"}`)
-- Core affinity badge (C0/C1) — only meaningful when core pinning lands
-- Module `category()` field — taxonomy beyond `role()` for the picker (decision: derive from `role()` for now)
-
-## Open design questions
-
-These don't block the shipped baseline but should be answered before 1.0:
-
-- **Multi-layer UI** — [architecture.md](../architecture.md) plans for N layers blended into one Drivers. The current card layout shows one Layer. Likely needs a tab/accordion to switch layers, or a per-layer column.
-- **Modifier chain visualization** — show the modifier order visually (the `children[]` order is the apply order). Today they're a flat list.
-- **Presets** — save/load named bundles of control values. Persistence already stores them; needs a UI surface.
-- **Canvas/node-graph view** — v2 attempted this. Powerful for complex setups but doubles the UI surface. A reasonable v3 follow-up gated on user demand.
-
-## Gap analysis — v1 features not yet in v3
-
-Inventory of v1 frontend behaviours v3 lacks, with a recommendation each. Items already shipped (control types, dragTs, two-timescale inputs, type picker, theme, scroll-shrink preview, status bar, reset-to-default, fps/ms toggle, drag reorder, side nav + drawer + footer) are not repeated.
-
-Legend: **Adopt-1.0** (small, high value) · **Defer-1.x** (needs engine work or a feature we lack) · **Drop** (not needed).
-
-### Per-card features
-
-| v1 feature | v3 today | Recommendation |
-|---|---|---|
-| Header: setup-dot before name | name only | **Defer-1.x** — needs `setupOk()` + `health()` on MoonModule with a real failure mode. Today both would always be `true` / `""`. |
-| Module ID shown separately from name | name only | **Defer-1.x** — add when instances need disambiguating (e.g. two effects of the same type under one Layer). |
-| Category emoji badge on the card header | role emoji in the picker, not on the card | **Defer-1.x** — `ROLE_EMOJI` already exists in `app.js`; showing it per-card is a small step if card scannability needs it. |
-| Core affinity badge (C0/C1) | core pinning not implemented | **Drop** until core pinning is a real engine feature. |
-| Memory split heap vs PSRAM | `static+dynamic` shown on the card | **Defer-1.x** — splitting `dynamicBytes` further needs `platform::isPsramPointer(p)` or per-alloc tracking, neither exists yet. |
-
-### WebSocket / panels
-
-| v1 feature | v3 today | Recommendation |
-|---|---|---|
-| Drag-to-reorder *root* modules (`POST /api/modules/reorder`) | not supported | **Drop** — root order is fixed in `main.cpp` and that's correct: Layouts/Layers/Drivers + system modules are mandatory and ordered. Children reorder via drag already. |
-| Log channel `{t:"log",m:"…"}` pushed by server | no server log push | **Defer-1.x** — needs an engine-side log producer. Gate: when boot/network/persistence logs become interesting to non-developers. |
-| Schema channel `{t:"schema",modules:[…]}` for tree-shape changes | full `/api/state` push every update | **Drop** — keep the full-tree push; re-evaluate only if WS bandwidth becomes a problem with large trees. |
-| System health panel (polls `GET /api/test`, pass/fail table) | none | **Defer-1.x** — needs a runtime `/api/test` that runs the doctest suite; `ctest` covers this for now. |
-| Log panel (ring buffer, severity colouring, stick-to-bottom, `GET /api/log` backfill) | none | **Defer-1.x** — pairs with the log WS channel; both arrive together. |
-
-### Cost / decision table
-
-| Cost class | Items |
-|---|---|
-| Tiny (< 30 lines, no backend) | category emoji badge on the card header |
-| Medium (minor backend change) | help-link mapping (needs docs site); richer `category()` than role()-derived |
-| Large (separate plan) | health panel + `/api/test`; log panel + WS log channel; OTA + GitHub-update badge; full multi-layer UI; presets UI |
diff --git a/docs/building.md b/docs/building.md
index 0a8dcff..6721472 100644
--- a/docs/building.md
+++ b/docs/building.md
@@ -124,11 +124,11 @@ The ESP32 tab in MoonDeck wraps the same steps as cards (Setup → Firmware →
 
 **Pinned to `v6.1-dev-399-gd1b91b79b5`** (a specific commit on the pre-release v6.1 branch). `setup_esp_idf.py` holds the exact commit in `PINNED_IDF_VERSION` and warns loudly when the installed tree differs, so a stray `git pull` or a fresh shallow clone landing on a newer dev commit is visible rather than silent. Minimum is ESP-IDF v5.1 (C++20 needs GCC 12+); the project uses v6.x APIs (`esp_eth_phy_new_generic`, the component manager for mDNS, the modern RMT/parlio/LCD drivers) so v5.x would need adjustments.
 
-**Why a dev snapshot and not a stable tag.** As of June 2026 the v6.x line is: **v6.0 is the current stable** (GA 2026-02-27); **v6.1 is still pre-release** (beta1 2026-06-11, RC1 2026-07-23, GA 2026-07-31). We pin a v6.1-dev commit because it carries driver fixes we want on the newer SoCs (P4 parlio, RMT v2 on every chip), and because v6.0 vs v6.1-dev is a small delta. The trade-off is honest: a dev branch gets **no support guarantee** and moves under you, which is exactly why the pin is a fixed commit, not a floating branch. The clean inflection point is **v6.1 GA (2026-07-31)**: re-pin to the `v6.1` tag then, which starts the 30-month support clock (see below). That move is a deliberate re-test pass, not a routine pull. Tracked in [backlog § ESP-IDF version pinning](backlog/backlog.md#esp-idf-version-pinning-pending).
+**Why a dev snapshot and not a stable tag.** As of June 2026 the v6.x line is: **v6.0 is the current stable** (GA 2026-02-27); **v6.1 is still pre-release** (beta1 2026-06-11, RC1 2026-07-23, GA 2026-07-31). We pin a v6.1-dev commit because it carries driver fixes we want on the newer SoCs (P4 parlio, RMT v2 on every chip), and because v6.0 vs v6.1-dev is a small delta. The trade-off is honest: a dev branch gets **no support guarantee** and moves under you, which is exactly why the pin is a fixed commit, not a floating branch. The clean inflection point is **v6.1 GA (2026-07-31)**: re-pin to the `v6.1` tag then, which starts the 30-month support clock (see below). That move is a deliberate re-test pass, not a routine pull. Tracked in [backlog](backlog/README.md).
 
 **v6.0 is the floor — don't depend on anything newer than it.** Because **v6.0 stable is our fallback** if the v6.1 line proves troublesome, the firmware and build tooling must stay buildable on v6.0. The rule is generic: **use no IDF API, component, Kconfig symbol, or tool that isn't present in v6.0.** A feature that exists only on the v6.1-dev branch (or arrives in a later minor) is off-limits until v6.0 is no longer the fallback. When adopting anything new from the IDF, confirm it shipped in v6.0 first (check the v6.0 docs / release notes, not `latest`); if it's v6.1-only, it waits.
 
-**Explicit exceptions are allowed.** The floor is a default, not an absolute. A feature may step below it (depend on something not in v6.0) when the product owner decides so *explicitly* and the reason is documented at the point it's introduced — in the module spec, a code comment at the dependency, and the commit body. The bar is a conscious, recorded decision, not a silent drift: a floor you can consciously waive with a stated reason stays honest, whereas a rule quietly violated does not. Each such exception also narrows the v6.0 fallback (that target now needs the newer dependency too), so it states what the fallback loses. The known exception today is **P4 WiFi over the C6 co-processor**, which needs `esp_wifi_remote` / esp-hosted (a managed component outside mainline v6.0); it is an accepted, documented exception, scoped to the P4 target, tracked in the [backlog](backlog/backlog.md#esp32-p4-support--rounds-3-4-in-progress).
+**Explicit exceptions are allowed.** The floor is a default, not an absolute. A feature may step below it (depend on something not in v6.0) when the product owner decides so *explicitly* and the reason is documented at the point it's introduced — in the module spec, a code comment at the dependency, and the commit body. The bar is a conscious, recorded decision, not a silent drift: a floor you can consciously waive with a stated reason stays honest, whereas a rule quietly violated does not. Each such exception also narrows the v6.0 fallback (that target now needs the newer dependency too), so it states what the fallback loses. The known exception today is **P4 WiFi over the C6 co-processor**, which needs `esp_wifi_remote` / esp-hosted (a managed component outside mainline v6.0); it is an accepted, documented exception, scoped to the P4 target, tracked in the [backlog](backlog/README.md).
 
 **v6.0 vs v6.1, and where the real change was.** The earthquake was **v5.x → v6.0**, not v6.0 → v6.1:
 
@@ -172,7 +172,7 @@ The general rule: **anything already in v6.0 we adopt proactively** (it clears t
 2. **`network_provisioning`** — the headline capability: a sibling provisioning module beside ImprovProvisioning adding the phone-app + SoftAP onboarding flow. Its own plan (spec before code), a `Peripheral`/System module reusing the WiFi-credential plumbing, BLE-stack cost weighed per chip.
 3. Further v6.0 items (PSA-native crypto, CMake v2, MCP) are pulled in as their triggers fire (first direct crypto use; v2 GA; a debug need), per the rows above.
 
-Tracked in [backlog § ESP-IDF version pinning](backlog/backlog.md#esp-idf-version-pinning-pending).
+Tracked in [backlog](backlog/README.md).
 
 ### Firmware variants
 
diff --git a/docs/history/README.md b/docs/history/README.md
index 1ea8910..249b723 100644
--- a/docs/history/README.md
+++ b/docs/history/README.md
@@ -48,7 +48,7 @@ Reading across the friend-repo digests, the themes the wider ESP32-LED ecosystem
 
 ## What these projects do that projectMM doesn't (yet)
 
-Observational — where the landscape is ahead of projectMM. These are *not* commitments; real adoption decisions live in [`../backlog/backlog.md`](../backlog/backlog.md), cross-referenced where one already exists.
+Observational — where the landscape is ahead of projectMM. These are *not* commitments; real adoption decisions live in the backlog ([`../backlog/`](../backlog/README.md)), cross-referenced where one already exists.
 
 - **Parallel multi-strip output on S3/P4** (PARLIO/LCD_CAM, and hpwit's I2S/shift-register drivers) — projectMM's driver story is ArtNet-out today; native parallel LED output is unbuilt. See the [LED-driver analysis](../backlog/leddriver-analysis-top-down.md) in backlog.
 - **Audio-reactive input** — none of projectMM's effects are audio- or motion-reactive yet. The Peripheral role + the Pi-sensor backlog entry are the foundation; the producer→effect wiring is backlog.
diff --git a/docs/history/decisions.md b/docs/history/decisions.md
index 7d712eb..7b90324 100644
--- a/docs/history/decisions.md
+++ b/docs/history/decisions.md
@@ -116,7 +116,7 @@ are concrete rules, not aspirations.
 - **addControl binds to class variable by reference.** Control stores a `uintptr_t` pointer to the variable. Hot-path code reads the variable directly — zero overhead. UI updates write through the pointer. Supports uint8_t, int8_t, uint16_t, uint32_t, int, float, bool, Coord3D.
 - **Node — minimal memory.** Base class ~29 bytes + vtable. Effects add only their control variables (uint8_t each). A typical effect adds just 2 bytes on top. No std::string members.
 - **LightsHeader — one struct for LEDs AND DMX fixtures.** Configurable `channelsPerLight` (3=RGB, 4=RGBW, up to 32 for moving heads) with offset fields for red/green/blue/white/pan/tilt/zoom/rotate/gobo. This IS the "light = LED pixel or DMX fixture" concept.
-- **Layer start/end percentages.** `startPct`/`endPct` as Coord3D percentages (0-100) of the total fixture. Maps to v3's "start/end position within the physical layout."
+- **Region start/end percentages.** MoonLight's `startPct`/`endPct` as Coord3D percentages (0-100) of the total fixture. Shipped in v3 as a modifier, not as Layer controls.
 - **oneToOneMapping / allOneLight fast paths.** Boolean flags that skip the mapping table entirely when mapping is 1:1 identity. Essential for the no-PSRAM 12K LED case.
 - **Transition brightness.** Per-layer animated brightness overlay (current, target, step). Enables smooth fade-in/out when switching effects. Should be added to v3.
 - **SharedData — zero-allocation inter-node communication.** Single struct shared by all nodes: 16-band FFT audio, volume, beat detection, gravity (IMU), status. Lightweight alternative to pub/sub.
@@ -692,7 +692,7 @@ The installer was reworked so a board catalog ([`boards.json`](../install/boards
 
 **A persistence overlay must distinguish "key absent" from "value 0".** The runtime-Ethernet-PHY work moved pin/PHY config from a compile-time `constexpr ethPins` into persisted NetworkModule controls (`ethType`, pin GPIOs, …) with **non-zero per-chip defaults** (P4 IP101 = `ethType` 2). That exposed a latent bug in `applyControlValue` (the persistence load path): it used `json::parseInt(json,key)`, which returns 0 for an *absent* key — indistinguishable from a real 0 — and then wrote that 0 into the control under the Clamp policy. So loading an older/partial `<Module>.json` that omitted a key **clobbered the control's default with 0**. On the ESP32-P4 this zeroed `ethType` (2 → 0 = none), so `ethInit()` dispatched to "no Ethernet": link LEDs on, but no DHCP. It was invisible on classic/Olimex (their eth defaults are mostly 0 anyway) and on `main` (which still read the `constexpr ethPins` directly), so it only bit once eth config became persisted controls with meaningful non-zero defaults. **Fix:** a `json::hasKey()` guard in `applyControlValue` — an absent key leaves the control untouched (preserves its default); a present key (even value 0) still applies. Lesson: any "control resets to its default/0 after reboot" symptom is a persistence-overlay smell, not a control-init bug; a flat JSON parser that returns a zero sentinel for missing keys MUST be paired with a presence check before the value is applied as authoritative. The decisive debugging move was a `std::printf` of the runtime struct over the P4's *secondary* USB-Serial-JTAG console (stdout reaches USB even when ESP_LOG/UART is on GPIO 37/38), after a `git worktree` bisect (round-1 ✓, main ✓, uncommitted ✗) proved it was our code, not hardware or IDF.
 
-**A GPIO pin is its own control type (`ControlType::Pin`), not an overloaded int16.** Pins were first added as `addInt16` with a `-1..48` range, which the UI rendered as a *slider* — meaningless for a GPIO, and the cap wrongly excluded the P4's high pins (MDIO 52, clk 50). Dropping the range didn't help: the UI's `int16` case *always* draws a slider (an unbounded int16 falls back to a −100..200 percentage slider that Layer start/end positions rely on), so int16 couldn't be made to mean both "position slider" and "pin number." The fix is a dedicated `Pin` type: `int8_t` storage (one byte — a GPIO never exceeds ~54, and on a DRAM-scarce ESP32 the per-pin byte matters across many pin controls), −1 = unused, the UI always renders a plain number input keyed off the `"pin"` type string, and min/max are a server-side write-clamp guard only. Serializes/parses as a plain integer (same as int16). This also serves every future pin control (LED-driver clockPin/dcPin, GyroDriver SDA/SCL, board pins) — they migrate to `addPin` for free. Lesson: when one control type is doing two jobs with different UX (slider vs number), that's the smell for a new type, not a range hack; and pick the smallest storage that fits the domain (int8 for a pin).
+**A GPIO pin is its own control type (`ControlType::Pin`), not an overloaded int16.** Pins were first added as `addInt16` with a `-1..48` range, which the UI rendered as a *slider* — meaningless for a GPIO, and the cap wrongly excluded the P4's high pins (MDIO 52, clk 50). Dropping the range didn't help: the UI's `int16` case *always* draws a slider (an unbounded int16 falls back to a −100..200 percentage slider that position/region controls rely on), so int16 couldn't be made to mean both "position slider" and "pin number." The fix is a dedicated `Pin` type: `int8_t` storage (one byte — a GPIO never exceeds ~54, and on a DRAM-scarce ESP32 the per-pin byte matters across many pin controls), −1 = unused, the UI always renders a plain number input keyed off the `"pin"` type string, and min/max are a server-side write-clamp guard only. Serializes/parses as a plain integer (same as int16). This also serves every future pin control (LED-driver clockPin/dcPin, GyroDriver SDA/SCL, board pins) — they migrate to `addPin` for free. Lesson: when one control type is doing two jobs with different UX (slider vs number), that's the smell for a new type, not a range hack; and pick the smallest storage that fits the domain (int8 for a pin).
 
 **`deviceName` (identity) vs `deviceModel` (product) vs board (bare PCB) — one term was doing three jobs.** "Board" had been overloaded to mean the per-unit network identity, the hardware product/catalog key, AND the bare PCB. Untangling it: `deviceName` is the **per-unit identity** — one string that drives mDNS (`<deviceName>.local`), the SoftAP name, and the DHCP hostname, so the device shows up under one name everywhere; it's RFC-1123-coerced (`sanitizeHostname`) because it becomes a hostname. `deviceModel` is the **hardware product** (the `deviceModels.json` catalog key, e.g. "projectMM testbench S3") — display-form, spaces allowed, never a hostname. "Device" is the umbrella noun; "board" now means **only the bare PCB**. This drove the BoardModule→SystemModule fold (the identity is core unit state, not a separate module), the `board`→`deviceModel` rename across catalog/installer/Improv (SET_BOARD→SET_DEVICE_MODEL, byte 0xFE unchanged), and the eth pin-map clarification (driver = firmware, pin map = firmware-seeded but **deviceModel-authoritative** so an Olimex entry can override). Lesson: when one noun answers three different questions ("what do I call this unit on the network?", "what product is it?", "what's the bare board?"), that's a naming smell — split it into the qualified terms, pick one umbrella word, and make the split visible in every layer (control names, RPC symbols, catalog keys, docs) so the three concepts can't re-merge.
 
@@ -703,3 +703,9 @@ The installer was reworked so a board catalog ([`boards.json`](../install/boards
 **When a working seam regresses after your "fix," suspect the fix — and measure with a tool faithful to what the user sees.** The resumable preview send (`sendBufferedFrame`/`drainPreviewSend` — stream the producer buffer a memory-adaptive chunk per `loop20ms`, drop-new backpressure, downsample + display cap) shipped working on all three boards. A later attempt to *also* route the coordinate table + downsampled colour frame through the resumable path (removing the synchronous `sendAllOrClose` spin-and-close) looked principled but **regressed every board into an intermittent stall**, through several variants. Three lessons compounded: (1) **Stop at the first failed fix on a working path.** Each "improvement" to a seam that already worked added a new failure; the discipline (CLAUDE.md *Anti-stalling*) is to revert to the known-good state at attempt two, not re-engineer. The committed synchronous coord/downsampled path *closes a wedged client past a spin budget and lets it reconnect* — not elegant, but proven; the elegant unification wasn't worth a regression nobody could pin. (2) **A measurement tool must be faithful to the real client or it invents and hides bugs.** A plain one-shot WebSocket probe *gave up on close* where a browser *reconnects*, so it reported stalls users never saw AND missed blips they did — it sent the debugging in circles for a whole session. The fix was a browser-faithful probe (`scripts/diag/preview_health.py`: reads binary frames, sends the 25 s keepalive ping, auto-reconnects with backoff — exactly `app.js`'s `connectWs`); only then did probe and eyes agree. (3) **A stale process masquerades as a code bug.** "No preview on the PC build" with a corrupt-looking on-the-wire coordinate count survived every fresh rebuild — because a **38-hour-old desktop binary** still held port 8080; the freshly-built one couldn't bind and the browser/probe hit the stale one. The tell was the *uptime*, spotted by the product owner, not the diff. 
Lesson: before bisecting a "rebuild didn't fix it" bug, confirm the artifact under test is the one you built (check the process uptime / `build` timestamp / what's actually bound to the port). The faithful probe is now the standing way to measure preview health on any target (PC + the three boards), wired into MoonDeck's Live tab.
 
 **Don't hold a vendor library's async handle across your own event loop — it races the library's internal timers.** A UI refresh intermittently crashed the device (`assert failed: xQueueSemaphoreTake queue.c:1709 (( pxQueue ))` — a null FreeRTOS queue — inside the espressif mDNS component's `mdns_query_async_get_results`, plus an `Interrupt wdt timeout`). The mDNS *browse* (discovering peers for the "Your devices" list — distinct from mDNS *advertise*, which serves `<deviceName>.local` and was never the problem) used the async API: `mdns_query_async_new` returns a handle that `DevicesModule` held across ticks, polling it each `loop1s` with a 0 ms timeout. The trap: the mDNS component's **own task** owns that handle's queue and **frees it when the query's window (3 s) expires** — so a poll landing in the gap after expiry asserts on a freed queue. It was intermittent and grid-size-sensitive (a bigger grid lengthens the tick, widening the gap) and looked like "refresh crashes it" only because a refresh's activity coincided with the poll. **First fix attempt was wrong:** I assumed a *service-table mutation* (live rename re-registering `_http._tcp`) tore the handle down and added a cancel-before-mutate guard — it didn't fix it, because the freeing party is the component's expiry timer, not our code. **Real fix:** stop using the async-handle API entirely — replace the start/poll/stop trio with one synchronous `mdnsBrowse()` (`mdns_query_ptr`) that queries, delivers results, and frees everything in a single call, holding **no handle across ticks**, so the race window can't exist. The catch that synchronous introduced: `mdns_query_ptr` blocks the *full* timeout (it waits the whole window for late responders, no early return) and `loop1s` is charged to the tick — an 80 ms query tanked the tick. So **throttle**: browse one service type every ~8th tick with a ~60 ms timeout — one brief hiccup every ~8 s, invisible for discovery, FPS untouched in between. 
Lessons: (1) a library's async/iterator handle is only valid between *its* lifecycle events — if you can't see when/where those fire (here, an internal expiry timer on another task), don't hold the handle across your loop; prefer a self-contained synchronous call that owns the whole lifecycle. (2) An *intermittent, load-dependent* crash whose backtrace sits in a vendor component is a **lifecycle race**, not a component bug — but find the *actual* concurrent actor before "fixing" (my first guess at the actor was wrong and the fix did nothing). (3) Trading async for synchronous trades a race for a blocking cost — budget it (throttle + bound the timeout) so the cure isn't a tick-killer. (4) Desktop stubs these mDNS calls to no-ops, so it's a hardware-only fix the unit suite can't reach; the reproduction (concurrent WS churn at a large grid → crash before, stable after, uptime climbing) is the proof, in the commit, not a desktop test.
+
+**A dead control that was always meant to be functional belongs in the mechanism that already expresses it, not where it happens to sit.** Six persisted-but-ignored Layer controls (percent region carving) were due to be wired into `rebuildLUT`; the product owner's question — *can a modifier already do this?* — was the better path. `ModifierBase`'s two virtuals (`logicalDimensions`, `mapToPhysical`) express carving exactly, so it shipped as a modifier and the Layer controls were deleted. Lessons: (1) before wiring an inert control where it lives, check whether an existing mechanism already covers it. (2) "make the default fastest" is best met by making the default the *absence* of the feature — full coverage = no modifier = the existing fast path, zero added cost — not a guarded branch through it.
+
+One sub-decision the implementation forced: the boundary rounding. The original spec said inclusive-ceil ("start 33/end 66 on a 4-wide axis → pixels 1..3"), which on a 128-wide axis makes `end=50` land on pixel 64 *inclusive* — so two abutting layers (0..50, 50..100) **overlap by one pixel** at the seam. The product owner chose **half-open `[start, end)`** instead: `end=50` → pixels 0..63, and 0..50 + 50..100 tile a 128 axis into 0..63 / 64..127 exactly, no overlap, no gap (with a min-1-pixel floor so tiny panels still get a non-zero region). Lesson: when a region/range feature will be used to *tile* a space, half-open intervals are the textbook choice (same reason `[begin, end)` is the C++ iterator convention) — inclusive bounds double-count the seam.
+
+Lessons: (1) a persisted-but-inert control is a feature with no home yet — before wiring it where it sits, ask whether an existing mechanism already expresses it (the modifier interface did, completely). (2) "make it the fastest at the default" is often best met by making the default the *absence* of the feature, not a fast branch inside it. (3) a feature framed as "a Layer property" may really be "a composable transform" — the modifier framing also unlocked stacking for free. (4) reach for half-open intervals whenever regions abut.
diff --git a/docs/history/plans/Plan-20260624 - Dev-channel update badge.md b/docs/history/plans/Plan-20260624 - Dev-channel update badge.md
new file mode 100644
index 0000000..aa507d1
--- /dev/null
+++ b/docs/history/plans/Plan-20260624 - Dev-channel update badge.md	
@@ -0,0 +1,48 @@
+# Plan — Per-build `latest` version (`2.1.0-dev.<N>`) + dev-channel update badge
+
+Lands on `next-iteration` (joins PR #27), building on the semver-clean version + update-badge work.
+
+## Context
+
+The semver-clean version work gave the device a clean `version`, but the moving `latest` build has **no distinct version identity**: every `latest` build reports `2.1.0-dev`, and its published manifest/assets are stamped with the old stable `2.0.0` (everything keys off `library.json`'s bare version). So two devices from different `latest` builds report the same version, and the update badge can't tell a stale `latest` device that a newer `latest` exists.
+
+Fix (semver.org §9/§11, also corrects the mislabeled-`2.0.0` manifest): give each `latest` build a monotonic prerelease version `2.1.0-dev.<N>`, `<N>` = commit count since the last tag (`git rev-list --count`, git-describe style). `semver.js` already compares these numerically (§11). Then extend the badge so a device on a `-dev` build also lights up when a newer `latest` exists.
+
+## Decisions (PO)
+- `<N>` = commit count since last tag.
+- Lands on `next-iteration` (PR #27).
+
+## Approach
+
+### 1. Per-build `latest` version through the pipeline
+One computed `V`, consistent across binary (`MM_VERSION`), asset names (`firmware-<F>-v<V>.bin`), manifest (`generate_manifest.py --version`):
+- Stable `vX.Y.Z`: `V` = library.json core (drop `-dev`). Unchanged.
+- `latest` (main push): `V` = `<core>-dev.<commit-count-since-last-tag>`.
+- Local/dev: library.json verbatim — `2.1.0-dev` sorts *below* any published `2.1.0-dev.N`, so a local build never falsely claims newer.
+
+Reuse the existing `-D` override pattern (`MM_FIRMWARE_NAME`/`MM_RELEASE` already do this):
+- `generate_build_info.py`: `MM_VERSION` becomes an `#ifndef` default (= library.json), overridable by `-DMM_VERSION`.
+- `build_esp32.py` `firmware_cmake_args(...)`: optional `version` → `-DMM_VERSION`; add `--version` CLI arg.
+- `compute_version.py` (NEW): the `V` computation as a testable helper (stable core vs latest `-dev.<count>`, tag-less fallback to `rev-list --count HEAD`).
+- `release.yml`: call compute_version once, `fetch-depth: 0`, thread `V` into build matrix + asset-name step + manifest step.
+
+### 2. Dev-channel update badge (`app.js`)
+Extend `checkFirmwareUpdate`: if the device version is a prerelease (`parse(...).prerelease.length > 0`) and no stable update is shown, fetch the `latest` release (cache key `projectMM.update.dev.v1`), read its version from `manifest-<firmware>.json` (`.version`), `isNewer(latestDev, deviceVersion)` → badge → click opens Firmware with `latest` pre-selected. Stable update takes precedence. Best-effort, cached, compatible-`.bin` check applies.
+
+## Files
+- `scripts/build/compute_version.py` (NEW) + `test/python/test_compute_version.py` (NEW)
+- `scripts/build/generate_build_info.py` — `MM_VERSION` overridable `#ifndef`
+- `scripts/build/build_esp32.py` — `--version` → `-DMM_VERSION`
+- `.github/workflows/release.yml` — compute V, fetch-depth 0, thread through
+- `src/ui/app.js` — dev-channel branch
+- `src/ui/semver.js` tests — `2.1.0-dev.7 > 2.1.0-dev.6`, `2.1.0-dev.1 > 2.1.0-dev`
+- `docs/moonmodules/core/FirmwareUpdateModule.md` — note `-dev.<N>` for latest
+
+## Verification
+- Host: node/python tests, build, ctest, scenarios, spec check.
+- Smoke: `build_esp32.py --version 2.1.0-dev.7` → device reports it.
+- Bench S3: flash `-dev.5`, latest manifest reports higher `-dev.N` → badge appears, click opens Firmware/latest. Newest `-dev` → no badge.
+- CI dry run: compute_version → `2.1.0-dev.<n>` on main, `2.1.0` on tag; verify-version passes (compares cores).
+
+## Risks
+- Python helper over inline YAML shell (testable). `fetch-depth: 0` is required so the full git history and tags are available to the count. With no tag present, the count falls back to `rev-list --count HEAD`. One extra fetch for `-dev` devices, cached.
diff --git a/docs/history/plans/Plan-20260624 - Semver version + update-available badge.md b/docs/history/plans/Plan-20260624 - Semver version + update-available badge.md
new file mode 100644
index 0000000..54c345f
--- /dev/null
+++ b/docs/history/plans/Plan-20260624 - Semver version + update-available badge.md	
@@ -0,0 +1,56 @@
+# Plan — Semver-clean version + "firmware update available" badge
+
+## Context
+
+The Firmware card's `version` control shows `2.0.0 (v2.0.0)` — a semver (`kVersion`) concatenated with a release-channel tag (`kRelease`). For a stable build the tag is just `v` + the semver, so it's redundant *and* non-semver. The product owner wants `version` to be **industry-standard semver, always** — and the channel **derivable from the semver itself**, not stored as separate metadata. The semver-correct way (semver.org §9/§11) to express "a moving `latest`/dev build that is ahead of the last stable but not itself a release" is a **prerelease identifier**: `2.1.0-dev`. So a stable build shows `2.0.0`; the moving `latest` build shows `2.1.0-dev`. Channel = "has a prerelease suffix → not stable."
+
+On top of that clean version, add a status-bar **"firmware update available" badge**: the browser compares the device's running semver to the newest GitHub **stable** release and, when newer, shows a badge that opens the Firmware card. Modelled on ESP32-sveltekit's `UpdateIndicator.svelte` (the upstream firmware lineage MoonLight forks) — *carry the idea forward, write our own code* (CLAUDE.md *Industry standards, our own code*).
+
+## Git tag vs firmware version (important distinction)
+`2.1.0-dev` is the **semver burned into the firmware** (`MM_VERSION`), NOT a new git tag. The moving build keeps its **`latest`** GitHub tag — only the version *inside* it changes. So: stable release → tag `v2.0.0`, firmware version `2.0.0`; moving build → tag `latest` (unchanged), firmware version `2.1.0-dev`; next stable → tag `v2.1.0`, firmware version `2.1.0` (the `-dev` suffix dropped at release time). The badge compares the device's firmware version against `releases/latest` (newest stable, `latest` excluded), so a `2.1.0-dev` device shows no badge — it is correctly *ahead* of the latest stable.
+
+## Decisions made with the PO
+- Moving/latest builds carry **`2.1.0-dev`** (library.json bumped to the next dev version right after each release — standard "develop on a prerelease" flow).
+- Badge fetches GitHub **cached in localStorage, re-fetch only if > 1 hour stale, PLUS** a fresh check when the Firmware module is opened (don't slow page load).
+- Semver comparison via a **reusable `src/ui/semver.js`** (our own code, no npm dep), JS unit test. Improves the codebase's semver story (today releases sort by *date*; no semver compare exists).
+- **Badge click → open the Firmware card with the new release pre-selected** (lands the user one click from Install). Reuses the picker's `PREF_RELEASE_KEY` restore + `selectModule()`; no new popup.
+
+## Approach (3 pieces)
+
+### 1. Semver-clean version (build pipeline + firmware)
+- `library.json`: version `2.0.0` → `2.1.0-dev`. `build_info.h` is gitignored + generated from this, so `MM_VERSION` follows.
+- `scripts/build/verify_version.py`: a stable `vX.Y.Z` tag matches `library.json` **with any prerelease suffix stripped** (so `v2.1.0` ↔ `2.1.0-dev` passes — the release of what was in dev; a wrong *core* like `v2.2.0` ↔ `2.1.0-dev` still fails). Keep the `latest`-skips behaviour. Doc the ritual.
+- `src/core/FirmwareUpdateModule.h` (`setup()`): `version` control = **just `kVersion`** (pure semver). Drop the `(kRelease)` concatenation. Update inline comment + spec doc.
+- `docs/moonmodules/core/FirmwareUpdateModule.md`: `version` description → "pure semver; a `-dev`/prerelease suffix marks a moving/pre-release build."
+
+### 2. Reusable semver module (`src/ui/semver.js`, NEW)
+- Dependency-free, textbook: `parse(v)` (strip leading `v`) → `{major,minor,patch,prerelease[]}`; `compare(a,b)` → -1/0/1 per semver.org §11 (numeric core, then prerelease-present < absent, identifiers field-by-field, numeric < non-numeric); `isNewer(candidate,current)` = `compare===1`.
+- One home for the comparison (CLAUDE.md *Complexity lives in core*). ESM, importable by app.js + the picker.
+
+### 3. "Update available" badge (status bar)
+- `src/ui/index.html`: `<a id="fw-update-badge" class="fw-update-badge" hidden>` in `#status-bar`, before `#ws-dot`.
+- `src/ui/style.css`: small amber-ish badge (reuse existing palette), hidden by default.
+- `src/ui/app.js`:
+  - Cache + fetch (reuse picker's `safeLocalGet/Set` + TTL pattern; key `projectMM.update.latest.v1`; TTL 1 h; serve stale on failure). `getLatestStableRelease({force})` → fetches `api.github.com/repos/MoonModules/projectMM/releases/latest` only if stale or forced.
+  - Compare: device `version` + `firmware` key from `/api/state`; `isNewer(latest.tag_name, deviceVersion)` AND a compatible `firmware-<key>-v<ver>.bin` exists in the release assets (mirrors sveltekit's asset-target check).
+  - When: cache-first check on load; `{force:true}` when the Firmware module opens.
+  - Click: `safeLocalSet("projectMM.picker.releaseTag", tag)` then `selectModule(<firmware module>)` → Firmware card opens with the new release pre-selected, Install ready.
+  - Graceful: any failure → badge hidden, `console.warn` only.
+
+## Files
+- `library.json` · `scripts/build/verify_version.py` · `src/core/FirmwareUpdateModule.h` · `docs/moonmodules/core/FirmwareUpdateModule.md`
+- `src/ui/semver.js` (NEW) · `src/ui/index.html` · `src/ui/style.css` · `src/ui/app.js`
+- `test/js/semver.test.mjs` (NEW)
+
+## Verification
+- Host: `node --test "test/js/**/*.test.mjs"`; `node --check` the JS + extract-check index.html; `cmake --build build` + `ctest`; `uv run scripts/scenario/run_scenario.py`; `uv run scripts/check/check_specs.py`; a `test/python` verify_version case (`v2.1.0` ↔ `2.1.0-dev` OK; `v2.2.0` ↔ `2.1.0-dev` fails).
+- Bench/preview: Firmware card shows clean semver; badge appears on an older device, opens Firmware pre-selected; no badge on newest stable; no error offline.
+
+## Existing releases — already semver-compatible (no migration)
+Only `v1.0.0` + `v2.0.0` (both clean semver) + `latest` (moving prerelease channel, excluded by `releases/latest`). Badge input is always a clean `vX.Y.Z`; nothing to migrate.
+
+## Risks / notes
+- Release ritual: next stable bumps `library.json` `2.1.0-dev` → `2.1.0` before tagging. Keep verify_version's suffix-strip exact so a wrong core still fails. Call out in the PR.
+- GitHub rate limit (60/h/IP): 1 h cache + serve-stale keeps it well under; badge is best-effort.
+- No npm toolchain: semver.js is plain ESM, `node:test` only. Our own code, no `compare-versions` dep.
+- The `release.yml` `paths:` change, currently uncommitted on this branch, is a *separate* installer-deploy fix — commit it independently.
diff --git a/docs/history/plans/Plan-20260625 - Multi-layer composition.md b/docs/history/plans/Plan-20260625 - Multi-layer composition.md
new file mode 100644
index 0000000..6345dda
--- /dev/null
+++ b/docs/history/plans/Plan-20260625 - Multi-layer composition.md	
@@ -0,0 +1,77 @@
+# Plan — Multi-layer composition (blend N layers into the consumer buffer)
+
+> Approved feature plan (PO reference, per CLAUDE.md *Plan before implementing*). The filename gets a `(shipped)` / `(attempted, abandoned)` marker when its outcome is known.
+
+## Context
+
+The product owner wants two things: **multiple effects per layer** and **multiple layers blended into the consumer buffer**. Investigation shows:
+
+- **Multiple effects per layer is ALREADY DONE.** `Layer::loop()` ([src/light/layers/Layer.h:137-142](../../src/light/layers/Layer.h)) iterates *all* enabled effect children in order and calls each `eff->loop()`; they write the same layer buffer sequentially, each overwriting/adding where it writes — exactly the requested "next effect overwrites the previous where it writes." No work needed; verify with a scenario and move on.
+- **Multi-layer composition is the real work** — the 🚧 designed-not-implemented item (architecture.md §345) + backlog item (backlog-core.md:208). `Layers` holds N layers but `Layers::activeLayer()` hands `Drivers` only the **first enabled** layer; the rest render their buffers but never reach output.
+
+The groundwork is already in place, which makes this small:
+- **`Drivers` already owns `outputBuffer_`** and already calls `blendMap(layer->buffer(), outputBuffer_, lut, cpl)` in `loop()` ([Drivers.h:186-193](../../src/light/drivers/Drivers.h)) — for one layer today.
+- **`blendMap` already has the additive-with-clamp path** for overlapping sources, built *for* this ([BlendMap.h:16](../../src/light/layers/BlendMap.h), documented in [BlendMap.md](../../docs/moonmodules/light/BlendMap.md) §5).
+- **Each Layer already owns its own buffer + LUT** and renders independently.
+
+So composition = loop over enabled layers instead of one, blending each into the same `outputBuffer_` per its mode/opacity.
+
+## Decisions (with PO)
+
+- **Compositing site: Drivers.** Each Layer keeps its own buffer; `Drivers` composites them in order into `outputBuffer_`, then map+correct per child driver as today. (Matches architecture.md §345.)
+- **Blend value on Layer, blend logic in Drivers.** `blendMode` + `opacity` are per-Layer **controls** (inert parameters that travel with the layer through add/delete/reorder — no separate sync'd list). Drivers reads each layer's settings + the **Layers container's child order** and blends predecessors→successors. Precedent: `Correction` (per-X state, Drivers applies it). The PO's insight — a Layer can't know its stack position — is honoured: order and orchestration live in Drivers; only the *parameter* lives on the Layer.
+- **Blend modes first: Alpha (opacity) + Additive.** The two architecture.md §345 names. Additive = sum-with-clamp (the existing `blendMap` path); Alpha = opacity-weighted over. More modes (multiply/screen) later.
+- **Order = Layers container child order** (already drag-reorderable, like effects/modifiers). The bottom (first-composited) layer's blendMode is moot — nothing under it; it just fills the buffer.
+
+## Approach
+
+### 1. Per-Layer blend controls (`src/light/layers/Layer.h`)
+- Add `blendMode` (Select: `alpha` / `additive`) + `opacity` (uint8 0–255, default 255) controls in `onBuildControls()`. Inert — Layer doesn't act on them; Drivers reads them.
+- Expose accessors `blendMode()` / `opacity()` for Drivers to read.
+
+### 2. `Layers` exposes all enabled layers in order (`src/light/layers/Layers.h`)
+- Keep `activeLayer()` (first enabled) for the degenerate/back-compat path, but add an ordered walk — e.g. `forEachEnabledLayer(cb)` or `enabledLayers()` — so Drivers can iterate the stack in child order. Don't build a parallel list; iterate the container's children, role-filtered to `Layer`, `enabled()` only (same filter `activeLayer()` already uses).
+
+### 3. Drivers composites all layers (`src/light/drivers/Drivers.h`)
+- `onBuildState()`: size `outputBuffer_` from the composition extent (the max physical extent across enabled layers — today it's the single layer's `physicalLightCount()`; with N layers it's the max, since they composite into one physical space). Keep the degrade-on-alloc-fail path.
+- `loop()`: replace the single `blendMap(layer_->buffer(), outputBuffer_, …)` with an ordered pass:
+  - **First enabled layer**: clears + writes `outputBuffer_` (the existing overwrite/clear behaviour — `blendMap` already clears dst first).
+  - **Each subsequent enabled layer**: blends into `outputBuffer_` per its `blendMode` + `opacity` — `additive` uses the existing clamp path; `alpha` is `out = src*α + out*(1-α)`.
+  - This needs `blendMap` to take a **blend mode + opacity** (today it picks overwrite-vs-additive purely from the LUT's `overwrites_`). Extend its signature: `blendMap(src, dst, lut, cpl, BlendOp op, uint8_t opacity, bool first)` — `first` selects clear-then-write; `op`/`opacity` select the per-pixel combine. Keep the fast overwrite path for `first && opacity==255`.
+- `passBufferToDrivers()`: unchanged in spirit — children still read `outputBuffer_` (the composed result). The single-layer identity fast path (no LUT → read `layer_->buffer()` directly) only applies when there's exactly one enabled layer with no LUT; with ≥2 layers there's always a composite, so `outputBuffer_` is the source. Preserve the 1-layer-no-LUT zero-copy fast path as a special case.
+
+### 4. `blendMap` gains a mode + opacity (`src/light/layers/BlendMap.h`)
+- Add a small `BlendOp { Overwrite, Alpha, Additive }` enum + opacity param. Keep the existing fast overwrite-copy path (first layer, full opacity, single-write LUT). Bounds-checks stay. The additive-clamp path already exists; add the alpha path (integer math: `(src*α + dst*(255-α) + 127) / 255` per channel, clamped — textbook 8-bit alpha-over).
+
+## Files
+- `src/light/layers/Layer.h` — blendMode + opacity controls + accessors
+- `src/light/layers/Layers.h` — ordered enabled-layer walk
+- `src/light/drivers/Drivers.h` — composite loop over enabled layers into outputBuffer_; size from max extent
+- `src/light/layers/BlendMap.h` — BlendOp + opacity param; alpha path
+- `docs/moonmodules/light/Layer.md` / `Layers.md` / `Drivers.md` / `BlendMap.md` — document the controls + composition (move the 🚧 in architecture.md §345 to present-tense; remove/trim the backlog item)
+- `docs/architecture.md` — §345 multi-layer composition: 🚧 → present tense once it ships
+- `test/scenarios/light/scenario_*` — new composition scenario(s); a unit test for the alpha/additive blend math
+
+## Hot-path notes
+- Integer alpha math only (no float per-light) — `(src*α + dst*(255-α) + 127)/255`, clamped; the project's per-light-integer rule.
+- N layers = N `blendMap` passes over the physical buffer per tick — cost scales with enabled-layer count × physical lights. Single-layer path keeps today's cost (one pass, or zero-copy when no LUT). Capture the multi-layer tick in `performance.md`.
+- No per-tick allocation: `outputBuffer_` is allocated in `onBuildState`, reused each frame. PSRAM-first via the existing alloc.
+- Robustness: add/delete/reorder/disable any layer in any order, 0×0×0, all enabled / none enabled — the compositor degrades (none enabled → cleared/black output, never a crash; the existing null-tolerance + degrade-on-alloc-fail patterns extend to the loop).
+
+## Verification
+- Unit: blend math (alpha + additive, clamp, opacity endpoints 0/255).
+- Scenario: two layers, one additive one alpha, assert composited buffer; reorder layers → output changes; disable top layer → only bottom shows; multi-effect-per-layer (verify the already-working behaviour while here).
+- Build (`-Werror`), ctest, scenarios, ESP32 build, KPI (record the multi-layer tick).
+- Bench: two layers on the S3, blend modes + opacity live-adjusted, no reboot.
+
+## Staging (start small, grow)
+1. **Additive-only, opacity 255**, 2 layers → proves the composite loop end-to-end (smallest beautiful increment; uses the existing blendMap additive path almost unchanged).
+2. **Opacity** (alpha-over) — the per-pixel alpha path + the opacity control.
+3. **blendMode control + UI** — select between alpha/additive per layer.
+4. **Docs present-tense + backlog removal**; performance.md multi-layer numbers.
+5. (later) more blend modes (multiply/screen) when wanted.
+
+## Out of scope
+- Per-layer coordinate offset (separate backlog item — layers still share the coordinate box today).
+- More blend modes beyond alpha/additive (later).
+- Multi-layer UI beyond the per-layer controls (the "tab/accordion to switch layers" UI note in backlog-core.md:347 stays backlog).
diff --git a/docs/history/plans/Plan-20260625 - RegionModifier (start-end carving).md b/docs/history/plans/Plan-20260625 - RegionModifier (start-end carving).md
new file mode 100644
index 0000000..00c6084
--- /dev/null
+++ b/docs/history/plans/Plan-20260625 - RegionModifier (start-end carving).md	
@@ -0,0 +1,81 @@
+# Plan — RegionModifier (start/end region carving)
+
+**Date:** 2026-06-25
+**Branch:** next-iteration
+
+## Goal
+
+Make per-Layer start/end region carving functional: a Layer can render its effect into only a sub-region of the physical bounding box (e.g. start `0,0,0` → end `50,50,0` writes only the top-left quarter; the rest stays dark). Coordinates are **percentages** of the physical width/height/depth, not absolute pixels.
+
+## Decision: implement as a modifier, not as Layer::rebuildLUT logic
+
+The six `startX/Y/Z`, `endX/Y/Z` controls currently live on `Layer` as **dead state** (persisted, surfaced in the UI, but `rebuildLUT()` ignores them). The original spec planned to wire them into `rebuildLUT`. The better solution, chosen with the product owner: a **`RegionModifier`** — a static modifier carrying the six percentage controls.
+
+Why the modifier path wins (per § Principles):
+
+- **Zero core change.** `Layer::rebuildLUT()` already runs the first enabled modifier through `logicalDimensions()` + `mapToPhysical()`. Carving is exactly those two operations, so it rides the existing path — no new branch in the most complex core file.
+- **Fast path is free.** The product owner's hard constraint: full region (0,0,0→100,100,100) must cost nothing. With a modifier, *full region = no modifier present* → the existing identity-memcpy / dense fast path runs byte-identical. There is no carving code in the hot path or the no-modifier build path at all.
+- **Minimalism / subtraction.** Net: **delete** six dead controls + their wiring from `Layer.h`; **add** one ~60-line modifier mirroring `CheckerboardModifier`. Reuses a recognisable shape (a crop/region node in any compositor).
+- **Composes with modifier chaining** (backlog item): carving-as-a-modifier *is* the composition story — once chaining lands, Region + Mirror + Rotate stack.
+
+Behaviour (product owner confirmed): **drop outside.** Lights outside the region get no physical destination (`outCount = 0`, the same mask path `CheckerboardModifier` uses). The logical box shrinks to the region size, so the effect only renders the carved region; the rest of the layer is dark. `maxMultiplier() == 1` (1:1 inside, 1:0 outside — never fans out).
+
+## Rounding rule (from the existing spec, Layer.md § start/end)
+
+> **Shipped differently:** during implementation the product owner chose a **half-open `[start, end)`** interval (end exclusive) so abutting regions tile exactly, instead of the inclusive rule sketched below. The authoritative rule is in `RegionModifier.h` / `RegionModifier.md`; the inclusive version here is the original intent, kept as the design record.
+
+Per axis, percentage → pixel:
+- `startPixel = floor(start% / 100 · W)`
+- `endPixel   = ceil (end%  / 100 · W)`, treated as an **inclusive** last pixel
+- region width on that axis = `endPixel − startPixel + 1`
+
+Clamp `startPixel` to `[0, W−1]` and `endPixel` to `[startPixel, W−1]` so a region is always ≥1 pixel and never runs off the box. (Negative / >100 percentages are legal on the wire — they clamp to the box here; a future drag-off-screen use reads them raw, but carving clamps.)
+
+Spec example: start=33, end=66 on a 4-wide axis → start `floor(1.32)=1`, end `ceil(2.64)=3` → pixels 1..3 inclusive (width 3). Default start=0,end=100 → 0..(W−1) = full width (identity).
+
+## Files
+
+### New: `src/light/modifiers/RegionModifier.h` (~60 lines)
+
+Mirror `CheckerboardModifier.h`:
+- Controls: `startX, startY, startZ` (default 0), `endX, endY, endZ` (default 100), all `addInt16` (negative/>100 legal on the wire, clamped in the math).
+- `maxMultiplier() == 1`.
+- `dimensions()` — advisory chip; D3 (it can carve any axis).
+- A private `axisRange(pct_start, pct_end, physExtent) -> {startPixel, count}` helper applying the rounding rule + clamp, used by both `logicalDimensions` and `mapToPhysical` so the two can't drift.
+- `logicalDimensions()`: `logW/H/D = count` per axis (the region size).
+- `mapToPhysical(lx,ly,lz, physW,physH,physD, ...)`: translate region-local `(lx,ly,lz)` to box coordinate `(lx+startPixelX, ly+startPixelY, lz+startPixelZ)`, emit the single box index, `outCount = 1`. (Always in-bounds because `logicalDimensions` already sized the logical box to the clamped region — no per-cell drop needed; the "drop outside" is achieved by the logical box being smaller, exactly like a Mirror shrinks it.)
+
+### Edit: `src/light/layers/Layer.h`
+
+- **Remove** `startX/Y/Z`, `endX/Y/Z` fields, their `addInt16` calls in `onBuildControls`, and the long start/end comment block (lines ~21-48). Keep `blendMode`/`opacity` (unrelated, live).
+- No other change — `rebuildLUT` already handles modifiers.
+
+### Edit: module factory / registration
+
+- Register `RegionModifier` in the factory next to the other modifiers (`CheckerboardModifier`, `MultiplyModifier`, …) so it's addable in the UI and round-trips through persistence/types.
+
+### Docs
+
+- `docs/moonmodules/light/RegionModifier.md` — new spec page (controls, percent semantics, rounding rule, drop-outside, prior art: a crop/region node; MoonLight has no direct equivalent but its modifier model is the lineage). Mention every control name (spec-check requirement).
+- `docs/moonmodules/light/Layer.md` — delete the `## start/end controls` section; replace with a one-line pointer: region carving is a modifier ([RegionModifier](RegionModifier.md)), not a Layer control. Update the § Status paragraph (it currently says "start/end region carving" reshapes the logical box — still true, but now via the modifier).
+- `docs/architecture.md` § Effects (line ~362) — the Layer determines buffer dims from "the Layouts, its own start/end percentages, and its modifiers"; change to "the Layouts and its modifiers (region carving among them)".
+- `docs/architecture.md` § Layers and Layer — note RegionModifier as a built-in carve modifier if the modifier list is enumerated.
+- Remove the now-shipped backlog reference to start/end region carving (Layer.md pointed at backlog/README; if backlog has an item, delete it per *Mandatory subtraction*).
+
+### Tests
+
+- `test/unit/light/unit_RegionModifier.cpp`:
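+  - `logicalDimensions`: 0/100 → full box (identity); 0/50 on 128 → 64 (the count under the shipped half-open rule; the inclusive rule sketched above would give pixels 0..64 = 65); the spec's 33/66-on-4 → start 1, count 3; clamp of end=100 to W−1 (no off-box overflow); clamp of a >100 / negative percentage.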
+  - `mapToPhysical`: a region-local (0,0,0) maps to the box index at the start offset; the last region cell maps to the correct box index; never emits an out-of-box index.
+  - `axisRange` edge cases: W=1 (degenerate axis stays 1), W=0 (no crash).
+- `test/unit/light/unit_Layers_container.cpp` or a Layer carving case: add a Layer with a RegionModifier, build, assert the logical box (`width_×height_×depth_`) equals the region and the driver buffer only carries the region's lights (rest dark). Reuse the existing CaptureDriver fixture.
+- Scenario: extend an existing pipeline scenario (or a small new `scenario_RegionModifier`) — add a RegionModifier at 0,0→50,50, assert the tick passes its gate and the buffer is non-zero only in the carved region. (Construct-mode can't set_control post-scheduler, so use the modifier's default region or a fixture that builds it with the region preset — mirror how `scenario_MultiplyModifier_pipeline` handles defaults.)
+
+## Fast-path guarantee (the product owner's constraint)
+
+No RegionModifier on a Layer → `rebuildLUT` takes the no-modifier branch → identity memcpy (dense natural-order) or the sparse box→driver LUT, exactly as today. The carving code is never reached. Even an *added* full-region (0/100) RegionModifier produces an identity logical box and a 1:1 offset-0 map — correct, just not the absolute cheapest; the cheap path is "don't add it," which is the default.
+
+## Out of scope
+
+- Modifier **chaining** (Region + another modifier composed) — separate backlog item. Today only the first enabled modifier applies, so a Layer uses *either* Region *or* another modifier until chaining lands.
+- Negative / >100 "drag off-screen" semantics beyond clamping — the wire type allows them; carving clamps to the box. Revisit if a real drag-off-screen feature needs the raw values.
diff --git a/docs/history/v1-inventory.md b/docs/history/v1-inventory.md
index a3db28a..e0ca22a 100644
--- a/docs/history/v1-inventory.md
+++ b/docs/history/v1-inventory.md
@@ -119,7 +119,7 @@ This is a throwaway reference document — not committed. Used to decide what to
 
 ### Detailed reverse-engineering (the v1 frontend at 1.4.0)
 
-The v1 `index.html` was fully reverse-engineered. The notes below capture mechanisms worth not rediscovering and, where v3 chose differently, why. The **forward-looking** UI gap analysis (what to still adopt) lives in [backlog/ui-deferred.md](../backlog/ui-deferred.md).
+The v1 `index.html` was fully reverse-engineered. The notes below capture mechanisms worth not rediscovering and, where v3 chose differently, why. The **forward-looking** UI gap analysis (what to still adopt) lives in the [backlog](../backlog/README.md) (UI chapter of backlog-core.md).
 
 **Engine-side data fields v1 exposed that v3 doesn't (yet):**
 - `setup_ok` (bool) + `health` (string) per module — drove a setup-dot colour and tooltip. v3 would add `bool setupOk()` + `const char* health()` to MoonModule when a real failure mode exists.
diff --git a/docs/install/index.html b/docs/install/index.html
index 1ff7ba8..fa5aa6f 100644
--- a/docs/install/index.html
+++ b/docs/install/index.html
@@ -14,481 +14,10 @@
        shadow DOM). The install flow is now driven by
        ./install-orchestrator.js — esptool-js for flash + improv-wifi-serial-sdk
        for WiFi provisioning, both sharing the SerialPort we own end-to-end.
-       The orchestrator is imported by the inline module script at the
-       bottom of <body>; no top-level <script> needed. -->
+       The orchestrator is imported by ./install.js (the page's module script,
+       loaded at the bottom of <body>). -->
 
-  <style>
-    :root {
-      --bg:     #1a1a2e;
-      --card:   #16213e;
-      --fg:     #e0e0e0;
-      --muted:  #a0a0b0;
-      --accent: #a78bfa;
-      --border: #2a3a6a;
-      --ok:     #57c97a;   /* green  — "active" capability (supported + a module configured in deviceModels.json) */
-      --sup:    #e3c84a;   /* yellow — "supported" capability (firmware supports it, not pre-configured) */
-      --plan:   #e8923a;   /* orange — "planned" capability (no module yet; greener than red, by design) */
-    }
-    * { box-sizing: border-box; }
-    body {
-      margin: 0;
-      min-height: 100vh;
-      background: var(--bg);
-      color: var(--fg);
-      font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
-      font-size: 15px;
-      line-height: 1.55;
-      display: flex;
-      flex-direction: column;
-      align-items: center;
-      padding: 24px 16px 64px;
-    }
-    main { width: 100%; max-width: 640px; }
-    .help-link {
-      display: inline-block;
-      margin-left: 8px;
-      width: 22px; height: 22px; line-height: 22px;
-      text-align: center;
-      font-size: 14px; font-weight: 600;
-      vertical-align: middle;
-      color: var(--accent);
-      border: 1px solid var(--border);
-      border-radius: 50%;
-      text-decoration: none;
-    }
-    .help-link:hover { border-color: var(--accent); }
-    .version-chip {
-      display: inline-block;
-      margin-left: 8px;
-      padding: 2px 8px;
-      background: var(--card);
-      color: var(--muted);
-      border: 1px solid var(--border);
-      border-radius: 4px;
-      font-size: 13px;
-      font-weight: normal;
-      vertical-align: middle;
-    }
-    h1 {
-      margin: 0 0 8px;
-      font-size: 28px;
-      color: var(--accent);
-    }
-    p.tag { margin: 0 0 24px; color: var(--muted); }
-    .card {
-      background: var(--card);
-      border: 1px solid var(--border);
-      border-radius: 8px;
-      padding: 20px;
-      margin-bottom: 16px;
-    }
-    label { display: block; font-weight: 600; margin-bottom: 6px; }
-    select {
-      width: 100%;
-      padding: 10px 12px;
-      background: var(--bg);
-      color: var(--fg);
-      border: 1px solid var(--border);
-      border-radius: 6px;
-      font: inherit;
-    }
-    .button-row { margin-top: 16px; }
-    .note { color: var(--muted); font-size: 13px; margin-top: 10px; }
-    /* `.windows-only` elements are `hidden` by default in the HTML; the tiny
-       userAgent check at the top of <body> below removes `hidden` only on
-       Windows. Inverse to a CSS-only approach because CSS can't detect the
-       host OS — `[hidden]` already wins specificity-wise. */
-    .erase-row { margin-top: 12px; font-size: 13px; }
-    .erase-row label { cursor: pointer; }
-    .erase-row input { vertical-align: middle; margin-right: 6px; }
-    .erase-note { display: inline; margin-top: 0; }
-    a { color: var(--accent); }
-    code {
-      background: rgba(255,255,255,0.06);
-      padding: 1px 6px;
-      border-radius: 3px;
-      font-size: 13px;
-    }
-    .browser-warning {
-      background: #3a2a1a;
-      border: 1px solid #6a4a2a;
-      color: #e6c890;
-      display: none;
-    }
-    ol { padding-left: 22px; }
-    ol li { margin-bottom: 6px; }
-    .credits {
-      max-width: 720px;
-      margin: 32px auto 24px;
-      padding: 0 16px;
-      text-align: center;
-      border-top: 1px solid var(--border);
-      padding-top: 16px;
-    }
-    .credits .note { margin-top: 0; }
-
-    /* Minimal mirror of the device UI's control-row shape so the shared
-       install-picker module (src/ui/install-picker.js) renders the same
-       way on the installer page. The picker emits `.control-row` + child
-       `<select>` markup; without these rules the rows wouldn't lay out. */
-    .control-row {
-      display: flex;
-      align-items: center;
-      gap: 12px;
-      margin: 10px 0;
-    }
-    .control-label {
-      flex: 0 0 80px;
-      font-weight: 600;
-      color: var(--muted);
-    }
-    .control-row select { flex: 1; }
-
-    /* the shared picker still renders its own board <select>
-       (#rp-board) — we keep it (so its change-listener wires) but hide its row;
-       the picture grid above drives it. The row is the .control-row that
-       contains #rp-board. */
-    .control-row:has(#rp-board) { display: none; }
-
-    /* Picture board grid — collapsed by default (a control-row field), expands
-       on click. The summary button is the row's field, so it flexes like the
-       selects (flex: 1) to line up with USB Port / Release / Firmware. */
-    #board-summary {
-      flex: 1; display: flex; align-items: center; justify-content: space-between;
-      gap: 12px; padding: 10px 12px; background: var(--bg); color: var(--fg);
-      border: 1px solid var(--border); border-radius: 6px; font: inherit;
-      cursor: pointer; text-align: left;
-    }
-    #board-summary:hover { border-color: var(--accent); }
-    .board-summary-left { display: flex; align-items: center; gap: 10px; min-width: 0; }
-    .board-summary-thumb {
-      width: 36px; height: 24px; border-radius: 3px; flex-shrink: 0;
-      background: #0e1020 center/contain no-repeat; border: 1px solid var(--border);
-    }
-    #board-summary-label { overflow: hidden; text-overflow: ellipsis; white-space: nowrap; }
-    .board-summary-caret { color: var(--muted); transition: transform .15s; flex-shrink: 0; }
-    #board-summary[aria-expanded="true"] .board-summary-caret { transform: rotate(180deg); }
-    /* The expanded grid breaks out full-width below the row (aligns with the
-       field column by offsetting the label width + gap). */
-    #board-expand { margin: 0 0 10px 92px; }
-    .board-grid-controls { display: flex; align-items: center; gap: 12px; margin-bottom: 12px; flex-wrap: wrap; }
-    #board-search {
-      flex: 1; min-width: 160px; padding: 8px 10px; background: var(--bg);
-      color: var(--fg); border: 1px solid var(--border); border-radius: 6px; font: inherit;
-    }
-    .board-clear {
-      background: transparent; color: var(--muted); border: 1px solid var(--border);
-      border-radius: 6px; padding: 8px 12px; font: inherit; font-size: 13px; cursor: pointer;
-    }
-    .board-clear:hover { color: var(--fg); border-color: var(--accent); }
-    .board-filter-notice { color: var(--muted); font-size: 12px; margin-bottom: 10px; }
-    .board-filter-notice button {
-      background: none; border: none; color: var(--accent); font: inherit; font-size: 12px;
-      cursor: pointer; padding: 0; text-decoration: underline;
-    }
-    #board-grid { max-height: 420px; overflow-y: auto; }   /* expanded grid scrolls, not the page */
-    #board-grid {
-      display: grid; grid-template-columns: repeat(auto-fill, minmax(150px, 1fr)); gap: 10px;
-    }
-    .bg-chip-label {
-      grid-column: 1 / -1; color: var(--muted); font-size: 11px; text-transform: uppercase;
-      letter-spacing: .06em; margin: 6px 0 0;
-    }
-    .bg-card {
-      background: var(--bg); border: 1px solid var(--border); border-radius: 8px;
-      overflow: hidden; cursor: pointer; transition: border-color .12s, background .12s;
-      display: flex; flex-direction: column;
-    }
-    .bg-card:hover { border-color: var(--accent); }
-    .bg-card.selected { border-color: var(--accent); box-shadow: 0 0 0 1px var(--accent) inset; }
-    .bg-thumb {
-      aspect-ratio: 16 / 10; background: #0e1020 center/contain no-repeat;
-      display: flex; align-items: center; justify-content: center;
-      color: var(--muted); font-size: 10px; border-bottom: 1px solid var(--border);
-    }
-    .bg-thumb.noimg::after { content: "no photo"; }
-    .bg-body { padding: 8px 9px; display: flex; flex-direction: column; gap: 3px; }
-    .bg-name { font-weight: 600; font-size: 12px; line-height: 1.2; }
-    .bg-meta { color: var(--muted); font-size: 11px; }
-    /* Capability chips: supported (green) vs planned (orange) — distinguished by
-       colour, not by extra text. Labels are kept short in deviceModels.json so every
-       chip fits the ~150px card; the full label + state is in the chip's title
-       tooltip. */
-    .bg-caps { display: flex; flex-wrap: wrap; gap: 3px; margin-top: 3px; }
-    .bg-cap {
-      font-size: 9px; line-height: 1.5; padding: 0 5px; border-radius: 999px;
-      max-width: 100%; overflow: hidden; text-overflow: ellipsis; white-space: nowrap;
-    }
-    .bg-cap.act { background: color-mix(in srgb, var(--ok) 18%, transparent); color: var(--ok); }
-    .bg-cap.sup { background: color-mix(in srgb, var(--sup) 20%, transparent); color: var(--sup); }
-    .bg-cap.plan { background: color-mix(in srgb, var(--plan) 20%, transparent); color: var(--plan); }
-    .bg-link { color: var(--accent); font-size: 11px; text-decoration: none; }
-    .bg-link:hover { text-decoration: underline; }
-
-    /* Board-details popup — native <dialog> (standard modal pattern: built-in
-       backdrop, ESC-to-close, focus trap; no bespoke modal JS). Shows the full
-       deviceModels.json entry as a readable summary plus a collapsible raw-JSON block. */
-    #board-details::backdrop { background: rgba(0,0,0,0.6); }
-    #board-details {
-      background: var(--card); color: var(--fg);
-      border: 1px solid var(--border); border-radius: 10px;
-      padding: 0; max-width: 560px; width: calc(100% - 32px);
-      max-height: 80vh; overflow: auto;
-    }
-    .bd-head {
-      display: flex; align-items: baseline; justify-content: space-between;
-      gap: 12px; padding: 16px 18px 8px;
-    }
-    .bd-title { font-size: 16px; font-weight: 600; }
-    .bd-close {
-      background: none; border: none; color: var(--muted);
-      font-size: 20px; line-height: 1; cursor: pointer; padding: 0 4px;
-    }
-    .bd-close:hover { color: var(--fg); }
-    .bd-body { padding: 0 18px 18px; }
-    .bd-row { display: flex; gap: 8px; padding: 3px 0; font-size: 13px; }
-    .bd-key { color: var(--muted); min-width: 92px; }
-    .bd-val { flex: 1; min-width: 0; word-break: break-word; }
-    .bd-section { margin-top: 14px; font-weight: 600; font-size: 13px; }
-    .bd-mod { margin-top: 8px; padding-left: 10px; border-left: 2px solid var(--border); }
-    .bd-mod-name { font-size: 13px; }
-    .bd-mod-name .bd-mod-id { color: var(--muted); font-weight: normal; }
-    .bd-ctrl { font-size: 12px; color: var(--muted); padding-left: 8px; }
-    .bd-ctrl code { font-size: 11px; }
-    .bd-raw { margin-top: 16px; }
-    .bd-raw summary { cursor: pointer; color: var(--accent); font-size: 12px; }
-    .bd-raw pre {
-      margin: 8px 0 0; padding: 10px; background: var(--bg);
-      border: 1px solid var(--border); border-radius: 6px;
-      font-size: 11px; overflow: auto; white-space: pre;
-    }
-    .bg-link.bg-details { cursor: pointer; }
-
-    .action-btn {
-      background: var(--accent);
-      color: var(--bg);
-      border: none;
-      border-radius: 6px;
-      padding: 10px 20px;
-      font: inherit;
-      font-weight: 600;
-      cursor: pointer;
-    }
-    .action-btn:disabled { opacity: 0.5; cursor: not-allowed; }
-    .rp-status { color: var(--muted); font-size: 13px; }
-    .rp-status-row { min-height: 1.5em; }
-
-    /* Inline spinner shown in a field while its data is still being fetched
-       (install-picker renderSkeleton). A 1em spinning ring, sized to sit next
-       to the select's "Loading…" placeholder. */
-    .rp-spinner {
-      display: inline-block;
-      width: 1em; height: 1em;
-      vertical-align: -0.15em;
-      margin-right: 0.4em;
-      border: 2px solid var(--muted);
-      border-top-color: transparent;
-      border-radius: 50%;
-      animation: rp-spin 0.7s linear infinite;
-    }
-    @keyframes rp-spin { to { transform: rotate(360deg); } }
-
-    /* "Your devices" card — one row per provisioned device. The row
-       is the picker's `.control-row` flex shape with the device info
-       on the left and action buttons on the right. */
-    .device-row {
-      justify-content: space-between;
-      padding: 8px 0;
-      border-top: 1px solid rgba(255,255,255,0.06);
-    }
-    .device-row:first-child { border-top: 0; }
-    .device-info { min-width: 0; flex: 1; }
-    .device-url {
-      display: block;
-      font-family: ui-monospace, monospace;
-      color: var(--muted);
-      font-size: 12px;
-      text-decoration: none;
-      overflow: hidden;
-      text-overflow: ellipsis;
-      white-space: nowrap;
-    }
-    .device-url:hover { color: var(--accent); text-decoration: underline; }
-    .device-seen { color: var(--muted); font-size: 12px; margin-top: 2px; }
-    .device-actions { display: flex; gap: 6px; flex-shrink: 0; }
-    .device-btn {
-      background: transparent;
-      color: var(--accent);
-      border: 1px solid var(--accent);
-      border-radius: 4px;
-      padding: 4px 10px;
-      font: inherit;
-      font-size: 12px;
-      cursor: pointer;
-    }
-    .device-model-name { color: var(--fg); font-size: 12px; margin-top: 2px; }
-    .device-btn:hover { background: rgba(123, 158, 255, 0.08); }
-
-    /* Install modal — backdrop + centered card. Replaces the ESP Web Tools
-       <esp-web-install-button> shadow-DOM dialog. Sections show one at a
-       time via .install-section.active. */
-    .install-backdrop {
-      position: fixed; inset: 0;
-      background: rgba(0, 0, 0, 0.65);
-      display: none;
-      align-items: center;
-      justify-content: center;
-      z-index: 1000;
-    }
-    .install-backdrop.open { display: flex; }
-    .install-modal {
-      background: var(--card);
-      border: 1px solid var(--border);
-      border-radius: 8px;
-      padding: 24px;
-      max-width: 480px;
-      width: calc(100% - 32px);
-      box-shadow: 0 8px 32px rgba(0, 0, 0, 0.5);
-    }
-    .install-modal h2 {
-      margin: 0 0 16px;
-      font-size: 20px;
-      color: var(--accent);
-    }
-    .install-section { display: none; }
-    .install-section.active { display: block; }
-    .install-status { margin: 8px 0; color: var(--muted); }
-    .install-done-note { margin: 4px 0 10px; font-size: 13px; color: var(--muted); }
-    /* Notice variant — for a flashed-OK-but-action-needed outcome (e.g. eth-only firmware
-       waiting on a cable). Amber, like the "supported" capability chip (var(--sup)): reads as
-       "do this next", not a plain note and not a red error. */
-    .install-done-note.install-done-note--notice {
-      color: var(--sup);
-      background: color-mix(in srgb, var(--sup) 12%, transparent);
-      border-left: 3px solid var(--sup);
-      padding: 8px 10px; border-radius: 4px;
-    }
-    .install-warn { color: #d4a052; font-size: 12px; margin-top: 8px; }
-    .install-progress {
-      height: 8px;
-      background: var(--bg);
-      border-radius: 4px;
-      overflow: hidden;
-      margin: 12px 0;
-    }
-    .install-progress-bar {
-      height: 100%;
-      background: var(--accent);
-      width: 0;
-      transition: width 0.2s;
-    }
-    /* Indeterminate state — esptool-js's eraseFlash() doesn't report
-       progress (12 s of "wait and hope"), so we animate a marquee-style
-       bar to confirm the page hasn't hung. Toggled by adding the
-       .indeterminate class to .install-progress-bar; width set to 100%
-       so the animation has something to clip. */
-    .install-progress-bar.indeterminate {
-      width: 100%;
-      background: linear-gradient(
-        90deg,
-        var(--bg) 0%,
-        var(--accent) 40%,
-        var(--accent) 60%,
-        var(--bg) 100%);
-      background-size: 200% 100%;
-      animation: install-marquee 1.4s linear infinite;
-      transition: none;
-    }
-    @keyframes install-marquee {
-      from { background-position: 100% 0; }
-      to   { background-position: -100% 0; }
-    }
-    .install-form label {
-      display: block;
-      margin: 12px 0 4px;
-      font-size: 13px;
-      color: var(--muted);
-    }
-    .install-form input[type="text"],
-    .install-form input[type="password"] {
-      width: 100%;
-      padding: 8px 12px;
-      background: var(--bg);
-      color: var(--fg);
-      border: 1px solid var(--border);
-      border-radius: 6px;
-      font: inherit;
-    }
-    .install-actions {
-      display: flex;
-      gap: 8px;
-      justify-content: flex-end;
-      margin-top: 16px;
-    }
-    .install-actions button {
-      padding: 8px 16px;
-      font: inherit;
-      font-weight: 600;
-      border: 0;
-      border-radius: 6px;
-      cursor: pointer;
-    }
-    .install-actions button.primary {
-      background: var(--accent);
-      color: #1a1a2e;
-    }
-    .install-actions button.secondary {
-      background: transparent;
-      color: var(--fg);
-      border: 1px solid var(--border);
-    }
-    .install-error {
-      color: #f8a5a5;
-      font-size: 13px;
-      margin: 12px 0;
-      white-space: pre-wrap;
-      word-break: break-word;
-    }
-    .install-success-url {
-      display: block;  /* IP and <name>.local each on their own line */
-      width: fit-content;
-      margin-top: 8px;
-      color: var(--accent);
-      text-decoration: none;
-      font-family: ui-monospace, monospace;
-    }
-    .install-success-url:hover { text-decoration: underline; }
-    .install-log-wrap {
-      margin-top: 16px;
-      border-top: 1px solid var(--border);
-      padding-top: 12px;
-    }
-    .install-log-toggle {
-      background: transparent;
-      color: var(--muted);
-      border: 0;
-      padding: 0;
-      cursor: pointer;
-      font: inherit;
-      font-size: 12px;
-      text-decoration: underline;
-    }
-    .install-log-toggle:hover { color: var(--fg); }
-    .install-log {
-      margin-top: 8px;
-      max-height: 240px;
-      overflow: auto;
-      background: var(--bg);
-      color: var(--muted);
-      font-family: ui-monospace, monospace;
-      font-size: 11px;
-      padding: 8px;
-      border: 1px solid var(--border);
-      border-radius: 4px;
-      white-space: pre-wrap;
-      word-break: break-all;
-    }
-  </style>
+  <link rel="stylesheet" href="./install.css">
 </head>
 <body>
   <!-- Reveal the Windows-CH340 BOOT-button hints (the `.windows-only`
@@ -499,13 +28,6 @@
        no third-party UA parser pulled in for one boolean. The install
        modal is hidden by default, so the toggle happens off-screen and
        there's no flash-of-visible-content concern. -->
-  <script>
-    document.addEventListener('DOMContentLoaded', () => {
-      if (/Windows/i.test(navigator.userAgent)) {
-        document.querySelectorAll('.windows-only').forEach(el => el.hidden = false);
-      }
-    });
-  </script>
   <main>
     <h1>projectMM Installer <span class="version-chip" id="version-chip" hidden></span>
       <a class="help-link" href="https://github.com/MoonModules/projectMM/blob/main/docs/install/README.md"
@@ -875,1206 +397,6 @@ <h2>Serial monitor</h2>
     </div>
   </div>
 
-  <script type="module">
-    // Shared install-picker (release → board → firmware). Same file as the
-    // on-device OTA UI uses; only the onInstall callback differs:
-    //   - Device UI: POST the chosen .bin URL to /api/firmware/url; device
-    //     fetches the binary directly via esp_https_ota.
-    //   - Web installer (here): hand the manifest URL to the orchestrator,
-    //     which flashes via esptool-js then provisions WiFi via Improv,
-    //     all over the same SerialPort.
-    //
-    // Manifests + binaries must be same-origin with this page (Web Serial
-    // would happily flash from any URL, but the manifest fetch + part
-    // downloads via fetch() are subject to CORS). The release workflow
-    // self-hosts the last N releases into pages/install/releases/<tag>/.
-    // toLocalUrl rewrites the picker's absolute GitHub URLs to the local
-    // copies before handing them to the orchestrator.
-    import { installPicker } from "./install-picker.js";
-    import { myDevices }    from "./devices.js";
-    import { installer }    from "./install-orchestrator.js";
-    // Board catalog + chip detection — web-installer only, kept out of the
-    // firmware-embedded install-picker.js and injected here via boardSupport.
-    import * as boardSupport from "./install-picker-boards.js";
-
-    // Show the project version next to the heading. library.json ships
-    // alongside index.html (preview_installer.py + release.yml both copy
-    // it). Fetch silently — if it's missing for any reason, leave the
-    // chip hidden rather than rendering "?" noise.
-    (async () => {
-        try {
-            const res = await fetch("./library.json");
-            if (!res.ok) return;
-            const lib = await res.json();
-            if (!lib || !lib.version) return;
-            const chip = document.getElementById("version-chip");
-            chip.textContent = `v${lib.version}`;
-            chip.hidden = false;
-        } catch (_) { /* silent: cosmetic-only */ }
-    })();
-
-    // Map a GitHub release-asset URL to its Pages-hosted mirror.
-    //   https://github.com/MoonModules/projectMM/releases/download/<TAG>/<file>
-    //   → ./releases/<TAG>/<file>
-    function toLocalUrl(githubUrl) {
-      const m = /\/releases\/download\/([^/]+)\/([^/]+)$/.exec(githubUrl);
-      if (!m) return githubUrl;  // unrecognised shape: pass through unchanged
-      const [, tag, name] = m;
-      //   https://github.com/.../releases/download/<TAG>/<file>
-      //   → ./releases/<TAG>/<file>  (same-origin, served from this dir)
-      return `./releases/${tag}/${name}`;
-    }
-
-    // --- Install modal section toggling ---------------------------------
-    const backdrop = document.getElementById("install-backdrop");
-    const title = document.getElementById("install-title");
-    const sections = {
-      connecting:   document.getElementById("section-connecting"),
-      wrongPort:    document.getElementById("section-wrong-port"),
-      flashing:     document.getElementById("section-flashing"),
-      wifiForm:     document.getElementById("section-wifi-form"),
-      provisioning: document.getElementById("section-provisioning"),
-      needsIp:      document.getElementById("section-needs-ip"),
-      done:         document.getElementById("section-done"),
-      error:        document.getElementById("section-error"),
-    };
-    function showSection(name) {
-      for (const [k, el] of Object.entries(sections)) {
-        el.classList.toggle("active", k === name);
-      }
-    }
-    function openModal(titleText) {
-      title.textContent = titleText;
-      backdrop.classList.add("open");
-      // Reset the log per install session so users see only the current run.
-      document.getElementById("install-log").textContent = "";
-      // Reset toggle to collapsed state.
-      const log = document.getElementById("install-log");
-      const toggle = document.getElementById("log-toggle");
-      log.hidden = true;
-      toggle.textContent = "Show log";
-      // Reset the needs-ip dialog to its idle state — covers the case where
-      // a prior install ended in retry-success (which leaves the disabled +
-      // spinner state intact, since the WiFi-creds form took over the
-      // visible card) and the next install hits the needs-ip path again.
-      showNeedsIpRetrying(false);
-      // Lock out the monitor button while an install runs. Web Serial
-      // grants exclusive port access; a Monitor click mid-flash would
-      // race the install for the SerialPort and either steal it
-      // (corrupting the flash) or get a misleading "already open" error.
-      // closeModal re-enables.
-      monitorBtn.disabled = true;
-      // Guard against accidental tab-close mid-flash. Browser shows a
-      // generic "leave site?" prompt (Chrome ignores the custom text since
-      // 2017 — security hardening). disarmUnloadGuard() runs on done /
-      // error / cancel so the user can close the page when it's safe.
-      armUnloadGuard();
-    }
-    function closeModal() {
-      backdrop.classList.remove("open");
-      disarmUnloadGuard();
-      monitorBtn.disabled = false;
-      // Wipe the password field on every modal close — success, cancel,
-      // or error. The form is built lazily and re-used across installs in
-      // the same page session; without this the typed password lingers
-      // in the live `.value`. (We don't clear `defaultValue` — it stayed
-      // as the form's initial empty string from buildWifiForm's innerHTML
-      // assignment; setting `.value` clears the rendered value, which is
-      // the only thing visible to a script reading the DOM after close.)
-      // Same wipe runs at the start of each `wifi-creds-form` show, but
-      // having both belts ensures the wipe runs even when the user
-      // bypasses the form via Skip or the install fails before reaching
-      // the creds step.
-      const passEl = document.getElementById("wifi-password");
-      if (passEl) passEl.value = "";
-    }
-    let unloadGuard = null;
-    function armUnloadGuard() {
-      if (unloadGuard) return;
-      unloadGuard = (e) => {
-        e.preventDefault();
-        e.returnValue = "";  // legacy contract — Chrome ignores the string
-      };
-      window.addEventListener("beforeunload", unloadGuard);
-    }
-    function disarmUnloadGuard() {
-      if (!unloadGuard) return;
-      window.removeEventListener("beforeunload", unloadGuard);
-      unloadGuard = null;
-    }
-    document.getElementById("done-close").addEventListener("click", closeModal);
-    document.getElementById("error-close").addEventListener("click", closeModal);
-
-    // Board-details popup close button. The <dialog> also closes on ESC and a
-    // backdrop click (native); this wires the explicit ✕. A click on the dialog
-    // backdrop (the element itself, outside .bd-body) closes it too.
-    const bd = document.getElementById("board-details");
-    document.getElementById("bd-close").addEventListener("click", () => bd.close());
-    bd.addEventListener("click", (e) => { if (e.target === bd) bd.close(); });
-
-    // Log panel: collapsible, fed by the orchestrator's onLog callback.
-    // Auto-scrolls to bottom on append so the latest line is always visible.
-    const logEl = document.getElementById("install-log");
-    const logToggle = document.getElementById("log-toggle");
-    logToggle.addEventListener("click", () => {
-      logEl.hidden = !logEl.hidden;
-      logToggle.textContent = logEl.hidden ? "Show log" : "Hide log";
-    });
-    function appendLog(line) {
-      logEl.textContent += line + "\n";
-      logEl.scrollTop = logEl.scrollHeight;
-    }
-
-    // --- Orchestrator UI bindings --------------------------------------
-    // Mapping from orchestrator's progress stage → which modal section to
-    // show + any per-stage detail rendering. Centralizes the UI ↔ flow
-    // contract so the orchestrator stays UI-agnostic.
-    function handleProgress(stage, detail) {
-      switch (stage) {
-        case "request-port":
-          showSection("connecting");
-          document.getElementById("connecting-detail").textContent =
-            "Pick the serial port the device is connected to.";
-          break;
-        case "wrong-port-retry":
-          // Distinct section with a Try-again button gates the OS-picker
-          // re-prompt so the user reads the guidance BEFORE the OS modal
-          // covers the page (the picker's a native dialog, no way around
-          // its overlay; if we just updated connecting-detail and went
-          // straight to requestPort(), the message would never be seen).
-          showSection("wrongPort");
-          break;
-        case "connect-flash":
-          showSection("connecting");
-          document.getElementById("connecting-detail").textContent =
-            detail && detail.chipName
-              ? `Detected ${detail.chipName}`
-              : "Detecting chip…";
-          break;
-        case "fetch-firmware":
-          showSection("flashing");
-          document.getElementById("flashing-status").textContent =
-            "Downloading firmware…";
-          document.getElementById("flash-bar").style.width = "0%";
-          break;
-        case "erase": {
-          showSection("flashing");
-          document.getElementById("flashing-status").textContent =
-            "Erasing flash (this takes ~12 s)…";
-          // esptool-js's eraseFlash doesn't report progress — animate the
-          // bar so the user sees the page isn't hung. flash stage clears
-          // the class below and switches to determinate progress.
-          //
-          // Clear the inline width set by an earlier stage (fetch-firmware
-          // forces `style.width = "0%"`); inline style beats the CSS class's
-          // `width: 100%` rule, so the animation would run invisibly on a
-          // zero-width bar without this reset.
-          const bar = document.getElementById("flash-bar");
-          bar.style.width = "";
-          bar.classList.add("indeterminate");
-          break;
-        }
-        case "flash": {
-          showSection("flashing");
-          const pct = detail && typeof detail.pct === "number" ? detail.pct : 0;
-          const bar = document.getElementById("flash-bar");
-          bar.classList.remove("indeterminate");
-          document.getElementById("flashing-status").textContent =
-            `Writing firmware… ${pct}%`;
-          bar.style.width = `${pct}%`;
-          break;
-        }
-        case "reboot":
-          showSection("connecting");
-          document.getElementById("connecting-detail").textContent =
-            "Rebooting device…";
-          break;
-        case "connect-improv":
-          showSection("connecting");
-          document.getElementById("connecting-detail").textContent =
-            "Connecting over Improv…";
-          break;
-        case "wifi-creds-form": {
-          buildWifiForm();
-          showSection("wifiForm");
-          // Prefill the last-used SSID (not password — that stays out of
-          // localStorage as a privacy / security-scanner concession). Focus
-          // password if SSID is prefilled (user only needs to type the
-          // password), else focus SSID.
-          const ssidEl = document.getElementById("wifi-ssid");
-          const passEl = document.getElementById("wifi-password");
-          // Clear the password input on every show. The form is built
-          // lazily once and re-used across multiple installs in the same
-          // page session; without this clear, a re-install would show the
-          // previous install's typed password in plaintext (well, dotted)
-          // inside the field. Don't leave that sitting in the DOM longer
-          // than the active install.
-          passEl.value = "";
-          try {
-            const saved = localStorage.getItem("projectMM.installer.lastSsid");
-            if (saved) ssidEl.value = saved;
-          } catch (_) { /* hostile storage */ }
-          requestAnimationFrame(() => (ssidEl.value ? passEl : ssidEl).focus());
-          break;
-        }
-        case "provisioning":
-          showSection("provisioning");
-          document.getElementById("provisioning-status").textContent =
-            "Connecting to your WiFi…";
-          break;
-        case "set-board":
-          showSection("provisioning");
-          document.getElementById("provisioning-status").textContent =
-            "Setting board identity…";
-          break;
-        case "apply-defaults":
-          showSection("provisioning");
-          document.getElementById("provisioning-status").textContent =
-            detail && detail.board
-              ? `Applying device defaults for ${detail.board}…`
-              : "Applying device defaults…";
-          break;
-        case "needs-ip":
-          showSection("needsIp");
-          // Focus the input so the user can start typing immediately.
-          requestAnimationFrame(() => {
-            const el = document.getElementById("needs-ip-input");
-            if (el) el.focus();
-          });
-          break;
-        case "done":
-          // onSuccess fires next; section toggles there once URL is known.
-          break;
-      }
-    }
-
-    // Render the WiFi-creds form into #section-wifi-form on first use.
-    // Idempotent — re-installs after the first run are no-ops. See the
-    // comment on #section-wifi-form's empty div for why this is deferred
-    // (avoids the macOS iCloud Passwords prompt on page load).
-    //
-    // Attributes on the injected inputs:
-    // - autocomplete="off": defeats Chrome's built-in field-fill (the
-    //   browser's own offer; not the OS keychain).
-    // - data-lpignore / data-1p-ignore: vendor opt-outs for LastPass /
-    //   1Password's browser-extension fill icons.
-    // - autocomplete="off" on the password (NOT "new-password"):
-    //   "new-password" actively signals password managers "credential
-    //   being created, offer a generated value", which is wrong here —
-    //   the user is typing their existing home-WiFi password, not
-    //   creating a new account.
-    //
-    // The OS keychain prompt (iCloud Passwords) ignores all of the above
-    // when it scans the DOM at page load; deferring the form is the only
-    // reliable way to keep it quiet until the user is actually mid-install.
-    let _wifiFormBuilt = false;
-    function buildWifiForm() {
-      if (_wifiFormBuilt) return;
-      _wifiFormBuilt = true;
-      const section = document.getElementById("section-wifi-form");
-      section.innerHTML = `
-        <div class="install-status">Flash done. Enter your WiFi credentials to provision the device.</div>
-        <form id="wifi-form" class="install-form" onsubmit="return false">
-          <label for="wifi-ssid">Network name (SSID)</label>
-          <input type="text" id="wifi-ssid" autocomplete="off"
-                 data-lpignore="true" data-1p-ignore required>
-          <label for="wifi-password">Password</label>
-          <input type="password" id="wifi-password" autocomplete="off"
-                 data-lpignore="true" data-1p-ignore>
-          <div class="install-actions">
-            <button type="button" class="secondary" id="wifi-skip">Skip</button>
-            <button type="submit" class="primary" id="wifi-connect">Connect</button>
-          </div>
-        </form>
-      `;
-    }
-
-    // Returns a Promise the orchestrator awaits — resolves when the user
-    // submits the WiFi form. The form's Connect button completes via the
-    // form's submit event; the Skip button bypasses WiFi (the device
-    // falls back to its AP). Skip resolves with empty creds — the
-    // orchestrator's provision() with empty SSID will fail fast and the
-    // user falls back to the AP flow as documented in Step 2.
-    function uiWaitForCreds() {
-      return new Promise((resolve) => {
-        const form = document.getElementById("wifi-form");
-        const ssidEl = document.getElementById("wifi-ssid");
-        const passEl = document.getElementById("wifi-password");
-        const skipBtn = document.getElementById("wifi-skip");
-
-        const onSubmit = (e) => {
-          e.preventDefault();
-          cleanup();
-          const ssid = ssidEl.value.trim();
-          // Save SSID only — password stays out of localStorage. WiFi SSIDs
-          // are network-visible anyway (any scanning device sees them);
-          // passwords are not.
-          try {
-            if (ssid) localStorage.setItem("projectMM.installer.lastSsid", ssid);
-          } catch (_) { /* hostile storage */ }
-          resolve({ ssid, password: passEl.value });
-        };
-        const onSkip = () => {
-          cleanup();
-          resolve({ ssid: "", password: "" });
-        };
-        const cleanup = () => {
-          form.removeEventListener("submit", onSubmit);
-          skipBtn.removeEventListener("click", onSkip);
-        };
-        form.addEventListener("submit", onSubmit);
-        skipBtn.addEventListener("click", onSkip);
-      });
-    }
-
-    // Returns a Promise that resolves with one of:
-    //   { action: "ip", url: "<typed value>" }    — user typed an IP + Add
-    //   { action: "skip" }                        — user clicked Skip
-    //   { action: "retry" }                       — user clicked Try Improv again
-    // Shown when the orchestrator's probe-open on the user's pre-picked
-    // port fails. The OS port picker is modal and covers the install
-    // modal, so any guidance written and immediately followed by
-    // requestPort() is invisible — gate the re-prompt behind a Try
-    // again click so the message lands before the OS picker covers
-    // the page. Resolves when the user clicks Try again.
-    function uiWaitForPortRetry() {
-      return new Promise((resolve) => {
-        const btn = document.getElementById("wrong-port-retry");
-        const onClick = () => {
-          btn.removeEventListener("click", onClick);
-          resolve();
-        };
-        btn.addEventListener("click", onClick);
-      });
-    }
-
-    // Symmetric with uiWaitForCreds. Normalisation of the typed value lives
-    // in the orchestrator so the host page stays UI-only. The retry action
-    // is the orchestrator's signal to re-run Improv `initialize()`; while
-    // that's in flight the host re-shows the dialog via showNeedsIpRetrying()
-    // (input + buttons disabled, "Trying Improv again…" status visible).
-    function uiWaitForIp() {
-      return new Promise((resolve) => {
-        const form = document.getElementById("needs-ip-form");
-        const input = document.getElementById("needs-ip-input");
-        const skipBtn = document.getElementById("needs-ip-skip");
-        const retryBtn = document.getElementById("needs-ip-retry");
-
-        const onSubmit = (e) => {
-          e.preventDefault();
-          // Reject whitespace-only input here so the user sees the
-          // browser's built-in validation tooltip on the same field
-          // instead of a silent re-prompt after the orchestrator
-          // discovers an empty normalized URL downstream. `required`
-          // on the input catches empty submits but not "   " — trim
-          // first, then use setCustomValidity to surface the same UI.
-          const trimmed = input.value.trim();
-          if (!trimmed) {
-            input.setCustomValidity("Enter an IP address or hostname.");
-            input.reportValidity();
-            input.setCustomValidity("");  // clear so the next valid submit proceeds
-            return;
-          }
-          cleanup();
-          resolve({ action: "ip", url: trimmed });
-        };
-        const onSkip = () => {
-          cleanup();
-          resolve({ action: "skip" });
-        };
-        const onRetry = () => {
-          cleanup();
-          resolve({ action: "retry" });
-        };
-        const cleanup = () => {
-          form.removeEventListener("submit", onSubmit);
-          skipBtn.removeEventListener("click", onSkip);
-          retryBtn.removeEventListener("click", onRetry);
-        };
-        form.addEventListener("submit", onSubmit);
-        skipBtn.addEventListener("click", onSkip);
-        retryBtn.addEventListener("click", onRetry);
-      });
-    }
-
-    // Toggle the needs-ip dialog into "retry in flight" mode: input + all
-    // three buttons disabled, retry status line visible, input field
-    // cleared so the user starts fresh if retry fails. The orchestrator
-    // calls this before re-running Improv `initialize()`; on completion
-    // (success or failure) it returns to the normal `uiWaitForIp()` call,
-    // which by re-rendering the dialog implicitly re-enables everything.
-    function showNeedsIpRetrying(retrying) {
-      const form = document.getElementById("needs-ip-form");
-      const input = document.getElementById("needs-ip-input");
-      const skipBtn = document.getElementById("needs-ip-skip");
-      const retryBtn = document.getElementById("needs-ip-retry");
-      const addBtn = document.getElementById("needs-ip-add");
-      const status = document.getElementById("needs-ip-retry-status");
-      input.disabled = retrying;
-      skipBtn.disabled = retrying;
-      retryBtn.disabled = retrying;
-      addBtn.disabled = retrying;
-      status.hidden = !retrying;
-      if (retrying) input.value = "";
-    }
-
-    function handleSuccess({ url, mdns, board, applyDefaults = true, defaultsApplied = false, viaHttp, alreadyOnline, ethOnlyNoLink }) {
-      disarmUnloadGuard();
-      // Clear the amber notice styling from any prior install in this session — only the
-      // eth-only-no-link branch re-adds it, so every other outcome shows the plain note.
-      document.getElementById("done-defaults").classList.remove("install-done-note--notice");
-      // Default header: most done outcomes mean the device reported an IP (it's reachable).
-      // The eth-only-no-link branch overrides it (the device isn't online until a cable is in).
-      document.getElementById("done-status").textContent = "Device is online!";
-      // Device-model defaults are applied DURING the install over serial (Improv =
-      // REST over serial — APPLY_OP). The success screen just confirms + links;
-      // the device is already fully configured by the time it shows.
-      if (ethOnlyNoLink) {
-        // Ethernet-only firmware flashed, but no cable was connected so the device isn't
-        // online yet (and this build has no WiFi to provision). Defaults WERE pushed over
-        // serial. Tell the user the one thing they need to do: plug in Ethernet — the device
-        // then comes online on its own and the link appears at its IP / <name>.local.
-        showSection("done");
-        document.getElementById("done-status").textContent = "Flashed — connect Ethernet";
-        document.getElementById("done-url").removeAttribute("href");
-        document.getElementById("done-url").textContent = "";
-        document.getElementById("done-url-mdns").hidden = true;
-        const note = document.getElementById("done-defaults");
-        // The device-model defaults are pushed over SERIAL during install (no network needed), so on
-        // this eth-only path they normally DID apply — report that honestly. The only "next step" is
-        // the network cable. Append a defaults caveat only when the push actually didn't run.
-        const defaultsNote = defaultsApplied
-          ? ` ${board} defaults were applied.`
-          : (board && applyDefaults ? ` ${board} defaults weren't applied — apply them later from MoonDeck.` : "");
-        note.textContent =
-          `Flashed. This is an Ethernet-only firmware — connect a network cable and the device comes online on its own (find it via its IP or <name>.local, or in MoonDeck).${defaultsNote}`;
-        note.classList.add("install-done-note--notice");   // amber: flashed OK, action needed (plug in Ethernet)
-        note.hidden = false;
-        return;
-      }
-      if (!url) {
-        // No device URL (user skipped the IP prompt, or an eth-only/no-Improv device).
-        // On that path no serial config push happened. If a model was picked, say so —
-        // it can be applied later from MoonDeck on the LAN — else just close.
-        if (board && applyDefaults) {
-          showSection("done");
-          document.getElementById("done-url").removeAttribute("href");
-          document.getElementById("done-url").textContent = "";
-          document.getElementById("done-url-mdns").hidden = true;
-          document.getElementById("done-defaults").textContent =
-            `Flashed. ${board} defaults weren't applied (no device address) — apply them later from MoonDeck on your network.`;
-          document.getElementById("done-defaults").hidden = false;
-          return;
-        }
-        closeModal();
-        return;
-      }
-      showSection("done");
-      // Always show the IP link (guaranteed to work). When the boot serial also
-      // reported the device's <deviceName>.local name, show it as a second link —
-      // it survives a DHCP lease change but only resolves where mDNS works.
-      const a = document.getElementById("done-url");
-      a.textContent = url;
-      a.href = url;
-      const aMdns = document.getElementById("done-url-mdns");
-      if (mdns) {
-        const mdnsUrl = `http://${mdns}/`;
-        aMdns.textContent = mdnsUrl;
-        aMdns.href = mdnsUrl;
-        aMdns.hidden = false;
-      } else {
-        aMdns.hidden = true;
-      }
-      // Report the defaults outcome HONESTLY, from `defaultsApplied` (did the serial
-      // push actually run?), not `applyDefaults` (the checkbox intent): applied,
-      // wanted-but-couldn't (model picked + ticked but no push happened — e.g. an
-      // Improv-less path), or kept-config (unticked).
-      const note = document.getElementById("done-defaults");
-      if (defaultsApplied) {
-        note.textContent = `Applied ${board} defaults.`;
-        note.hidden = false;
-      } else if (board && applyDefaults) {
-        note.textContent = `Flashed, but ${board} defaults weren't applied — apply them from MoonDeck on your network.`;
-        note.hidden = false;
-      } else if (board) {
-        note.textContent = `Kept the device's existing config (device defaults not applied).`;
-        note.hidden = false;
-      } else {
-        note.hidden = true;
-      }
-      // Store no board unless the defaults actually applied, so the saved entry doesn't
-      // claim a model the device wasn't configured to.
-      myDevices.addProvisionedDevice(url, defaultsApplied ? board : "");
-    }
-
-    function handleError(stage, error) {
-      disarmUnloadGuard();
-      console.error("[install]", stage, error);
-      showSection("error");
-      document.getElementById("error-message").textContent =
-        `Stage: ${stage}\n${error && error.message ? error.message : error}`;
-    }
-
-    // --- Pre-pick port -------------------------------------------------
-    // Two-option dropdown: the currently-picked port (or a "Pick a port…"
-    // placeholder), and a "Pick another port…" sentinel that opens the
-    // browser's Web Serial picker. We never list multiple previously-
-    // granted ports — Web Serial doesn't expose OS device names, so a list
-    // of "Port 1 / Port 2 / Port 3" is just confusing. The native picker
-    // is the only place where the user can match a port to a physical
-    // device (it shows the OS device name there).
-    //
-    // We also don't pre-select from `navigator.serial.getPorts()` on page
-    // load. A surviving grant is not a guarantee the port is still openable
-    // — if the device re-enumerated (reboot, replug, host sleep), `open()`
-    // fails with "Failed to open serial port" mid-install. Cheaper UX to
-    // always have the user re-pick this session than to chase a confusing
-    // mid-flash error. installer.start() falls back to its own requestPort()
-    // prompt if the user clicks Install without pre-picking.
-    let pickedPort = null;
-    const portSelect = document.getElementById("port-select");
-    const PICK_NEW = "__pick_new__"; // sentinel value for the "pick another" option
-
-    function rebuildPortSelect() {
-      portSelect.replaceChildren();
-      // No-port state: a single "Pick a port…" option. The select-as-button
-      // shape lets the change-event fire when the user re-picks the same
-      // option after cancelling the picker (so the picker can be reopened
-      // without an extra "Pick another" row to collapse to). Browsers fire
-      // `change` when the chosen <option> changes; clicking the lone option
-      // when it's already selected doesn't fire — handled by the click
-      // listener below.
-      if (!pickedPort) {
-        const pickOpt = document.createElement("option");
-        pickOpt.value = PICK_NEW;
-        pickOpt.textContent = "Pick a port…";
-        portSelect.appendChild(pickOpt);
-        portSelect.value = PICK_NEW;
-        return;
-      }
-      // Picked state: "Port selected" + "Pick another port…" sentinel.
-      const currentOpt = document.createElement("option");
-      currentOpt.value = "current";
-      currentOpt.textContent = "Port selected";
-      portSelect.appendChild(currentOpt);
-      const pickOpt = document.createElement("option");
-      pickOpt.value = PICK_NEW;
-      pickOpt.textContent = "Pick another port…";
-      portSelect.appendChild(pickOpt);
-      portSelect.value = "current";
-    }
-
-    // Reflect the port state in the picker's Install gate after every rebuild
-    // (init, post-pick, and any cancel that leaves pickedPort null). Wrapped so
-    // both rebuildPortSelect() exits and all call sites stay covered by one hook.
-    function syncPortState() {
-      rebuildPortSelect();
-      installPicker.notifyPortChanged();
-    }
-
-    syncPortState();
-
-    async function openPortPicker() {
-      let granted = false;
-      try {
-        pickedPort = await navigator.serial.requestPort({});
-        granted = true;
-        // A pending detect() handle is bound to the OLD port — drop it so the
-        // next Detect/Install opens the newly-picked port cleanly.
-        await installer.clearDetected();
-      } catch (_) {
-        // User cancelled the picker — keep whatever was picked before.
-      }
-      syncPortState();
-      // Auto-detect right after a fresh grant — the ESP Web Tools / ESPHome
-      // model where picking the device detects it immediately, so the board
-      // list narrows without a second click. Only on a genuine new grant (not
-      // a dropdown re-select), and non-fatal: runDetect routes any failure to
-      // the status line. Re-detect = pick another port (same path).
-      if (granted) {
-        const status = document.getElementById("detect-status");
-        installPicker.runDetect((text) => { status.textContent = text; });
-      }
-    }
-
-    portSelect.addEventListener("change", () => {
-      if (portSelect.value === PICK_NEW) openPortPicker();
-    });
-    // Mousedown rather than click — `change` won't fire when the only
-    // option (the "Pick a port…" entry in the no-port state) is "re-chosen",
-    // and click on a <select> opens the native list before our handler
-    // runs. Mousedown fires before the list pops up; we preventDefault to
-    // suppress the list and open the Web Serial picker instead. Only
-    // applies in the no-port state — once a port is picked the regular
-    // change-event path handles it.
-    portSelect.addEventListener("mousedown", (e) => {
-      if (!pickedPort) {
-        e.preventDefault();
-        openPortPicker();
-      }
-    });
-
-    // --- Serial monitor -------------------------------------------------
-    // Live read-only viewer of the picked port at 115200 baud. Web Serial
-    // owns the port exclusively, so the monitor mutex'es with the
-    // install/erase flows in both directions (see openModal /
-    // closeModal for the button-disable side, and the closeMonitor
-    // calls in onInstall / the Erase handler for the port-release side).
-    const _monitor = { port: null, reader: null, closing: false };
-    const monitorBackdrop = document.getElementById("monitor-backdrop");
-    const monitorOutput = document.getElementById("monitor-output");
-    const monitorStatus = document.getElementById("monitor-status");
-    const monitorBtn = document.getElementById("monitor-btn");
-
-    function setMonitorStatus(text) { monitorStatus.textContent = text; }
-
-    function appendMonitor(text) {
-      // Autoscroll only when the user is at the bottom — otherwise they're
-      // scrolled up reading something and we shouldn't yank them down.
-      const atBottom = monitorOutput.scrollTop + monitorOutput.clientHeight
-                       >= monitorOutput.scrollHeight - 4;
-      monitorOutput.textContent += text;
-      if (atBottom) monitorOutput.scrollTop = monitorOutput.scrollHeight;
-    }
-
-    async function openMonitor() {
-      if (_monitor.port) return;  // already open (Monitor clicked twice fast)
-      // Browser-support gate: Safari / Firefox have no Web Serial API.
-      // The page-load banner (#browser-warning) already tells the user,
-      // but the Monitor button is still rendered and clickable; without
-      // this guard we'd hit `navigator.serial.requestPort()` and the
-      // resulting TypeError would be swallowed by openPortPicker's
-      // catch, leaving the user with a non-responsive button. Show the
-      // existing banner explicitly so a click here surfaces the cause.
-      if (!("serial" in navigator)) {
-        document.getElementById("browser-warning").style.display = "block";
-        document.getElementById("browser-warning").scrollIntoView({behavior: "smooth"});
-        return;
-      }
-      if (!pickedPort) {
-        // Trigger the port picker; openMonitor was called from a user
-        // gesture (Monitor button click), so requestPort() is allowed.
-        await openPortPicker();
-        if (!pickedPort) return;  // user cancelled
-      }
-      monitorOutput.textContent = "";
-      setMonitorStatus("Opening port at 115200…");
-      monitorBackdrop.classList.add("open");
-      try {
-        await pickedPort.open({ baudRate: 115200 });
-      } catch (e) {
-        // Already-open errors get caught here — the orchestrator opens
-        // the port at flash time; if a prior install left it open we just
-        // proceed (the reader still works on an open port).
-        if (!String(e.message || "").includes("already open")) {
-          setMonitorStatus(`Failed to open: ${e.message || e}`);
-          return;
-        }
-      }
-      _monitor.port = pickedPort;
-      setMonitorStatus("Reading (115200 8N1)…");
-      readLoop().catch(e => {
-        // Read errors land here once — surface and shut down. Don't loop
-        // forever on a dead port.
-        if (!_monitor.closing) setMonitorStatus(`Read error: ${e.message || e}`);
-      });
-    }
-
-    async function readLoop() {
-      const decoder = new TextDecoder("utf-8", { fatal: false });
-      _monitor.reader = _monitor.port.readable.getReader();
-      try {
-        while (true) {
-          const { value, done } = await _monitor.reader.read();
-          if (done) break;
-          if (value && value.length) appendMonitor(decoder.decode(value, { stream: true }));
-        }
-      } finally {
-        try { _monitor.reader.releaseLock(); } catch (_) { /* already released */ }
-        _monitor.reader = null;
-      }
-    }
-
-    async function closeMonitor() {
-      if (_monitor.closing) return;
-      _monitor.closing = true;
-      monitorBackdrop.classList.remove("open");
-      try {
-        if (_monitor.reader) {
-          // cancel() makes the pending read() return {done:true}; the read
-          // loop then exits and releases the lock in its finally.
-          await _monitor.reader.cancel();
-        }
-      } catch (_) { /* ignore */ }
-      try {
-        if (_monitor.port) await _monitor.port.close();
-      } catch (_) { /* ignore */ }
-      _monitor.port = null;
-      _monitor.closing = false;
-    }
-
-    // Pulse RTS low → high to trigger the device's auto-reset circuit
-    // (DTR/RTS combo mirrors what esptool does pre-flash; for a bare
-    // reset, toggling RTS alone is enough on most USB-Serial bridges).
-    // setSignals() requires the port to be open — we are, since the
-    // monitor is running. After the pulse the device reboots and its
-    // boot log starts streaming through the read loop already in place.
-    async function monitorReset() {
-      if (!_monitor.port) return;
-      try {
-        await _monitor.port.setSignals({ dataTerminalReady: false, requestToSend: true });
-        await new Promise(r => setTimeout(r, 100));
-        await _monitor.port.setSignals({ dataTerminalReady: false, requestToSend: false });
-        appendMonitor("\n--- reset ---\n");
-      } catch (e) {
-        setMonitorStatus(`Reset failed: ${e.message || e}`);
-      }
-    }
-
-    monitorBtn.addEventListener("click", openMonitor);
-    document.getElementById("monitor-close").addEventListener("click", closeMonitor);
-    document.getElementById("monitor-clear").addEventListener("click", () => {
-      monitorOutput.textContent = "";
-    });
-    document.getElementById("monitor-reset").addEventListener("click", monitorReset);
-    // Esc closes the monitor (same affordance the install modal has via
-    // closeModal — keeps the two dialogs symmetric).
-    document.addEventListener("keydown", (e) => {
-      if (e.key === "Escape" && monitorBackdrop.classList.contains("open")) {
-        closeMonitor();
-      }
-    });
-
-    // --- Picker wiring -------------------------------------------------
-    const _pickerReady = installPicker.init({
-      container: document.getElementById("picker-mount"),
-      ownFirmwareKey: null,  // web installer flashes any firmware variant
-      installRowExtras: document.getElementById("erase-row"),
-      boardSupport,  // board catalog + chip detection (web-installer-only module)
-      // Gate Install on a picked USB port — the web installer requires the user
-      // to choose the port in the dropdown before flashing. (notifyPortChanged()
-      // below re-evaluates the button whenever pickedPort changes.)
-      hasPort: () => !!pickedPort,
-      onDetect: async () => {
-        // The monitor (if open) holds the port — release it before esptool
-        // claims it, same as the install path. detect() keeps the port open
-        // afterwards so the following Install reuses it.
-        if (_monitor.port) await closeMonitor();
-        return await installer.detect({ port: pickedPort, onLog: appendLog });
-      },
-      onInstall: async (firmware, manifestUrl /*, binaryUrl */) => {
-        // If the monitor is open it holds the port — release it before
-        // esptool tries to claim it. The reverse lock (monitor button
-        // disabled for the install's duration) lives in openModal /
-        // closeModal so the user can't reopen the monitor mid-flash.
-        if (_monitor.port) await closeMonitor();
-        const localUrl = toLocalUrl(manifestUrl);
-        const board = installPicker.getSelectedBoard();
-        const txPower = installPicker.getSelectedBoardTxPower();
-        openModal(board ? `Installing projectMM on ${board}` : `Installing ${firmware}`);
-        showSection("connecting");
-        document.getElementById("connecting-detail").textContent = "";
-        const eraseBefore = document.getElementById("erase-before-flash").checked;
-        // Apply the device-model's catalog defaults (modules + controls) after flashing.
-        // Default-ticked-with-erase (see the change listener below): a clean slate wants
-        // defaults; re-flashing a configured device should NOT silently re-inject (the
-        // catalog's replaceChildren would delete the user's effects). Untick to flash the
-        // firmware while keeping the device's current config. txPower (the brown-out cap)
-        // is a hardware trait, not a "default", so it still applies regardless — only the
-        // module/control inject is gated.
-        const applyDefaults = document.getElementById("apply-device-defaults").checked;
-        // Ethernet-only firmware: WiFi compiled out (firmwares.json `eth_only`). Keyed off the
-        // name like isCompatible's `-eth*` rule — a `-eth` variant is eth-only UNLESS it's the
-        // `-eth-wifi` co-processor build. The orchestrator uses this to skip WiFi provisioning
-        // (the build has no WIFI_SETTINGS RPC) and tell the user to connect Ethernet instead.
-        const ethOnly = /-eth$/.test(firmware);
-        await installer.start({
-          // pickedPort may be null — orchestrator falls back to requestPort.
-          port: pickedPort,
-          manifestUrl: localUrl,
-          board,         // names the install title + identifies the catalog entry
-          applyDefaults, // gates the APPLY_OP config push (not txPower, sent earlier)
-          txPower,
-          eraseBefore,
-          ethOnly,
-          onProgress: handleProgress,
-          uiWaitForCreds,
-          uiWaitForIp,
-          uiShowNeedsIpRetrying: showNeedsIpRetrying,
-          uiWaitForPortRetry,
-          onSuccess: handleSuccess,
-          onError: handleError,
-          onLog: appendLog,
-        });
-      },
-    });
-
-    // Auto-tie "Apply device defaults" to "Erase chip first": ticking erase (a clean
-    // slate) ticks defaults; unticking erase unticks it. The user can still override
-    // either box independently afterwards — the tie only fires on an erase toggle. Both
-    // start unticked (erase's default), so a plain re-flash keeps the device's config.
-    (() => {
-      const eraseBox = document.getElementById("erase-before-flash");
-      const defaultsBox = document.getElementById("apply-device-defaults");
-      if (eraseBox && defaultsBox) {
-        eraseBox.addEventListener("change", () => { defaultsBox.checked = eraseBox.checked; });
-      }
-    })();
-
-    myDevices.init({
-      container: document.getElementById("devices-mount"),
-      onErase: async (device) => {
-        if (!confirm(
-            `Erase ${device.name}? This wipes WiFi credentials and all ` +
-            `module state. You can flash a fresh firmware afterwards.`)) {
-          return;
-        }
-        // Same port-lock concern as install: release the monitor before
-        // esptool tries to claim the port.
-        if (_monitor.port) await closeMonitor();
-        openModal(`Erasing ${device.name}`);
-        showSection("connecting");
-        document.getElementById("connecting-detail").textContent = "";
-        await installer.eraseOnly({
-          port: pickedPort,
-          onProgress: handleProgress,
-          uiWaitForPortRetry,
-          onSuccess: () => {
-            showSection("done");
-            const a = document.getElementById("done-url");
-            a.removeAttribute("href");
-            a.textContent = "Erase complete — flash a fresh firmware to use the device again.";
-            document.getElementById("done-url-mdns").hidden = true;  // no device URL after erase
-            document.getElementById("done-defaults").hidden = true;  // nothing applied on erase
-          },
-          onError: handleError,
-          onLog: appendLog,
-        });
-      },
-    });
-
-    // Show the unsupported-browser banner when Web Serial isn't available.
-    if (!("serial" in navigator)) {
-      document.getElementById("browser-warning").style.display = "block";
-    }
-
-    // --- picture board grid --------------------------------
-    // Renders deviceModels.json as a visual card grid; on select it drives the shared
-    // picker's own (hidden) #rp-board <select> via a dispatched change event, so
-    // the existing release/firmware narrowing + flash flow runs unchanged. The
-    // shared install-picker.js is NOT modified.
-    (async function boardGrid() {
-      let boards = [];
-      try {
-        const res = await fetch("./deviceModels.json");   // same catalog as the picker
-        boards = await res.json();
-      } catch (e) {
-        document.getElementById("board-grid").textContent = "Could not load deviceModels.json: " + e;
-        return;
-      }
-      await _pickerReady;   // ensure the picker has mounted its (hidden) #rp-board
-
-      const gridEl    = document.getElementById("board-grid");
-      const searchEl  = document.getElementById("board-search");
-      const summaryEl = document.getElementById("board-summary");
-      const labelEl   = document.getElementById("board-summary-label");
-      const thumbEl   = document.getElementById("board-summary-thumb");
-      const expandEl  = document.getElementById("board-expand");
-      const clearEl   = document.getElementById("board-clear");
-      let selected = installPicker.getSelectedBoard() || "";   // honour a restored pick
-
-      function ledDriver(b) {
-        const d = (b.modules || []).find(m => /LedDriver$/.test(m.type || ""));
-        return d ? d.type.replace(/Driver$/, "") : null;
-      }
-      // A supported capability is "active" (configured) when deviceModels.json has a module
-      // backing it. The capability→module link is implicit in the data, so this map
-      // names it in one place (bespoke, but it just reads the modules[] already there —
-      // no duplicated `active` field to drift). A capability with no entry here, or no
-      // matching module, stays merely "supported". Each predicate gets the whole module
-      // object so it can inspect controls — needed to tell Ethernet from WiFi: both ride
-      // NetworkModule, but Ethernet is only ACTUALLY wired when the board's NetworkModule
-      // carries an ethType control set to a real PHY (not absent / "None"/0). WiFi is
-      // active wherever NetworkModule exists (the radio is always available); a board
-      // that lists WiFi as supported but ships no NetworkModule entry stays "supported".
-      const ethConfigured = (m) => {
-        const t = m.controls && m.controls.ethType;
-        return t !== undefined && t !== 0 && t !== "0" && t !== "None";
-      };
-      const CAP_MODULE = {
-        LEDs:     m => /LedDriver$/.test(m.type || ""),
-        Ethernet: m => m.type === "NetworkModule" && ethConfigured(m),
-        WiFi:     m => m.type === "NetworkModule",
-        Audio:    m => /^Audio/.test(m.type || ""),
-      };
-      function capActive(b, cap) {
-        const test = CAP_MODULE[cap];
-        return !!test && (b.modules || []).some(m => test(m));
-      }
-      function setExpanded(open) {
-        expandEl.hidden = !open;
-        summaryEl.setAttribute("aria-expanded", open ? "true" : "false");
-        if (open) { searchEl.focus(); }
-      }
-      // Reflect the current pick in the collapsed summary (label + thumbnail).
-      function updateSummary() {
-        const b = boards.find(x => x.name === selected);
-        if (b) {
-          labelEl.textContent = b.name;
-          if (b.image) { thumbEl.hidden = false; thumbEl.style.backgroundImage = `url("${b.image}")`; }
-          else { thumbEl.hidden = true; }
-        } else {
-          labelEl.textContent = "Pick a device";
-          thumbEl.hidden = true;
-        }
-      }
-      function pickBoard(name) {
-        selected = name;
-        // Drive the shared picker's hidden <select>: set value + fire change so
-        // its listener updates state.selectedBoard and re-filters firmware.
-        const rpBoard = document.getElementById("rp-board");
-        if (rpBoard) {
-          // A Detect narrows #rp-board's options to one family. With "show all
-          // boards" the grid can pick a board from ANOTHER family — whose option
-          // isn't in the narrowed list, so `value = name` would silently no-op
-          // (value stays "") and the firmware list wouldn't narrow. Ensure the
-          // option exists first so the assignment takes and selectedBoard is set.
-          if (name && !Array.from(rpBoard.options).some(o => o.value === name)) {
-            const o = document.createElement("option");
-            o.value = name; o.textContent = name;
-            rpBoard.appendChild(o);
-          }
-          rpBoard.value = name;
-          rpBoard.dispatchEvent(new Event("change", { bubbles: true }));
-        }
-        updateSummary();
-        setExpanded(false);   // collapse back to the summary after a pick
-        render();             // keep the grid's selected-card state in sync for next open
-      }
-      // After a Detect, the shared picker narrows its hidden #rp-board <select>
-      // to the matching-family boards (applyDetectedChip → fillBoardOptions). The
-      // grid mirrors that: it shows only boards whose name is a current #rp-board
-      // option. Before any detect, #rp-board holds the FULL catalog (plus the
-      // "(any board)" / "Other…" pass-through, which has no value), so the grid
-      // shows everything — only a detect narrows it. Returns null = no constraint.
-      // `showAll` is the user's escape hatch (the "show all boards" toggle) for a
-      // wrong/unhelpful detection — when set, the filter is bypassed.
-      let showAll = false;
-      function narrowedNames() {
-        const sel = document.getElementById("rp-board");
-        if (!sel) return null;
-        const names = Array.from(sel.options).map(o => o.value).filter(Boolean);
-        // If the option set equals the full catalog, there's no narrowing.
-        return names.length && names.length < boards.length ? new Set(names) : null;
-      }
-      function allowedNames() {
-        return showAll ? null : narrowedNames();
-      }
-      // The detected family label (from the narrowed boards' shared chip), for the
-      // "Detected <family> · show all" notice. null when not narrowed.
-      function detectedFamily() {
-        const allow = narrowedNames();
-        if (!allow) return null;
-        const fams = new Set(boards.filter(b => allow.has(b.name)).map(b => b.chip));
-        return fams.size === 1 ? [...fams][0] : null;
-      }
-      function renderFilterNotice() {
-        const notice = document.getElementById("board-filter-notice");
-        const fam = detectedFamily();
-        if (!fam) { notice.hidden = true; notice.replaceChildren(); return; }
-        notice.hidden = false;
-        notice.replaceChildren();
-        if (showAll) {
-          notice.append(`Showing all boards. `);
-          const a = document.createElement("button");
-          a.textContent = `Filter to detected ${fam}`;
-          a.onclick = () => { showAll = false; render(); };
-          notice.append(a);
-        } else {
-          notice.append(`Detected ${fam}. `);
-          const a = document.createElement("button");
-          a.textContent = "Show all boards";
-          a.title = "Detection wrong, or your board isn't in this family? Show the full catalog.";
-          a.onclick = () => { showAll = true; render(); };
-          notice.append(a);
-        }
-      }
-      function render() {
-        const q = (searchEl.value || "").toLowerCase();
-        const allow = allowedNames();
-        const shown = boards.filter(b =>
-          (!q || b.name.toLowerCase().includes(q)) &&
-          (!allow || allow.has(b.name)));
-        renderFilterNotice();
-        gridEl.replaceChildren();
-        const byChip = {};
-        for (const b of shown) (byChip[b.chip] ||= []).push(b);
-        for (const chip of Object.keys(byChip).sort()) {
-          const lbl = document.createElement("div");
-          lbl.className = "bg-chip-label"; lbl.textContent = chip;
-          gridEl.appendChild(lbl);
-          for (const b of byChip[chip]) gridEl.appendChild(card(b));
-        }
-        if (!shown.length) {
-          const e = document.createElement("p"); e.className = "note"; e.textContent = "No boards match.";
-          gridEl.appendChild(e);
-        }
-      }
-      function card(b) {
-        const el = document.createElement("div");
-        el.className = "bg-card" + (selected === b.name ? " selected" : "");
-        // Keyboard-accessible: a focusable option that picks on Enter/Space, the
-        // same affordance the click handler gives the mouse.
-        el.tabIndex = 0;
-        el.setAttribute("role", "option");
-        el.setAttribute("aria-selected", selected === b.name ? "true" : "false");
-        el.onclick = (ev) => { if (!ev.target.classList.contains("bg-link")) pickBoard(b.name); };
-        el.onkeydown = (ev) => {
-          if (ev.key === "Enter" || ev.key === " ") { ev.preventDefault(); pickBoard(b.name); }
-        };
-        const thumb = document.createElement("div");
-        thumb.className = "bg-thumb" + (b.image ? "" : " noimg");
-        // the deploy stages a copy of deviceModels.json
-        // + the referenced board images alongside this page, so an "image" path of
-        // "assets/boards/<slug>.jpg" resolves same-origin from this page.
-        if (b.image) thumb.style.backgroundImage = `url("${b.image}")`;
-        el.appendChild(thumb);
-        const body = document.createElement("div"); body.className = "bg-body";
-        const nm = document.createElement("div"); nm.className = "bg-name"; nm.textContent = b.name; body.appendChild(nm);
-        const meta = document.createElement("div"); meta.className = "bg-meta";
-        meta.textContent = b.chip + (ledDriver(b) ? " · " + ledDriver(b) : "");
-        body.appendChild(meta);
-        // Capability chips, three states by colour (not text): green = active
-        // (supported AND a module configured in deviceModels.json), yellow = supported
-        // (firmware supports it, not pre-configured), orange = planned (no module
-        // yet — the backlog seed). All chips are shown (labels kept short in
-        // deviceModels.json so they fit the card).
-        const caps = [
-          ...(Array.isArray(b.supported) ? b.supported.map(c =>
-            capActive(b, c) ? { c, cls: "act", label: "active" }
-                            : { c, cls: "sup", label: "supported" }) : []),
-          ...(Array.isArray(b.planned) ? b.planned.map(c => ({ c, cls: "plan", label: "planned" })) : []),
-        ];
-        if (caps.length) {
-          const capsEl = document.createElement("div"); capsEl.className = "bg-caps";
-          for (const { c, cls, label } of caps) {
-            const chip = document.createElement("span");
-            chip.className = "bg-cap " + cls;
-            chip.textContent = c;   // colour conveys active / supported / planned
-            chip.title = c + " — " + label;
-            capsEl.appendChild(chip);
-          }
-          body.appendChild(capsEl);
-        }
-        if (b.url) {
-          const a = document.createElement("a"); a.className = "bg-link"; a.href = b.url;
-          a.target = "_blank"; a.rel = "noopener"; a.textContent = "product page ↗"; body.appendChild(a);
-        }
-        // "details" opens the full deviceModels.json entry in a popup. It carries the
-        // bg-link class so the card's onclick treats it as a non-select region
-        // (same guard the product-page link relies on).
-        const det = document.createElement("a");
-        det.className = "bg-link bg-details"; det.textContent = "details ⓘ";
-        det.setAttribute("role", "button"); det.tabIndex = 0;
-        det.onclick = (ev) => { ev.stopPropagation(); showBoardDetails(b); };
-        det.onkeydown = (ev) => {
-          if (ev.key === "Enter" || ev.key === " ") { ev.preventDefault(); ev.stopPropagation(); showBoardDetails(b); }
-        };
-        body.appendChild(det);
-        el.appendChild(body);
-        return el;
-      }
-      // Fill + open the board-details popup from a deviceModels.json entry: a readable
-      // summary (chip, firmwares, capabilities, modules + their controls) plus a
-      // collapsible raw-JSON block for the exact entry. Built with DOM nodes (not
-      // innerHTML) so board-supplied strings can't inject markup.
-      function showBoardDetails(b) {
-        const dlg = document.getElementById("board-details");
-        document.getElementById("bd-title").textContent = b.name || "Device";
-        const body = document.getElementById("bd-body");
-        body.replaceChildren();
-        const row = (key, val) => {
-          const r = document.createElement("div"); r.className = "bd-row";
-          const k = document.createElement("span"); k.className = "bd-key"; k.textContent = key;
-          const v = document.createElement("span"); v.className = "bd-val"; v.textContent = val;
-          r.append(k, v); body.appendChild(r);
-        };
-        // Same shape as row(), but the value is a clickable link. href + textContent
-        // only (no innerHTML), so a board-supplied URL can't inject markup. Opens in
-        // a new tab; only http(s) links are made clickable (else fall back to text).
-        const rowLink = (key, url) => {
-          const r = document.createElement("div"); r.className = "bd-row";
-          const k = document.createElement("span"); k.className = "bd-key"; k.textContent = key;
-          const v = document.createElement("span"); v.className = "bd-val";
-          const a = document.createElement("a");
-          a.href = url; a.target = "_blank"; a.rel = "noopener"; a.textContent = url;
-          v.appendChild(a); r.append(k, v); body.appendChild(r);
-        };
-        if (b.chip) row("Chip", b.chip);
-        if (Array.isArray(b.firmwares)) row("Firmwares", b.firmwares.join(", "));
-        if (Array.isArray(b.supported) && b.supported.length) row("Supported", b.supported.join(", "));
-        if (Array.isArray(b.planned) && b.planned.length) row("Planned", b.planned.join(", "));
-        if (b.url) {
-          if (/^https?:\/\//.test(b.url)) rowLink("Product page", b.url);
-          else row("Product page", b.url);
-        }
-
-        if (Array.isArray(b.modules) && b.modules.length) {
-          const h = document.createElement("div"); h.className = "bd-section"; h.textContent = "Modules";
-          body.appendChild(h);
-          for (const m of b.modules) {
-            const mod = document.createElement("div"); mod.className = "bd-mod";
-            const nm = document.createElement("div"); nm.className = "bd-mod-name";
-            nm.textContent = m.type || "?";
-            if (m.id && m.id !== m.type) {
-              const idEl = document.createElement("span"); idEl.className = "bd-mod-id";
-              idEl.textContent = "  (" + m.id + ")"; nm.appendChild(idEl);
-            }
-            mod.appendChild(nm);
-            const ctrls = m.controls && typeof m.controls === "object" ? m.controls : null;
-            if (ctrls) {
-              for (const [k, v] of Object.entries(ctrls)) {
-                const c = document.createElement("div"); c.className = "bd-ctrl";
-                const code = document.createElement("code"); code.textContent = k + " = " + v;
-                c.appendChild(code); mod.appendChild(c);
-              }
-            }
-            body.appendChild(mod);
-          }
-        }
-
-        // Collapsible raw JSON — the exact entry, for developers.
-        const raw = document.createElement("details"); raw.className = "bd-raw";
-        const sum = document.createElement("summary"); sum.textContent = "Raw JSON";
-        const pre = document.createElement("pre"); pre.textContent = JSON.stringify(b, null, 2);
-        raw.append(sum, pre); body.appendChild(raw);
-
-        dlg.showModal();
-      }
-      searchEl.oninput = render;
-      summaryEl.addEventListener("click", () => setExpanded(expandEl.hidden));
-      clearEl.addEventListener("click", () => pickBoard(""));   // generic / no board
-
-      // Re-render when a Detect narrows the picker: applyDetectedChip swaps out
-      // #rp-board's <option>s, so observe its child list. The grid then filters
-      // to the detected family (allowedNames), and updateSummary picks up any
-      // auto-selected single match.
-      const rpBoard = document.getElementById("rp-board");
-      if (rpBoard) {
-        new MutationObserver(() => {
-          showAll = false;   // a fresh detect is a new context — re-apply the filter
-          // Take the picker's value verbatim — an empty string means it cleared the
-          // selection (detected family with multiple matches → generic mode), and
-          // `|| selected` would wrongly keep the stale board in the summary.
-          selected = installPicker.getSelectedBoard();
-          updateSummary();
-          render();
-        }).observe(rpBoard, { childList: true });
-      }
-
-      updateSummary();   // reflect any restored pick in the collapsed summary
-      render();
-    })();
-  </script>
+  <script type="module" src="./install.js"></script>
 </body>
 </html>
diff --git a/docs/install/install.css b/docs/install/install.css
new file mode 100644
index 0000000..2ca8067
--- /dev/null
+++ b/docs/install/install.css
@@ -0,0 +1,472 @@
+/* projectMM web installer styles. Extracted from index.html — a static GitHub Pages
+   page (not embedded like the device UI), so an external stylesheet is free. */
+    :root {
+      --bg:     #1a1a2e;
+      --card:   #16213e;
+      --fg:     #e0e0e0;
+      --muted:  #a0a0b0;
+      --accent: #a78bfa;
+      --border: #2a3a6a;
+      --ok:     #57c97a;   /* green  — "active" capability (supported + a module configured in deviceModels.json) */
+      --sup:    #e3c84a;   /* yellow — "supported" capability (firmware supports it, not pre-configured) */
+      --plan:   #e8923a;   /* orange — "planned" capability (no module yet; greener than red, by design) */
+    }
+    * { box-sizing: border-box; }
+    body {
+      margin: 0;
+      min-height: 100vh;
+      background: var(--bg);
+      color: var(--fg);
+      font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
+      font-size: 15px;
+      line-height: 1.55;
+      display: flex;
+      flex-direction: column;
+      align-items: center;
+      padding: 24px 16px 64px;
+    }
+    main { width: 100%; max-width: 640px; }
+    .help-link {
+      display: inline-block;
+      margin-left: 8px;
+      width: 22px; height: 22px; line-height: 22px;
+      text-align: center;
+      font-size: 14px; font-weight: 600;
+      vertical-align: middle;
+      color: var(--accent);
+      border: 1px solid var(--border);
+      border-radius: 50%;
+      text-decoration: none;
+    }
+    .help-link:hover { border-color: var(--accent); }
+    .version-chip {
+      display: inline-block;
+      margin-left: 8px;
+      padding: 2px 8px;
+      background: var(--card);
+      color: var(--muted);
+      border: 1px solid var(--border);
+      border-radius: 4px;
+      font-size: 13px;
+      font-weight: normal;
+      vertical-align: middle;
+    }
+    h1 {
+      margin: 0 0 8px;
+      font-size: 28px;
+      color: var(--accent);
+    }
+    p.tag { margin: 0 0 24px; color: var(--muted); }
+    .card {
+      background: var(--card);
+      border: 1px solid var(--border);
+      border-radius: 8px;
+      padding: 20px;
+      margin-bottom: 16px;
+    }
+    label { display: block; font-weight: 600; margin-bottom: 6px; }
+    select {
+      width: 100%;
+      padding: 10px 12px;
+      background: var(--bg);
+      color: var(--fg);
+      border: 1px solid var(--border);
+      border-radius: 6px;
+      font: inherit;
+    }
+    .button-row { margin-top: 16px; }
+    .note { color: var(--muted); font-size: 13px; margin-top: 10px; }
+    /* `.windows-only` elements are `hidden` by default in the HTML; the tiny
+       userAgent check at the top of index.html's <body> removes `hidden` only on
+       Windows. Inverse to a CSS-only approach because CSS can't detect the
+       host OS — `[hidden]` already wins specificity-wise. */
+    .erase-row { margin-top: 12px; font-size: 13px; }
+    .erase-row label { cursor: pointer; }
+    .erase-row input { vertical-align: middle; margin-right: 6px; }
+    .erase-note { display: inline; margin-top: 0; }
+    a { color: var(--accent); }
+    code {
+      background: rgba(255,255,255,0.06);
+      padding: 1px 6px;
+      border-radius: 3px;
+      font-size: 13px;
+    }
+    .browser-warning {
+      background: #3a2a1a;
+      border: 1px solid #6a4a2a;
+      color: #e6c890;
+      display: none;
+    }
+    ol { padding-left: 22px; }
+    ol li { margin-bottom: 6px; }
+    .credits {
+      max-width: 720px;
+      margin: 32px auto 24px;
+      padding: 0 16px;
+      text-align: center;
+      border-top: 1px solid var(--border);
+      padding-top: 16px;
+    }
+    .credits .note { margin-top: 0; }
+
+    /* Minimal mirror of the device UI's control-row shape so the shared
+       install-picker module (src/ui/install-picker.js) renders the same
+       way on the installer page. The picker emits `.control-row` + child
+       `<select>` markup; without these rules the rows wouldn't lay out. */
+    .control-row {
+      display: flex;
+      align-items: center;
+      gap: 12px;
+      margin: 10px 0;
+    }
+    .control-label {
+      flex: 0 0 80px;
+      font-weight: 600;
+      color: var(--muted);
+    }
+    .control-row select { flex: 1; }
+
+    /* the shared picker still renders its own board <select>
+       (#rp-board) — we keep it (so its change-listener wires) but hide its row;
+       the picture grid above drives it. The row is the .control-row that
+       contains #rp-board. */
+    .control-row:has(#rp-board) { display: none; }
+
+    /* Picture board grid — collapsed by default (a control-row field), expands
+       on click. The summary button is the row's field, so it flexes like the
+       selects (flex: 1) to line up with USB Port / Release / Firmware. */
+    #board-summary {
+      flex: 1; display: flex; align-items: center; justify-content: space-between;
+      gap: 12px; padding: 10px 12px; background: var(--bg); color: var(--fg);
+      border: 1px solid var(--border); border-radius: 6px; font: inherit;
+      cursor: pointer; text-align: left;
+    }
+    #board-summary:hover { border-color: var(--accent); }
+    .board-summary-left { display: flex; align-items: center; gap: 10px; min-width: 0; }
+    .board-summary-thumb {
+      width: 36px; height: 24px; border-radius: 3px; flex-shrink: 0;
+      background: #0e1020 center/contain no-repeat; border: 1px solid var(--border);
+    }
+    #board-summary-label { overflow: hidden; text-overflow: ellipsis; white-space: nowrap; }
+    .board-summary-caret { color: var(--muted); transition: transform .15s; flex-shrink: 0; }
+    #board-summary[aria-expanded="true"] .board-summary-caret { transform: rotate(180deg); }
+    /* The expanded grid breaks out full-width below the row (aligns with the
+       field column by offsetting the label width + gap). */
+    #board-expand { margin: 0 0 10px 92px; }
+    .board-grid-controls { display: flex; align-items: center; gap: 12px; margin-bottom: 12px; flex-wrap: wrap; }
+    #board-search {
+      flex: 1; min-width: 160px; padding: 8px 10px; background: var(--bg);
+      color: var(--fg); border: 1px solid var(--border); border-radius: 6px; font: inherit;
+    }
+    .board-clear {
+      background: transparent; color: var(--muted); border: 1px solid var(--border);
+      border-radius: 6px; padding: 8px 12px; font: inherit; font-size: 13px; cursor: pointer;
+    }
+    .board-clear:hover { color: var(--fg); border-color: var(--accent); }
+    .board-filter-notice { color: var(--muted); font-size: 12px; margin-bottom: 10px; }
+    .board-filter-notice button {
+      background: none; border: none; color: var(--accent); font: inherit; font-size: 12px;
+      cursor: pointer; padding: 0; text-decoration: underline;
+    }
+    #board-grid { max-height: 420px; overflow-y: auto; }   /* expanded grid scrolls, not the page */
+    #board-grid {
+      display: grid; grid-template-columns: repeat(auto-fill, minmax(150px, 1fr)); gap: 10px;
+    }
+    .bg-chip-label {
+      grid-column: 1 / -1; color: var(--muted); font-size: 11px; text-transform: uppercase;
+      letter-spacing: .06em; margin: 6px 0 0;
+    }
+    .bg-card {
+      background: var(--bg); border: 1px solid var(--border); border-radius: 8px;
+      overflow: hidden; cursor: pointer; transition: border-color .12s, background .12s;
+      display: flex; flex-direction: column;
+    }
+    .bg-card:hover { border-color: var(--accent); }
+    .bg-card.selected { border-color: var(--accent); box-shadow: 0 0 0 1px var(--accent) inset; }
+    .bg-thumb {
+      aspect-ratio: 16 / 10; background: #0e1020 center/contain no-repeat;
+      display: flex; align-items: center; justify-content: center;
+      color: var(--muted); font-size: 10px; border-bottom: 1px solid var(--border);
+    }
+    .bg-thumb.noimg::after { content: "no photo"; }
+    .bg-body { padding: 8px 9px; display: flex; flex-direction: column; gap: 3px; }
+    .bg-name { font-weight: 600; font-size: 12px; line-height: 1.2; }
+    .bg-meta { color: var(--muted); font-size: 11px; }
+    /* Capability chips: active (green), supported (yellow) or planned (orange) —
+       distinguished by colour, not by extra text. Labels are kept short in
+       deviceModels.json so every chip fits the ~150px card; the full label + state
+       is in the chip's title tooltip. */
+    .bg-caps { display: flex; flex-wrap: wrap; gap: 3px; margin-top: 3px; }
+    .bg-cap {
+      font-size: 9px; line-height: 1.5; padding: 0 5px; border-radius: 999px;
+      max-width: 100%; overflow: hidden; text-overflow: ellipsis; white-space: nowrap;
+    }
+    .bg-cap.act { background: color-mix(in srgb, var(--ok) 18%, transparent); color: var(--ok); }
+    .bg-cap.sup { background: color-mix(in srgb, var(--sup) 20%, transparent); color: var(--sup); }
+    .bg-cap.plan { background: color-mix(in srgb, var(--plan) 20%, transparent); color: var(--plan); }
+    .bg-link { color: var(--accent); font-size: 11px; text-decoration: none; }
+    .bg-link:hover { text-decoration: underline; }
+
+    /* Board-details popup — native <dialog> (standard modal pattern: built-in
+       backdrop, ESC-to-close, focus trap; no bespoke modal JS). Shows the full
+       deviceModels.json entry as a readable summary plus a collapsible raw-JSON block. */
+    #board-details::backdrop { background: rgba(0,0,0,0.6); }
+    #board-details {
+      background: var(--card); color: var(--fg);
+      border: 1px solid var(--border); border-radius: 10px;
+      /* No padding on the dialog itself — .bd-head / .bd-body supply it. */
+      padding: 0; max-width: 560px; width: calc(100% - 32px);
+      /* Cap the height and scroll inside the dialog for long entries. */
+      max-height: 80vh; overflow: auto;
+    }
+    /* Header row: title on the left, close button on the right. */
+    .bd-head {
+      display: flex; align-items: baseline; justify-content: space-between;
+      gap: 12px; padding: 16px 18px 8px;
+    }
+    .bd-title { font-size: 16px; font-weight: 600; }
+    /* Chrome-less close button; only its colour changes on hover. */
+    .bd-close {
+      background: none; border: none; color: var(--muted);
+      font-size: 20px; line-height: 1; cursor: pointer; padding: 0 4px;
+    }
+    .bd-close:hover { color: var(--fg); }
+    .bd-body { padding: 0 18px 18px; }
+    /* Key/value summary rows: fixed-minimum key column, flexible value column. */
+    .bd-row { display: flex; gap: 8px; padding: 3px 0; font-size: 13px; }
+    .bd-key { color: var(--muted); min-width: 92px; }
+    /* min-width: 0 lets the flex item shrink below its content width, so a long
+       unbroken value wraps (overflow-wrap: anywhere) instead of overflowing. */
+    .bd-val { flex: 1; min-width: 0; overflow-wrap: anywhere; }
+    .bd-section { margin-top: 14px; font-weight: 600; font-size: 13px; }
+    /* Per-module group, set off by a left rule. */
+    .bd-mod { margin-top: 8px; padding-left: 10px; border-left: 2px solid var(--border); }
+    .bd-mod-name { font-size: 13px; }
+    .bd-mod-name .bd-mod-id { color: var(--muted); font-weight: normal; }
+    .bd-ctrl { font-size: 12px; color: var(--muted); padding-left: 8px; }
+    .bd-ctrl code { font-size: 11px; }
+    /* Collapsible raw-JSON block. */
+    .bd-raw { margin-top: 16px; }
+    .bd-raw summary { cursor: pointer; color: var(--accent); font-size: 12px; }
+    /* white-space: pre keeps the JSON layout; long lines scroll rather than wrap. */
+    .bd-raw pre {
+      margin: 8px 0 0; padding: 10px; background: var(--bg);
+      border: 1px solid var(--border); border-radius: 6px;
+      font-size: 11px; overflow: auto; white-space: pre;
+    }
+    /* NOTE(review): presumably the details link has no href, hence the explicit
+       pointer cursor — confirm against the markup. */
+    .bg-link.bg-details { cursor: pointer; }
+
+    /* Primary action button: accent fill; dimmed with a not-allowed cursor
+       while disabled. */
+    .action-btn {
+      background: var(--accent);
+      color: var(--bg);
+      border: none;
+      border-radius: 6px;
+      padding: 10px 20px;
+      font: inherit;
+      font-weight: 600;
+      cursor: pointer;
+    }
+    .action-btn:disabled { opacity: 0.5; cursor: not-allowed; }
+    .rp-status { color: var(--muted); font-size: 13px; }
+    /* NOTE(review): the min-height presumably reserves a line so the layout
+       doesn't jump when status text appears — confirm. */
+    .rp-status-row { min-height: 1.5em; }
+
+    /* Inline spinner shown in a field while its data is still being fetched
+       (install-picker renderSkeleton). A 1em spinning ring, sized to sit next
+       to the select's "Loading…" placeholder. */
+    .rp-spinner {
+      display: inline-block;
+      width: 1em; height: 1em;
+      vertical-align: -0.15em;
+      margin-right: 0.4em;
+      border: 2px solid var(--muted);
+      /* The transparent top edge leaves a gap in the ring, which is what makes
+         the rotation visible. */
+      border-top-color: transparent;
+      border-radius: 50%;
+      animation: rp-spin 0.7s linear infinite;
+    }
+    @keyframes rp-spin { to { transform: rotate(360deg); } }
+
+    /* "Your devices" card — one row per provisioned device. The row
+       is the picker's `.control-row` flex shape with the device info
+       on the left and action buttons on the right. */
+    .device-row {
+      justify-content: space-between;
+      padding: 8px 0;
+      border-top: 1px solid rgba(255,255,255,0.06);
+    }
+    /* No separator line above the first row. */
+    .device-row:first-child { border-top: 0; }
+    /* min-width: 0 lets this flex item shrink, so the ellipsis truncation on
+       .device-url can take effect instead of the row overflowing. */
+    .device-info { min-width: 0; flex: 1; }
+    /* Device address link: monospace, single line, truncated with an ellipsis. */
+    .device-url {
+      display: block;
+      font-family: ui-monospace, monospace;
+      color: var(--muted);
+      font-size: 12px;
+      text-decoration: none;
+      overflow: hidden;
+      text-overflow: ellipsis;
+      white-space: nowrap;
+    }
+    .device-url:hover { color: var(--accent); text-decoration: underline; }
+    .device-seen { color: var(--muted); font-size: 12px; margin-top: 2px; }
+    /* Button group keeps its natural width; only .device-info flexes. */
+    .device-actions { display: flex; gap: 6px; flex-shrink: 0; }
+    /* Outline-style secondary button in the accent colour. */
+    .device-btn {
+      background: transparent;
+      color: var(--accent);
+      border: 1px solid var(--accent);
+      border-radius: 4px;
+      padding: 4px 10px;
+      font: inherit;
+      font-size: 12px;
+      cursor: pointer;
+    }
+    .device-model-name { color: var(--fg); font-size: 12px; margin-top: 2px; }
+    /* NOTE(review): the hard-coded rgba looks like the accent colour at 8%
+       opacity — confirm it matches var(--accent). */
+    .device-btn:hover { background: rgba(123, 158, 255, 0.08); }
+
+    /* Install modal — backdrop + centered card. Replaces the ESP Web Tools
+       <esp-web-install-button> shadow-DOM dialog. Sections show one at a
+       time via .install-section.active. */
+    .install-backdrop {
+      position: fixed; inset: 0;
+      background: rgba(0, 0, 0, 0.65);
+      /* Hidden until .open switches it to a centering flex container. */
+      display: none;
+      align-items: center;
+      justify-content: center;
+      z-index: 1000;
+    }
+    .install-backdrop.open { display: flex; }
+    .install-modal {
+      background: var(--card);
+      border: 1px solid var(--border);
+      border-radius: 8px;
+      padding: 24px;
+      max-width: 480px;
+      width: calc(100% - 32px);
+      /* Keep the card inside the viewport and scroll its contents when they
+         are taller than the window (expanded log, long error text). Without
+         this the fixed, centred backdrop clips the overflow with no way to
+         reach it. Same 32px total margin as the width rule above. */
+      max-height: calc(100vh - 32px);
+      overflow-y: auto;
+      box-shadow: 0 8px 32px rgba(0, 0, 0, 0.5);
+    }
+    .install-modal h2 {
+      margin: 0 0 16px;
+      font-size: 20px;
+      color: var(--accent);
+    }
+    /* Only the section carrying .active is displayed. */
+    .install-section { display: none; }
+    .install-section.active { display: block; }
+    .install-status { margin: 8px 0; color: var(--muted); }
+    .install-done-note { margin: 4px 0 10px; font-size: 13px; color: var(--muted); }
+    /* Notice variant — for a flashed-OK-but-action-needed outcome (e.g. eth-only firmware
+       waiting on a cable). Amber, like the "supported" capability chip (var(--sup)): reads as
+       "do this next", not a plain note and not a red error. */
+    .install-done-note.install-done-note--notice {
+      color: var(--sup);
+      background: color-mix(in srgb, var(--sup) 12%, transparent);
+      border-left: 3px solid var(--sup);
+      padding: 8px 10px; border-radius: 4px;
+    }
+    .install-warn { color: #d4a052; font-size: 12px; margin-top: 8px; }
+    /* Progress track; overflow: hidden clips the bar to the rounded corners. */
+    .install-progress {
+      height: 8px;
+      background: var(--bg);
+      border-radius: 4px;
+      overflow: hidden;
+      margin: 12px 0;
+    }
+    /* Determinate bar: the width is set inline by script and eased by the
+       transition. */
+    .install-progress-bar {
+      height: 100%;
+      background: var(--accent);
+      width: 0;
+      transition: width 0.2s;
+    }
+    /* Indeterminate state — esptool-js's eraseFlash() doesn't report
+       progress (12 s of "wait and hope"), so we animate a marquee-style
+       bar to confirm the page hasn't hung. Toggled by adding the
+       .indeterminate class to .install-progress-bar; width set to 100%
+       so the animation has something to clip. */
+    .install-progress-bar.indeterminate {
+      width: 100%;
+      background: linear-gradient(
+        90deg,
+        var(--bg) 0%,
+        var(--accent) 40%,
+        var(--accent) 60%,
+        var(--bg) 100%);
+      /* Gradient is twice the bar's width so sliding it sweeps the accent band across. */
+      background-size: 200% 100%;
+      animation: install-marquee 1.4s linear infinite;
+      /* No width easing while indeterminate. */
+      transition: none;
+    }
+    @keyframes install-marquee {
+      from { background-position: 100% 0; }
+      to   { background-position: -100% 0; }
+    }
+    /* Form fields inside the install modal (WiFi credentials, IP entry). */
+    .install-form label {
+      display: block;
+      margin: 12px 0 4px;
+      font-size: 13px;
+      color: var(--muted);
+    }
+    .install-form input[type="text"],
+    .install-form input[type="password"] {
+      width: 100%;
+      padding: 8px 12px;
+      background: var(--bg);
+      color: var(--fg);
+      border: 1px solid var(--border);
+      border-radius: 6px;
+      font: inherit;
+    }
+    /* Button row, right-aligned. */
+    .install-actions {
+      display: flex;
+      gap: 8px;
+      justify-content: flex-end;
+      margin-top: 16px;
+    }
+    .install-actions button {
+      padding: 8px 16px;
+      font: inherit;
+      font-weight: 600;
+      border: 0;
+      border-radius: 6px;
+      cursor: pointer;
+    }
+    /* Primary = accent fill; secondary = outlined, transparent background. */
+    .install-actions button.primary {
+      background: var(--accent);
+      color: #1a1a2e;
+    }
+    .install-actions button.secondary {
+      background: transparent;
+      color: var(--fg);
+      border: 1px solid var(--border);
+    }
+    /* Error text: keeps the message's own line breaks (pre-wrap) and breaks
+       long unbroken tokens so it never overflows the card. */
+    .install-error {
+      color: #f8a5a5;
+      font-size: 13px;
+      margin: 12px 0;
+      white-space: pre-wrap;
+      overflow-wrap: anywhere;
+    }
+    .install-success-url {
+      display: block;  /* IP and <name>.local each on their own line */
+      /* Shrink the block to its text so the clickable/hover area matches the link. */
+      width: fit-content;
+      margin-top: 8px;
+      color: var(--accent);
+      text-decoration: none;
+      font-family: ui-monospace, monospace;
+    }
+    .install-success-url:hover { text-decoration: underline; }
+    /* Collapsible log area, separated from the active section by a rule. */
+    .install-log-wrap {
+      margin-top: 16px;
+      border-top: 1px solid var(--border);
+      padding-top: 12px;
+    }
+    /* Link-styled toggle button (no button chrome). */
+    .install-log-toggle {
+      background: transparent;
+      color: var(--muted);
+      border: 0;
+      padding: 0;
+      cursor: pointer;
+      font: inherit;
+      font-size: 12px;
+      text-decoration: underline;
+    }
+    .install-log-toggle:hover { color: var(--fg); }
+    /* Log output: fixed maximum height with its own scrollbar; lines wrap and
+       may break mid-token. */
+    .install-log {
+      margin-top: 8px;
+      max-height: 240px;
+      overflow: auto;
+      background: var(--bg);
+      color: var(--muted);
+      font-family: ui-monospace, monospace;
+      font-size: 11px;
+      padding: 8px;
+      border: 1px solid var(--border);
+      border-radius: 4px;
+      white-space: pre-wrap;
+      word-break: break-all;
+    }
diff --git a/docs/install/install.js b/docs/install/install.js
new file mode 100644
index 0000000..1e81c1c
--- /dev/null
+++ b/docs/install/install.js
@@ -0,0 +1,1228 @@
+// projectMM web installer logic. Extracted from index.html's inline module script.
+// A static GitHub Pages page, so an external module is free.
+
+// Shared install-picker (release → board → firmware). Same file as the
+// on-device OTA UI uses; only the onInstall callback differs:
+//   - Device UI: POST the chosen .bin URL to /api/firmware/url; device
+//     fetches the binary directly via esp_https_ota.
+//   - Web installer (here): hand the manifest URL to the orchestrator,
+//     which flashes via esptool-js then provisions WiFi via Improv,
+//     all over the same SerialPort.
+//
+// Manifests + binaries must be same-origin with this page (Web Serial
+// would happily flash from any URL, but the manifest fetch + part
+// downloads via fetch() are subject to CORS). The release workflow
+// self-hosts the last N releases into pages/install/releases/<tag>/.
+// toLocalUrl rewrites the picker's absolute GitHub URLs to the local
+// copies before handing them to the orchestrator.
+import { installPicker } from "./install-picker.js";
+import { myDevices }    from "./devices.js";
+import { installer }    from "./install-orchestrator.js";
+// Board catalog + chip detection — web-installer only, kept out of the
+// firmware-embedded install-picker.js and injected here via boardSupport.
+import * as boardSupport from "./install-picker-boards.js";
+
+// Windows-only hints (was a separate inline <script> in <head>): reveal .windows-only
+// rows when the UA is Windows.
+document.addEventListener('DOMContentLoaded', () => {
+  if (/Windows/i.test(navigator.userAgent)) {
+    document.querySelectorAll('.windows-only').forEach(el => el.hidden = false);
+  }
+});
+
+
+    // Show the project version next to the heading. library.json ships
+    // alongside index.html (preview_installer.py + release.yml both copy
+    // it). Fetch silently — if it's missing for any reason, leave the
+    // chip hidden rather than rendering "?" noise.
+    (async () => {
+        try {
+            const res = await fetch("./library.json");
+            if (!res.ok) return;
+            const lib = await res.json();
+            if (!lib || !lib.version) return;
+            const chip = document.getElementById("version-chip");
+            chip.textContent = `v${lib.version}`;
+            chip.hidden = false;
+        } catch (_) { /* silent: cosmetic-only */ }
+    })();
+
+    // Map a GitHub release-asset URL to its Pages-hosted mirror.
+    //   https://github.com/MoonModules/projectMM/releases/download/<TAG>/<file>
+    //   → ./releases/<TAG>/<file>
+    function toLocalUrl(githubUrl) {
+      const m = /\/releases\/download\/([^/]+)\/([^/]+)$/.exec(githubUrl);
+      if (!m) return githubUrl;  // unrecognised shape: pass through unchanged
+      const [, tag, name] = m;
+      //   https://github.com/.../releases/download/<TAG>/<file>
+      //   → ./releases/<TAG>/<file>  (same-origin, served from this dir)
+      return `./releases/${tag}/${name}`;
+    }
+
+    // --- Install modal section toggling ---------------------------------
+    const backdrop = document.getElementById("install-backdrop");
+    const title = document.getElementById("install-title");
+    const sections = {
+      connecting:   document.getElementById("section-connecting"),
+      wrongPort:    document.getElementById("section-wrong-port"),
+      flashing:     document.getElementById("section-flashing"),
+      wifiForm:     document.getElementById("section-wifi-form"),
+      provisioning: document.getElementById("section-provisioning"),
+      needsIp:      document.getElementById("section-needs-ip"),
+      done:         document.getElementById("section-done"),
+      error:        document.getElementById("section-error"),
+    };
+    function showSection(name) {
+      for (const [k, el] of Object.entries(sections)) {
+        el.classList.toggle("active", k === name);
+      }
+    }
+    function openModal(titleText) {
+      title.textContent = titleText;
+      backdrop.classList.add("open");
+      // Reset the log per install session so users see only the current run.
+      document.getElementById("install-log").textContent = "";
+      // Reset toggle to collapsed state.
+      const log = document.getElementById("install-log");
+      const toggle = document.getElementById("log-toggle");
+      log.hidden = true;
+      toggle.textContent = "Show log";
+      // Reset the needs-ip dialog to its idle state — covers the case where
+      // a prior install ended in retry-success (which leaves the disabled +
+      // spinner state intact, since the WiFi-creds form took over the
+      // visible card) and the next install hits the needs-ip path again.
+      showNeedsIpRetrying(false);
+      // Lock out the monitor button while an install runs. Web Serial
+      // grants exclusive port access; a Monitor click mid-flash would
+      // race the install for the SerialPort and either steal it
+      // (corrupting the flash) or get a misleading "already open" error.
+      // closeModal re-enables.
+      monitorBtn.disabled = true;
+      // Guard against accidental tab-close mid-flash. Browser shows a
+      // generic "leave site?" prompt (Chrome ignores the custom text since
+      // 2017 — security hardening). disarmUnloadGuard() runs on done /
+      // error / cancel so the user can close the page when it's safe.
+      armUnloadGuard();
+    }
+    function closeModal() {
+      backdrop.classList.remove("open");
+      disarmUnloadGuard();
+      monitorBtn.disabled = false;
+      // Wipe the password field on every modal close — success, cancel,
+      // or error. The form is built lazily and re-used across installs in
+      // the same page session; without this the typed password lingers
+      // in the live `.value`. (We don't clear `defaultValue` — it stayed
+      // as the form's initial empty string from buildWifiForm's innerHTML
+      // assignment; setting `.value` clears the rendered value, which is
+      // the only thing visible to a script reading the DOM after close.)
+      // Same wipe runs at the start of each `wifi-creds-form` show, but
+      // having both belts ensures the wipe runs even when the user
+      // bypasses the form via Skip or the install fails before reaching
+      // the creds step.
+      const passEl = document.getElementById("wifi-password");
+      if (passEl) passEl.value = "";
+    }
+    let unloadGuard = null;
+    function armUnloadGuard() {
+      if (unloadGuard) return;
+      unloadGuard = (e) => {
+        e.preventDefault();
+        e.returnValue = "";  // legacy contract — Chrome ignores the string
+      };
+      window.addEventListener("beforeunload", unloadGuard);
+    }
+    function disarmUnloadGuard() {
+      if (!unloadGuard) return;
+      window.removeEventListener("beforeunload", unloadGuard);
+      unloadGuard = null;
+    }
+
+    // Only http(s) URLs are safe as a link href (same guard as
+    // myDevices.addProvisionedDevice) — a malformed value must never become a
+    // javascript:/data:/file: link.
+    function isHttpUrl(u) {
+      try { const p = new URL(u); return p.protocol === "http:" || p.protocol === "https:"; }
+      catch (_) { return false; }
+    }
+    // Both terminal sections (done / error) dismiss the modal via closeModal.
+    document.getElementById("done-close").addEventListener("click", closeModal);
+    document.getElementById("error-close").addEventListener("click", closeModal);
+
+    // Board-details popup dismissal. ESC-to-close comes with a modal <dialog>;
+    // the explicit ✕ and backdrop-click dismissal are wired here. Clicking the
+    // backdrop is not dismissed by the browser by default (unless the markup
+    // opts in, e.g. via a `closedby` attribute), so the second listener closes
+    // the dialog when the click target is the <dialog> element itself rather
+    // than one of its children — which is what a click on the backdrop reports.
+    // NOTE(review): this relies on the dialog having no padding of its own, so
+    // clicks inside the card always land on a child element — confirm.
+    const bd = document.getElementById("board-details");
+    document.getElementById("bd-close").addEventListener("click", () => bd.close());
+    bd.addEventListener("click", (e) => { if (e.target === bd) bd.close(); });
+
+    // Log panel: collapsible, fed by the orchestrator's onLog callback.
+    // Auto-scrolls to bottom on append so the latest line is always visible.
+    const logEl = document.getElementById("install-log");
+    const logToggle = document.getElementById("log-toggle");
+    logToggle.addEventListener("click", () => {
+      logEl.hidden = !logEl.hidden;
+      logToggle.textContent = logEl.hidden ? "Show log" : "Hide log";
+    });
+    function appendLog(line) {
+      logEl.textContent += line + "\n";
+      logEl.scrollTop = logEl.scrollHeight;
+    }
+
+    // --- Orchestrator UI bindings --------------------------------------
+    // Mapping from orchestrator's progress stage → which modal section to
+    // show + any per-stage detail rendering. Centralizes the UI ↔ flow
+    // contract so the orchestrator stays UI-agnostic.
+    function handleProgress(stage, detail) {
+      switch (stage) {
+        case "request-port":
+          showSection("connecting");
+          document.getElementById("connecting-detail").textContent =
+            "Pick the serial port the device is connected to.";
+          break;
+        case "wrong-port-retry":
+          // Distinct section with a Try-again button gates the OS-picker
+          // re-prompt so the user reads the guidance BEFORE the OS modal
+          // covers the page (the picker's a native dialog, no way around
+          // its overlay; if we just updated connecting-detail and went
+          // straight to requestPort(), the message would never be seen).
+          showSection("wrongPort");
+          break;
+        case "connect-flash":
+          showSection("connecting");
+          document.getElementById("connecting-detail").textContent =
+            detail && detail.chipName
+              ? `Detected ${detail.chipName}`
+              : "Detecting chip…";
+          break;
+        case "fetch-firmware":
+          showSection("flashing");
+          document.getElementById("flashing-status").textContent =
+            "Downloading firmware…";
+          document.getElementById("flash-bar").style.width = "0%";
+          break;
+        case "erase": {
+          showSection("flashing");
+          document.getElementById("flashing-status").textContent =
+            "Erasing flash (this takes ~12 s)…";
+          // esptool-js's eraseFlash doesn't report progress — animate the
+          // bar so the user sees the page isn't hung. flash stage clears
+          // the class below and switches to determinate progress.
+          //
+          // Clear the inline width set by an earlier stage (fetch-firmware
+          // forces `style.width = "0%"`); inline style beats the CSS class's
+          // `width: 100%` rule, so the animation would run invisibly on a
+          // zero-width bar without this reset.
+          const bar = document.getElementById("flash-bar");
+          bar.style.width = "";
+          bar.classList.add("indeterminate");
+          break;
+        }
+        case "flash": {
+          showSection("flashing");
+          const pct = detail && typeof detail.pct === "number" ? detail.pct : 0;
+          const bar = document.getElementById("flash-bar");
+          bar.classList.remove("indeterminate");
+          document.getElementById("flashing-status").textContent =
+            `Writing firmware… ${pct}%`;
+          bar.style.width = `${pct}%`;
+          break;
+        }
+        case "reboot":
+          showSection("connecting");
+          document.getElementById("connecting-detail").textContent =
+            "Rebooting device…";
+          break;
+        case "connect-improv":
+          showSection("connecting");
+          document.getElementById("connecting-detail").textContent =
+            "Connecting over Improv…";
+          break;
+        case "wifi-creds-form": {
+          buildWifiForm();
+          showSection("wifiForm");
+          // Prefill the last-used SSID (not password — that stays out of
+          // localStorage as a privacy / security-scanner concession). Focus
+          // password if SSID is prefilled (user only needs to type the
+          // password), else focus SSID.
+          const ssidEl = document.getElementById("wifi-ssid");
+          const passEl = document.getElementById("wifi-password");
+          // Clear the password input on every show. The form is built
+          // lazily once and re-used across multiple installs in the same
+          // page session; without this clear, a re-install would show the
+          // previous install's typed password in plaintext (well, dotted)
+          // inside the field. Don't leave that sitting in the DOM longer
+          // than the active install.
+          passEl.value = "";
+          try {
+            const saved = localStorage.getItem("projectMM.installer.lastSsid");
+            if (saved) ssidEl.value = saved;
+          } catch (_) { /* hostile storage */ }
+          requestAnimationFrame(() => (ssidEl.value ? passEl : ssidEl).focus());
+          break;
+        }
+        case "provisioning":
+          showSection("provisioning");
+          document.getElementById("provisioning-status").textContent =
+            "Connecting to your WiFi…";
+          break;
+        case "set-board":
+          showSection("provisioning");
+          document.getElementById("provisioning-status").textContent =
+            "Setting board identity…";
+          break;
+        case "apply-defaults":
+          showSection("provisioning");
+          document.getElementById("provisioning-status").textContent =
+            detail && detail.board
+              ? `Applying device defaults for ${detail.board}…`
+              : "Applying device defaults…";
+          break;
+        case "needs-ip":
+          showSection("needsIp");
+          // Focus the input so the user can start typing immediately.
+          requestAnimationFrame(() => {
+            const el = document.getElementById("needs-ip-input");
+            if (el) el.focus();
+          });
+          break;
+        case "done":
+          // onSuccess fires next; section toggles there once URL is known.
+          break;
+      }
+    }
+
+    // Render the WiFi-creds form into #section-wifi-form on first use.
+    // Idempotent — guarded by _wifiFormBuilt, so every call after the first is
+    // a no-op. See the comment on #section-wifi-form's empty div for why this
+    // is deferred (avoids the macOS iCloud Passwords prompt on page load).
+    //
+    // Attributes on the injected inputs:
+    // - autocomplete="off" (both fields): defeats Chrome's built-in field-fill
+    //   (the browser's own offer; not the OS keychain). On the password field
+    //   this is deliberately NOT "new-password": that value actively signals
+    //   password managers "credential being created, offer a generated
+    //   value", which is wrong here — the user is typing their existing
+    //   home-WiFi password, not creating a new account.
+    // - data-lpignore / data-1p-ignore: vendor opt-outs for LastPass /
+    //   1Password's browser-extension fill icons.
+    //
+    // The OS keychain prompt (iCloud Passwords) ignores all of the above
+    // when it scans the DOM at page load; deferring the form is the only
+    // reliable way to keep it quiet until the user is actually mid-install.
+    let _wifiFormBuilt = false;
+    function buildWifiForm() {
+      if (_wifiFormBuilt) return;
+      _wifiFormBuilt = true;
+      const section = document.getElementById("section-wifi-form");
+      // The markup is a static literal (no interpolated values). The inline
+      // onsubmit="return false" blocks native form submission; the submit
+      // listener is attached separately by uiWaitForCreds.
+      section.innerHTML = `
+        <div class="install-status">Flash done. Enter your WiFi credentials to provision the device.</div>
+        <form id="wifi-form" class="install-form" onsubmit="return false">
+          <label for="wifi-ssid">Network name (SSID)</label>
+          <input type="text" id="wifi-ssid" autocomplete="off"
+                 data-lpignore="true" data-1p-ignore required>
+          <label for="wifi-password">Password</label>
+          <input type="password" id="wifi-password" autocomplete="off"
+                 data-lpignore="true" data-1p-ignore>
+          <div class="install-actions">
+            <button type="button" class="secondary" id="wifi-skip">Skip</button>
+            <button type="submit" class="primary" id="wifi-connect">Connect</button>
+          </div>
+        </form>
+      `;
+    }
+
+    // Returns a Promise the orchestrator awaits — resolves when the user
+    // submits the WiFi form. The form's Connect button completes via the
+    // form's submit event; the Skip button bypasses WiFi (the device
+    // falls back to its AP). Skip resolves with empty creds — the
+    // orchestrator's provision() with empty SSID will fail fast and the
+    // user falls back to the AP flow as documented in Step 2.
+    function uiWaitForCreds() {
+      return new Promise((resolve) => {
+        const form = document.getElementById("wifi-form");
+        const ssidEl = document.getElementById("wifi-ssid");
+        const passEl = document.getElementById("wifi-password");
+        const skipBtn = document.getElementById("wifi-skip");
+
+        const onSubmit = (e) => {
+          e.preventDefault();
+          cleanup();
+          const ssid = ssidEl.value.trim();
+          // Save SSID only — password stays out of localStorage. WiFi SSIDs
+          // are network-visible anyway (any scanning device sees them);
+          // passwords are not.
+          try {
+            if (ssid) localStorage.setItem("projectMM.installer.lastSsid", ssid);
+          } catch (_) { /* hostile storage */ }
+          resolve({ ssid, password: passEl.value });
+        };
+        const onSkip = () => {
+          cleanup();
+          resolve({ ssid: "", password: "" });
+        };
+        const cleanup = () => {
+          form.removeEventListener("submit", onSubmit);
+          skipBtn.removeEventListener("click", onSkip);
+        };
+        form.addEventListener("submit", onSubmit);
+        skipBtn.addEventListener("click", onSkip);
+      });
+    }
+
+    // Shown when the orchestrator's probe-open on the user's pre-picked
+    // port fails. The OS port picker is modal and covers the install
+    // modal, so any guidance written and immediately followed by
+    // requestPort() is invisible — gate the re-prompt behind a Try
+    // again click so the message lands before the OS picker covers
+    // the page. Returns a Promise that resolves (with no value) when the
+    // user clicks Try again; the click listener removes itself first.
+    function uiWaitForPortRetry() {
+      return new Promise((resolve) => {
+        const btn = document.getElementById("wrong-port-retry");
+        const onClick = () => {
+          btn.removeEventListener("click", onClick);
+          resolve();
+        };
+        btn.addEventListener("click", onClick);
+      });
+    }
+
+    // Symmetric with uiWaitForCreds. Returns a Promise that resolves with one of:
+    //   { action: "ip", url: "<typed value>" }    — user typed an IP + Add
+    //   { action: "skip" }                        — user clicked Skip
+    //   { action: "retry" }                       — user clicked Try Improv again
+    // The typed value is only trimmed here; normalisation lives in the
+    // orchestrator so the host page stays UI-only. The retry action
+    // is the orchestrator's signal to re-run Improv `initialize()`; while
+    // that's in flight the host re-shows the dialog via showNeedsIpRetrying()
+    // (input + buttons disabled, "Trying Improv again…" status visible).
+    // All three listeners are detached as soon as one action resolves.
+    function uiWaitForIp() {
+      return new Promise((resolve) => {
+        const form = document.getElementById("needs-ip-form");
+        const input = document.getElementById("needs-ip-input");
+        const skipBtn = document.getElementById("needs-ip-skip");
+        const retryBtn = document.getElementById("needs-ip-retry");
+
+        const onSubmit = (e) => {
+          e.preventDefault();
+          // Reject whitespace-only input here so the user sees the
+          // browser's built-in validation tooltip on the same field
+          // instead of a silent re-prompt after the orchestrator
+          // discovers an empty normalized URL downstream. `required`
+          // on the input catches empty submits but not "   " — trim
+          // first, then use setCustomValidity to surface the same UI.
+          const trimmed = input.value.trim();
+          if (!trimmed) {
+            input.setCustomValidity("Enter an IP address or hostname.");
+            input.reportValidity();
+            input.setCustomValidity("");  // clear so the next valid submit proceeds
+            // Listeners stay attached: the Promise is still pending and the
+            // user can correct the value and submit again.
+            return;
+          }
+          cleanup();
+          resolve({ action: "ip", url: trimmed });
+        };
+        const onSkip = () => {
+          cleanup();
+          resolve({ action: "skip" });
+        };
+        const onRetry = () => {
+          cleanup();
+          resolve({ action: "retry" });
+        };
+        const cleanup = () => {
+          form.removeEventListener("submit", onSubmit);
+          skipBtn.removeEventListener("click", onSkip);
+          retryBtn.removeEventListener("click", onRetry);
+        };
+        form.addEventListener("submit", onSubmit);
+        skipBtn.addEventListener("click", onSkip);
+        retryBtn.addEventListener("click", onRetry);
+      });
+    }
+
+    // Toggle the needs-ip dialog into "retry in flight" mode: input + all
+    // three buttons disabled, retry status line visible, input field
+    // cleared so the user starts fresh if retry fails. The orchestrator
+    // calls this before re-running Improv `initialize()`; on completion
+    // (success or failure) it returns to the normal `uiWaitForIp()` call,
+    // which by re-rendering the dialog implicitly re-enables everything.
+    function showNeedsIpRetrying(retrying) {
+      const form = document.getElementById("needs-ip-form");
+      const input = document.getElementById("needs-ip-input");
+      const skipBtn = document.getElementById("needs-ip-skip");
+      const retryBtn = document.getElementById("needs-ip-retry");
+      const addBtn = document.getElementById("needs-ip-add");
+      const status = document.getElementById("needs-ip-retry-status");
+      input.disabled = retrying;
+      skipBtn.disabled = retrying;
+      retryBtn.disabled = retrying;
+      addBtn.disabled = retrying;
+      status.hidden = !retrying;
+      if (retrying) input.value = "";
+    }
+
+    function handleSuccess({ url, mdns, board, applyDefaults = true, defaultsApplied = false, viaHttp, alreadyOnline, ethOnlyNoLink }) {
+      // Fills in the "done" screen for a finished install, or closes the modal when
+      // there is nothing to report. `applyDefaults` is the checkbox INTENT,
+      // `defaultsApplied` says whether the config push actually ran; every branch
+      // reports from the latter. viaHttp / alreadyOnline are accepted but not read here.
+      disarmUnloadGuard();
+      const statusEl = document.getElementById("done-status");
+      const urlEl = document.getElementById("done-url");
+      const mdnsEl = document.getElementById("done-url-mdns");
+      const note = document.getElementById("done-defaults");
+      // Both "no reachable address" screens blank the IP link and hide the mDNS link.
+      const clearLinks = () => {
+        urlEl.removeAttribute("href");
+        urlEl.textContent = "";
+        mdnsEl.hidden = true;
+      };
+      // Clear the amber notice styling from any prior install in this session — only the
+      // eth-only-no-link branch re-adds it, so every other outcome shows the plain note.
+      note.classList.remove("install-done-note--notice");
+      // Default header: most done outcomes mean the device reported an IP (it's reachable).
+      // The not-online branches below override it.
+      statusEl.textContent = "Device is online!";
+      // Defaults are pushed DURING the install over serial, so this screen only confirms + links.
+      if (ethOnlyNoLink) {
+        // Ethernet-only firmware flashed, but no cable was connected so the device isn't
+        // online yet (and this build has no WiFi to provision). Tell the user the one
+        // thing they need to do: plug in Ethernet — the device then comes online on its
+        // own and the link appears at its IP / <name>.local.
+        showSection("done");
+        statusEl.textContent = "Flashed — connect Ethernet";
+        clearLinks();
+        // The device-model defaults are pushed over SERIAL during install (no network
+        // needed), so on this path they normally DID apply — report that honestly and
+        // append a caveat only when the push was wanted but did not run.
+        const defaultsNote = defaultsApplied
+          ? ` ${board} defaults were applied.`
+          : (board && applyDefaults ? ` ${board} defaults weren't applied — apply them later from MoonDeck.` : "");
+        note.textContent =
+          `Flashed. This is an Ethernet-only firmware — connect a network cable and the device comes online on its own (find it via its IP or <name>.local, or in MoonDeck).${defaultsNote}`;
+        note.classList.add("install-done-note--notice");   // amber: flashed OK, action needed (plug in Ethernet)
+        note.hidden = false;
+        return;
+      }
+      if (!url) {
+        // No device URL (user skipped the IP prompt, or an eth-only/no-Improv device).
+        // If a model was picked, report its defaults outcome — else just close.
+        if (board && applyDefaults) {
+          showSection("done");
+          // No device address → not online; don't claim "Device is online!".
+          statusEl.textContent = "Flashed";
+          clearLinks();
+          // Normally no config push happened on this path, but trust `defaultsApplied`
+          // if the orchestrator reports one: never tell the user that defaults which
+          // DID go in are missing just because no address came back.
+          note.textContent = defaultsApplied
+            ? `Flashed. ${board} defaults were applied.`
+            : `Flashed. ${board} defaults weren't applied (no device address) — apply them later from MoonDeck on your network.`;
+          note.hidden = false;
+          return;
+        }
+        closeModal();
+        return;
+      }
+      showSection("done");
+      // Always show the IP link (guaranteed to work). When the boot serial also
+      // reported the device's <deviceName>.local name, show it as a second link —
+      // it survives a DHCP lease change but only resolves where mDNS works.
+      // Only assign href for http(s) URLs (same guard as myDevices.addProvisionedDevice),
+      // so a malformed boot-log value can't become a javascript:/data: link.
+      urlEl.textContent = url;
+      if (isHttpUrl(url)) urlEl.href = url; else urlEl.removeAttribute("href");
+      if (mdns) {
+        const mdnsUrl = `http://${mdns}/`;
+        mdnsEl.textContent = mdnsUrl;
+        if (isHttpUrl(mdnsUrl)) mdnsEl.href = mdnsUrl; else mdnsEl.removeAttribute("href");
+      }
+      mdnsEl.hidden = !mdns;
+      // Report the defaults outcome HONESTLY, from `defaultsApplied` (did the serial
+      // push actually run?), not `applyDefaults` (the checkbox intent): applied,
+      // wanted-but-couldn't (model picked + ticked but no push happened — e.g. an
+      // Improv-less path), or kept-config (unticked). No board at all → no note.
+      if (defaultsApplied) {
+        note.textContent = `Applied ${board} defaults.`;
+      } else if (board && applyDefaults) {
+        note.textContent = `Flashed, but ${board} defaults weren't applied — apply them from MoonDeck on your network.`;
+      } else if (board) {
+        note.textContent = `Kept the device's existing config (device defaults not applied).`;
+      }
+      note.hidden = !(defaultsApplied || board);
+      // Store no board unless the defaults actually applied, so the saved entry doesn't
+      // claim a model the device wasn't configured to.
+      myDevices.addProvisionedDevice(url, defaultsApplied ? board : "");
+    }
+
+    function handleError(stage, error) {
+      // Terminal failure: drop the tab-close guard, log, then show the error section.
+      disarmUnloadGuard();
+      console.error("[install]", stage, error);
+      showSection("error");
+      document.getElementById("error-message").textContent = `Stage: ${stage}\n${error?.message || error}`;
+    }
+
+    // --- Pre-pick port -------------------------------------------------
+    // Two-option dropdown: the currently-picked port (or a "Pick a port…"
+    // placeholder), and a "Pick another port…" sentinel that opens the
+    // browser's Web Serial picker. We never list multiple previously-
+    // granted ports — Web Serial doesn't expose OS device names, so a list
+    // of "Port 1 / Port 2 / Port 3" is just confusing. The native picker
+    // is the only place where the user can match a port to a physical
+    // device (it shows the OS device name there).
+    //
+    // We also don't pre-select from `navigator.serial.getPorts()` on page
+    // load. A surviving grant is not a guarantee the port is still openable
+    // — if the device re-enumerated (reboot, replug, host sleep), `open()`
+    // fails with "Failed to open serial port" mid-install. Cheaper UX to
+    // always have the user re-pick this session than to chase a confusing
+    // mid-flash error. installer.start() falls back to its own requestPort()
+    // prompt if the user clicks Install without pre-picking.
+    let pickedPort = null;
+    const portSelect = document.getElementById("port-select");
+    const PICK_NEW = "__pick_new__"; // sentinel value for the "pick another" option
+
+    function rebuildPortSelect() {
+      // Rebuilds #port-select from scratch so it mirrors `pickedPort`:
+      //   no port → a single "Pick a port…" entry carrying the PICK_NEW sentinel;
+      //   picked  → "Port selected" (value "current") followed by a
+      //             "Pick another port…" entry carrying the sentinel.
+      // The no-port state deliberately has ONE entry (select-as-button): there is
+      // no extra "Pick another" row to collapse back to after a cancelled picker.
+      // Browsers fire `change` only when the chosen <option> changes, so
+      // re-choosing that lone entry never reaches the change listener — the
+      // mousedown listener registered after this function covers that case.
+      // Appends one <option> with the given value and visible label.
+      const addOption = (value, label) => {
+        const opt = document.createElement("option");
+        opt.value = value;
+        opt.textContent = label;
+        portSelect.appendChild(opt);
+      };
+      // Start empty — every call recreates all entries.
+      portSelect.replaceChildren();
+      if (pickedPort) {
+        addOption("current", "Port selected");
+        addOption(PICK_NEW, "Pick another port…");
+        portSelect.value = "current";
+      } else {
+        addOption(PICK_NEW, "Pick a port…");
+        portSelect.value = PICK_NEW;
+      }
+    }
+
+    // Single entry point for "the port state may have changed": rebuild the
+    // dropdown, then tell the picker so it can re-evaluate its Install gate (its
+    // `hasPort` callback reads pickedPort). Used at init and after every picker attempt.
+    function syncPortState() {
+      rebuildPortSelect();                 // dropdown entries mirror pickedPort
+      installPicker.notifyPortChanged();   // picker re-checks hasPort()
+    }
+
+    syncPortState();
+
+    async function openPortPicker() {
+      // Shows the browser's Web Serial picker. On a grant the port lands in
+      // `pickedPort` and an auto-detect starts; otherwise the previous pick stays.
+      let granted = false;
+      try {
+        pickedPort = await navigator.serial.requestPort({});
+        granted = true;
+        // A pending detect() handle is bound to the OLD port — drop it so the
+        // next Detect/Install opens the newly-picked port cleanly.
+        await installer.clearDetected();
+      } catch (e) {
+        // NotFoundError = user cancelled the picker — keep whatever was picked before.
+        // Anything else is a real fault: still non-fatal, but leave a console trace.
+        if (!e || e.name !== "NotFoundError") console.warn("[port-picker]", e);
+      }
+      syncPortState();
+      // Auto-detect only on a genuine new grant; runDetect routes its failures to the status line.
+      if (granted) {
+        const status = document.getElementById("detect-status");
+        installPicker.runDetect((text) => { status.textContent = text; });
+      }
+    }
+
+    portSelect.addEventListener("change", () => {
+      if (portSelect.value === PICK_NEW) openPortPicker();   // sentinel chosen → open the native picker
+    });
+    // Mousedown rather than click — `change` won't fire when the only option
+    // (the "Pick a port…" entry in the no-port state) is "re-chosen", and a click
+    // on a <select> opens the native list before our handler runs. Mousedown
+    // fires before the list pops up; preventDefault suppresses the list and the
+    // Web Serial picker opens instead. Only applies in the no-port state — once
+    // a port is picked the regular change-event path handles it.
+    // NOTE(review): keyboard activation never raises mousedown — confirm the no-port state is reachable without a mouse.
+    portSelect.addEventListener("mousedown", (e) => {
+      if (!pickedPort) {
+        e.preventDefault();
+        openPortPicker();
+      }
+    });
+
+    // --- Serial monitor -------------------------------------------------
+    // Live read-only viewer of the picked port at 115200 baud. Web Serial
+    // owns the port exclusively, so the monitor and the install/erase flows
+    // exclude each other in both directions (see openModal / closeModal for
+    // the button-disable side, and the closeMonitor calls in onDetect /
+    // onInstall / the Erase handler for the port-release side).
+    const _monitor = { port: null, reader: null, closing: false };   // port: held while the monitor runs · reader: the read loop's active reader · closing: closeMonitor() in flight
+    const monitorBackdrop = document.getElementById("monitor-backdrop");   // carries the "open" class while the dialog shows
+    const monitorOutput = document.getElementById("monitor-output");       // the log text
+    const monitorStatus = document.getElementById("monitor-status");       // one-line status text
+    const monitorBtn = document.getElementById("monitor-btn");             // opens the monitor
+
+    function setMonitorStatus(text) { monitorStatus.textContent = text; }   // replaces the #monitor-status text
+
+    function appendMonitor(text) {
+      // Autoscroll only when the user is already at the bottom (4px slack) — if they
+      // scrolled up to read something we must not yank them back down.
+      const atBottom = monitorOutput.scrollTop + monitorOutput.clientHeight
+                       >= monitorOutput.scrollHeight - 4;
+      monitorOutput.append(text);   // adds a text node; `textContent +=` re-read and rebuilt the whole log per chunk
+      if (atBottom) monitorOutput.scrollTop = monitorOutput.scrollHeight;
+    }
+
+    async function openMonitor() {
+      // Opens the monitor dialog on the picked port and starts the read loop.
+      // `_monitor.opening` covers the awaits before `_monitor.port` is set — without it a
+      // fast second click ran the whole open sequence a second time against the same port.
+      if (_monitor.port || _monitor.opening) return;
+      // Browser-support gate: Safari / Firefox have no Web Serial API, and openPortPicker's
+      // catch would swallow the resulting TypeError — so surface the existing banner explicitly.
+      if (!("serial" in navigator)) {
+        document.getElementById("browser-warning").style.display = "block";
+        document.getElementById("browser-warning").scrollIntoView({behavior: "smooth"});
+        return;
+      }
+      _monitor.opening = true;
+      try {
+        if (!pickedPort) {
+          // Called from a user gesture (Monitor button click), so requestPort() is allowed.
+          await openPortPicker();
+          if (!pickedPort) return;  // user cancelled
+        }
+        monitorOutput.textContent = "";
+        setMonitorStatus("Opening port at 115200…");
+        monitorBackdrop.classList.add("open");
+        try {
+          await pickedPort.open({ baudRate: 115200 });
+        } catch (e) {
+          // An already-open port is fine — a prior detect/install may have left it
+          // open and the reader still works on it. Anything else aborts the open.
+          if (!String(e.message || "").includes("already open")) {
+            setMonitorStatus(`Failed to open: ${e.message || e}`);
+            return;
+          }
+        }
+        _monitor.port = pickedPort;
+      } finally {
+        _monitor.opening = false;   // always re-arm, including the early returns above
+      }
+      setMonitorStatus("Reading (115200 8N1)…");
+      readLoop().catch(e => {
+        // Read errors land here once — surface them; don't loop forever on a dead port.
+        if (!_monitor.closing) setMonitorStatus(`Read error: ${e.message || e}`);
+      });
+    }
+
+    async function readLoop() {   // pumps bytes from the monitor's port into the log until the stream ends or read() throws
+      const decoder = new TextDecoder("utf-8", { fatal: false });   // fatal:false → malformed bytes never throw
+      _monitor.reader = _monitor.port.readable.getReader();         // stored so closeMonitor() can cancel it
+      try {
+        while (true) {
+          const { value, done } = await _monitor.reader.read();
+          if (done) break;   // stream finished — e.g. after closeMonitor() cancelled the reader
+          if (value && value.length) appendMonitor(decoder.decode(value, { stream: true }));   // stream:true carries a split multi-byte character over to the next chunk
+        }
+      } finally {
+        try { _monitor.reader.releaseLock(); } catch (_) { /* already released */ }
+        _monitor.reader = null;   // runs on normal exit and on a read error alike
+      }
+    }
+
+    async function closeMonitor() {
+      // Hides the monitor dialog and lets go of the serial port. Best-effort:
+      // cancel()/close() failures are ignored. A call made while another close is
+      // still in flight returns immediately (`_monitor.closing`).
+      if (_monitor.closing) return;
+      _monitor.closing = true;
+      monitorBackdrop.classList.remove("open");
+      // cancel() makes the pending read() return {done:true}; the read loop then
+      // exits and releases the lock in its finally.
+      const activeReader = _monitor.reader;
+      if (activeReader) await activeReader.cancel().catch(() => { /* ignore */ });
+      const heldPort = _monitor.port;
+      if (heldPort) await heldPort.close().catch(() => { /* ignore */ });
+      // Back to the idle state so openMonitor() can run again.
+      _monitor.port = null;
+      _monitor.closing = false;
+    }
+
+    // Pulse RTS low → high to trigger the device's auto-reset circuit
+    // (DTR/RTS combo mirrors what esptool does pre-flash; for a bare
+    // reset, toggling RTS alone is enough on most USB-Serial bridges).
+    // setSignals() requires the port to be open — we are, since the
+    // monitor is running. After the pulse the device reboots and its
+    // boot log starts streaming through the read loop already in place.
+    async function monitorReset() {
+      // No-op unless the monitor currently holds an open port (setSignals needs one).
+      if (!_monitor.port) return;
+      const pause = (ms) => new Promise((resolve) => setTimeout(resolve, ms));
+      try {
+        await _monitor.port.setSignals({ dataTerminalReady: false, requestToSend: true });
+        await pause(100);   // hold the pulse for 100 ms before releasing RTS
+        await _monitor.port.setSignals({ dataTerminalReady: false, requestToSend: false });
+        appendMonitor("\n--- reset ---\n");
+      } catch (e) { setMonitorStatus(`Reset failed: ${e.message || e}`); }
+    }
+
+    monitorBtn.addEventListener("click", openMonitor);   // prompts for a port first when none is picked
+    document.getElementById("monitor-close").addEventListener("click", closeMonitor);
+    document.getElementById("monitor-clear").addEventListener("click", () => {
+      monitorOutput.textContent = "";   // clears the on-screen log only; the read loop is untouched
+    });
+    document.getElementById("monitor-reset").addEventListener("click", monitorReset);   // RTS pulse, see monitorReset
+    // Esc closes the monitor, but only while its backdrop is open (same affordance
+    // the install modal has via closeModal — keeps the two dialogs symmetric).
+    document.addEventListener("keydown", (e) => {
+      if (e.key === "Escape" && monitorBackdrop.classList.contains("open")) {
+        closeMonitor();
+      }
+    });
+
+    // --- Picker wiring -------------------------------------------------
+    const _pickerReady = installPicker.init({   // awaited by the board grid before it touches the picker's #rp-board
+      container: document.getElementById("picker-mount"),
+      ownFirmwareKey: null,  // web installer flashes any firmware variant
+      installRowExtras: document.getElementById("erase-row"),
+      boardSupport,  // board catalog + chip detection (web-installer-only module)
+      // Gate Install on a picked USB port — the web installer requires the user
+      // to choose the port in the dropdown before flashing. (notifyPortChanged(),
+      // called from syncPortState(), re-evaluates the button whenever pickedPort changes.)
+      hasPort: () => !!pickedPort,
+      onDetect: async () => {
+        // The monitor (if open) holds the port — release it before esptool
+        // claims it, same as the install path. detect() keeps the port open
+        // afterwards so the following Install reuses it.
+        if (_monitor.port) await closeMonitor();
+        return await installer.detect({ port: pickedPort, onLog: appendLog });
+      },
+      onInstall: async (firmware, manifestUrl /*, binaryUrl */) => {
+        // If the monitor is open it holds the port — release it before
+        // esptool tries to claim it. The reverse lock (monitor button
+        // disabled for the install's duration) lives in openModal /
+        // closeModal so the user can't reopen the monitor mid-flash.
+        if (_monitor.port) await closeMonitor();
+        const localUrl = toLocalUrl(manifestUrl);
+        const board = installPicker.getSelectedBoard();
+        const txPower = installPicker.getSelectedBoardTxPower();
+        openModal(board ? `Installing projectMM on ${board}` : `Installing ${firmware}`);   // title falls back to the firmware name when no board is picked
+        showSection("connecting");
+        document.getElementById("connecting-detail").textContent = "";
+        const eraseBefore = document.getElementById("erase-before-flash").checked;
+        // Apply the device-model's catalog defaults (modules + controls) after flashing.
+        // Default-ticked-with-erase (see the change listener below): a clean slate wants
+        // defaults; re-flashing a configured device should NOT silently re-inject (the
+        // catalog's replaceChildren would delete the user's effects). Untick to flash the
+        // firmware while keeping the device's current config. txPower (the brown-out cap)
+        // is a hardware trait, not a "default", so it still applies regardless — only the
+        // module/control inject is gated.
+        const applyDefaults = document.getElementById("apply-device-defaults").checked;
+        // Ethernet-only firmware: WiFi compiled out (firmwares.json `eth_only`). Keyed off the
+        // name like isCompatible's `-eth*` rule — a `-eth` variant is eth-only UNLESS it's the
+        // `-eth-wifi` co-processor build. The orchestrator uses this to skip WiFi provisioning
+        // (the build has no WIFI_SETTINGS RPC) and tell the user to connect Ethernet instead.
+        const ethOnly = /-eth$/.test(firmware);   // true only when the name ENDS in "-eth" ("…-eth-wifi" does not)
+        await installer.start({
+          // pickedPort may be null — orchestrator falls back to requestPort.
+          port: pickedPort,
+          manifestUrl: localUrl,
+          board,         // names the install title + identifies the catalog entry
+          applyDefaults, // gates the APPLY_OP config push (not txPower, sent earlier)
+          txPower,
+          eraseBefore,
+          ethOnly,
+          onProgress: handleProgress,
+          uiWaitForCreds,
+          uiWaitForIp,
+          uiShowNeedsIpRetrying: showNeedsIpRetrying,
+          uiWaitForPortRetry,
+          onSuccess: handleSuccess,
+          onError: handleError,
+          onLog: appendLog,
+        });   // NOTE(review): assumes start() reports failures through onError rather than rejecting — confirm
+      },
+    });
+
+    // Auto-tie "Apply device defaults" to "Erase chip first": ticking erase (a clean
+    // slate) ticks defaults; unticking erase unticks it. The user can still override
+    // either box independently afterwards — the tie only fires on an erase toggle. Both
+    // start unticked (erase's default), so a plain re-flash keeps the device's config.
+    (() => {
+      const [eraseBox, defaultsBox] = ["erase-before-flash", "apply-device-defaults"]
+        .map((id) => document.getElementById(id));
+      // Either box may be absent from the page — then there is nothing to tie.
+      if (!eraseBox || !defaultsBox) return;
+      eraseBox.addEventListener("change", () => { defaultsBox.checked = eraseBox.checked; });
+    })();
+
+    myDevices.init({
+      container: document.getElementById("devices-mount"),
+      // Erase flow for a saved device: confirm, free the port, run eraseOnly() in the modal.
+      onErase: async (device) => {
+        const question =
+            `Erase ${device.name}? This wipes WiFi credentials and all ` +
+            `module state. You can flash a fresh firmware afterwards.`;
+        if (!confirm(question)) return;
+        // Same port-lock concern as install: release the monitor before
+        // esptool tries to claim the port.
+        if (_monitor.port) await closeMonitor();
+        openModal(`Erasing ${device.name}`);
+        showSection("connecting");
+        document.getElementById("connecting-detail").textContent = "";
+        const showErased = () => {
+          disarmUnloadGuard();   // erase finished — drop the tab-close warning
+          showSection("done");
+          // Overwrite any header a prior install left behind — erase is not "Device is online!".
+          document.getElementById("done-status").textContent = "Erase complete";
+          const link = document.getElementById("done-url");
+          link.removeAttribute("href");
+          link.textContent = "Erase complete — flash a fresh firmware to use the device again.";
+          document.getElementById("done-url-mdns").hidden = true;  // no device URL after erase
+          document.getElementById("done-defaults").hidden = true;  // nothing applied on erase
+        };
+        await installer.eraseOnly({
+          port: pickedPort,
+          onProgress: handleProgress,
+          uiWaitForPortRetry,
+          onSuccess: showErased,
+          onError: handleError,
+          onLog: appendLog,
+        });
+      },
+    });
+
+    // Show the unsupported-browser banner when Web Serial isn't available.
+    if (!("serial" in navigator)) {
+      document.getElementById("browser-warning").style.display = "block";
+    }
+
+    // --- picture board grid --------------------------------
+    // Renders deviceModels.json as a visual card grid; on select it drives the shared
+    // picker's own (hidden) #rp-board <select> via a dispatched change event, so
+    // the existing release/firmware narrowing + flash flow runs unchanged. The
+    // shared install-picker.js is NOT modified.
+    (async function boardGrid() {
+      let boards = [];
+      try {
+        const res = await fetch("./deviceModels.json");   // same catalog as the picker
+        boards = await res.json();
+      } catch (e) {
+        document.getElementById("board-grid").textContent = "Could not load deviceModels.json: " + e;
+        return;
+      }
+      await _pickerReady;   // ensure the picker has mounted its (hidden) #rp-board
+
+      const gridEl    = document.getElementById("board-grid");
+      const searchEl  = document.getElementById("board-search");
+      const summaryEl = document.getElementById("board-summary");
+      const labelEl   = document.getElementById("board-summary-label");
+      const thumbEl   = document.getElementById("board-summary-thumb");
+      const expandEl  = document.getElementById("board-expand");
+      const clearEl   = document.getElementById("board-clear");
+      let selected = installPicker.getSelectedBoard() || "";   // honour a restored pick
+
+      function ledDriver(b) {   // first "*LedDriver" module type minus the "Driver" suffix, else null
+        const hit = (b.modules || []).filter(m => /LedDriver$/.test(m.type || ""))[0];
+        return hit === undefined ? null : hit.type.replace(/Driver$/, "");
+      }
+      // A supported capability is "active" (configured) when deviceModels.json has a module
+      // backing it. The capability→module link is implicit in the data, so this map
+      // names it in one place (bespoke, but it just reads the modules[] already there —
+      // no duplicated `active` field to drift). A capability with no entry here, or no
+      // matching module, stays merely "supported". Each predicate gets the whole module
+      // object so it can inspect controls — needed to tell Ethernet from WiFi: both ride
+      // NetworkModule, but Ethernet is only ACTUALLY wired when the board's NetworkModule
+      // carries an ethType control set to a real PHY (not absent / "None"/0). WiFi is
+      // active wherever NetworkModule exists (the radio is always available); a board
+      // that lists WiFi as supported but ships no NetworkModule entry stays "supported".
+      const ethConfigured = (m) => {   // true only for an ethType control naming a real PHY
+        const t = m.controls ? m.controls.ethType : undefined;   // null / absent controls → no ethType
+        return t != null && t !== "" && t !== 0 && t !== "0" && t !== "None";   // null and "" count as "not set"
+      };
+      const CAP_MODULE = {   // capability label → predicate over one modules[] entry
+        LEDs:     m => /LedDriver$/.test(m.type || ""),
+        Ethernet: m => m.type === "NetworkModule" && ethConfigured(m),
+        WiFi:     m => m.type === "NetworkModule",
+        Audio:    m => /^Audio/.test(m.type || ""),
+      };
+      function capActive(b, cap) {   // true when some module of board `b` backs capability `cap`
+        const test = Object.prototype.hasOwnProperty.call(CAP_MODULE, cap) ? CAP_MODULE[cap] : null;   // own keys only — "toString" / "__proto__" must not hit Object.prototype
+        return !!test && (b.modules || []).some(m => test(m));
+      }
+      function setExpanded(open) {   // shows/hides the expandable grid and mirrors the state in aria-expanded
+        expandEl.hidden = !open;
+        summaryEl.setAttribute("aria-expanded", String(Boolean(open)));
+        if (open) searchEl.focus();   // opening moves focus straight to the search box
+      }
+      // Reflect the current pick in the collapsed summary (label + thumbnail).
+      function updateSummary() {
+        // `selected` is a board name; it matches no catalog entry when nothing is
+        // picked yet — the summary then falls back to the placeholder label.
+        const picked = boards.find(x => x.name === selected);
+        labelEl.textContent = picked ? picked.name : "Pick a device";
+        // The thumbnail shows only for a picked board that declares an image
+        // (a previous background-image stays set while hidden; it is never cleared).
+        const hasThumb = Boolean(picked && picked.image);
+        thumbEl.hidden = !hasThumb;
+        if (hasThumb) thumbEl.style.backgroundImage = `url("${picked.image}")`;
+      }
+      function pickBoard(name) {
+        // Records the pick, mirrors it into the picker's hidden #rp-board, then refreshes the grid UI.
+        selected = name;
+        const rpBoard = document.getElementById("rp-board");
+        if (rpBoard) {
+          // A Detect narrows #rp-board's options to one family. With "show all
+          // boards" the grid can pick a board from ANOTHER family — whose option
+          // isn't in the narrowed list, so `value = name` would silently no-op
+          // (value stays "") and the firmware list wouldn't narrow. Add the
+          // missing option first so the assignment takes.
+          const listed = Array.from(rpBoard.options, o => o.value);
+          if (name && !listed.includes(name)) {
+            const extra = document.createElement("option");
+            extra.value = name; extra.textContent = name;
+            rpBoard.appendChild(extra);
+          }
+          rpBoard.value = name;
+          rpBoard.dispatchEvent(new Event("change", { bubbles: true }));   // the picker's own change listener updates its state + re-filters firmware
+        }
+        updateSummary();
+        setExpanded(false);   // collapse back to the summary after a pick
+        render();             // keep the grid's selected-card state in sync for next open
+      }
+      // After a Detect, the shared picker narrows its hidden #rp-board <select>
+      // to the matching-family boards (applyDetectedChip → fillBoardOptions). The
+      // grid mirrors that: it shows only boards whose name is a current #rp-board
+      // option. Before any detect, #rp-board holds the FULL catalog (plus the
+      // "(any board)" / "Other…" pass-through, which has no value), so the grid
+      // shows everything — only a detect narrows it. Returns null = no constraint.
+      // `showAll` is the user's escape hatch (the "show all boards" toggle) for a
+      // wrong/unhelpful detection — when set, the filter is bypassed.
+      let showAll = false;
+      function narrowedNames() {
+        const sel = document.getElementById("rp-board");
+        // Valueless entries (the "(any board)" / "Other…" pass-through) are not boards.
+        const names = sel ? Array.from(sel.options, o => o.value).filter(v => v) : [];
+        // Nothing listed, or as many names as the catalog holds → not narrowed (null).
+        return names.length > 0 && names.length < boards.length ? new Set(names) : null;
+      }
+      function allowedNames() {   // null = no filter; "show all boards" bypasses a detect's narrowing
+        return (!showAll && narrowedNames()) || null;
+      }
+      // The detected family label (from the narrowed boards' shared chip), for the
+      // "Detected <family> · show all" notice. null when not narrowed.
+      function detectedFamily() {   // the one chip value shared by all narrowed boards, else null
+        const allow = narrowedNames();
+        const chips = allow ? boards.filter(b => allow.has(b.name)).map(b => b.chip) : [];
+        const [first, ...others] = new Set(chips);
+        return chips.length > 0 && others.length === 0 ? first : null;
+      }
+      function renderFilterNotice() {   // rebuilds the "Detected <family>" notice and its show-all / filter toggle
+        const notice = document.getElementById("board-filter-notice");
+        const fam = detectedFamily();
+        notice.replaceChildren();
+        notice.hidden = !fam;
+        if (!fam) return;
+        // Builds the toggle button; clicking flips `showAll` and re-renders the grid.
+        const toggle = (label, nextShowAll, tip) => {
+          const btn = document.createElement("button");
+          btn.textContent = label;
+          if (tip) btn.title = tip;
+          btn.onclick = () => { showAll = nextShowAll; render(); };
+          return btn;
+        };
+        if (showAll) {
+          notice.append(`Showing all boards. `, toggle(`Filter to detected ${fam}`, false));
+        } else {
+          notice.append(`Detected ${fam}. `, toggle("Show all boards", true,
+            "Detection wrong, or your board isn't in this family? Show the full catalog."));
+        }
+      }
+      function render() {   // redraws the filter notice and the grid for the current search text + narrowing
+        const q = (searchEl.value || "").toLowerCase();
+        const allow = allowedNames();
+        const shown = boards.filter((b) =>
+          (!q || b.name.toLowerCase().includes(q)) && (!allow || allow.has(b.name)));
+        renderFilterNotice();
+        gridEl.replaceChildren();
+        if (shown.length === 0) {
+          const empty = document.createElement("p");
+          empty.className = "note"; empty.textContent = "No boards match.";
+          gridEl.appendChild(empty);
+          return;
+        }
+        const byChip = shown.reduce((acc, b) => { (acc[b.chip] ||= []).push(b); return acc; }, {});
+        for (const chip of Object.keys(byChip).sort()) {
+          const heading = document.createElement("div");
+          heading.className = "bg-chip-label"; heading.textContent = chip;
+          gridEl.appendChild(heading);
+          byChip[chip].forEach((b) => gridEl.appendChild(card(b)));
+        }
+      }
+      function card(b) {
+        const el = document.createElement("div");
+        el.className = "bg-card" + (selected === b.name ? " selected" : "");
+        // Keyboard-accessible: a focusable option that picks on Enter/Space, the
+        // same affordance the click handler gives the mouse.
+        el.tabIndex = 0;
+        el.setAttribute("role", "option");
+        el.setAttribute("aria-selected", selected === b.name ? "true" : "false");
+        el.onclick = (ev) => { if (!ev.target.classList.contains("bg-link")) pickBoard(b.name); };
+        el.onkeydown = (ev) => {
+          if (ev.key === "Enter" || ev.key === " ") { ev.preventDefault(); pickBoard(b.name); }
+        };
+        const thumb = document.createElement("div");
+        thumb.className = "bg-thumb" + (b.image ? "" : " noimg");
+        // the deploy stages a copy of deviceModels.json
+        // + the referenced board images alongside this page, so an "image" path of
+        // "assets/boards/<slug>.jpg" resolves same-origin from this page.
+        if (b.image) thumb.style.backgroundImage = `url("${b.image}")`;
+        el.appendChild(thumb);
+        const body = document.createElement("div"); body.className = "bg-body";
+        const nm = document.createElement("div"); nm.className = "bg-name"; nm.textContent = b.name; body.appendChild(nm);
+        const meta = document.createElement("div"); meta.className = "bg-meta";
+        meta.textContent = b.chip + (ledDriver(b) ? " · " + ledDriver(b) : "");
+        body.appendChild(meta);
+        // Capability chips, three states by colour (not text): green = active
+        // (supported AND a module configured in deviceModels.json), yellow = supported
+        // (firmware supports it, not pre-configured), orange = planned (no module
+        // yet — the backlog seed). All chips are shown (labels kept short in
+        // deviceModels.json so they fit the card).
+        const caps = [
+          ...(Array.isArray(b.supported) ? b.supported.map(c =>
+            capActive(b, c) ? { c, cls: "act", label: "active" }
+                            : { c, cls: "sup", label: "supported" }) : []),
+          ...(Array.isArray(b.planned) ? b.planned.map(c => ({ c, cls: "plan", label: "planned" })) : []),
+        ];
+        if (caps.length) {
+          const capsEl = document.createElement("div"); capsEl.className = "bg-caps";
+          for (const { c, cls, label } of caps) {
+            const chip = document.createElement("span");
+            chip.className = "bg-cap " + cls;
+            chip.textContent = c;   // colour conveys active / supported / planned
+            chip.title = c + " — " + label;
+            capsEl.appendChild(chip);
+          }
+          body.appendChild(capsEl);
+        }
+        if (b.url) {
+          const a = document.createElement("a"); a.className = "bg-link"; a.href = b.url;
+          a.target = "_blank"; a.rel = "noopener"; a.textContent = "product page ↗"; body.appendChild(a);
+        }
+        // "details" opens the full deviceModels.json entry in a popup. It carries the
+        // bg-link class so the card's onclick treats it as a non-select region
+        // (same guard the product-page link relies on).
+        const det = document.createElement("a");
+        det.className = "bg-link bg-details"; det.textContent = "details ⓘ";
+        det.setAttribute("role", "button"); det.tabIndex = 0;
+        det.onclick = (ev) => { ev.stopPropagation(); showBoardDetails(b); };
+        det.onkeydown = (ev) => {
+          if (ev.key === "Enter" || ev.key === " ") { ev.preventDefault(); ev.stopPropagation(); showBoardDetails(b); }
+        };
+        body.appendChild(det);
+        el.appendChild(body);
+        return el;
+      }
+      // Fill + open the board-details popup from a deviceModels.json entry: a readable
+      // summary (chip, firmwares, capabilities, modules + their controls) plus a
+      // collapsible raw-JSON block for the exact entry. Built with DOM nodes (not
+      // innerHTML) so board-supplied strings can't inject markup.
+      function showBoardDetails(b) {
+        const dlg = document.getElementById("board-details");
+        document.getElementById("bd-title").textContent = b.name || "Device";
+        const body = document.getElementById("bd-body");
+        body.replaceChildren();
+        const row = (key, val) => {
+          const r = document.createElement("div"); r.className = "bd-row";
+          const k = document.createElement("span"); k.className = "bd-key"; k.textContent = key;
+          const v = document.createElement("span"); v.className = "bd-val"; v.textContent = val;
+          r.append(k, v); body.appendChild(r);
+        };
+        // Same shape as row(), but the value is a clickable link. href + textContent
+        // only (no innerHTML), so a board-supplied URL can't inject markup. Opens in
+        // a new tab; only http(s) links are made clickable (else fall back to text).
+        const rowLink = (key, url) => {
+          const r = document.createElement("div"); r.className = "bd-row";
+          const k = document.createElement("span"); k.className = "bd-key"; k.textContent = key;
+          const v = document.createElement("span"); v.className = "bd-val";
+          const a = document.createElement("a");
+          a.href = url; a.target = "_blank"; a.rel = "noopener"; a.textContent = url;
+          v.appendChild(a); r.append(k, v); body.appendChild(r);
+        };
+        if (b.chip) row("Chip", b.chip);
+        if (Array.isArray(b.firmwares)) row("Firmwares", b.firmwares.join(", "));
+        if (Array.isArray(b.supported) && b.supported.length) row("Supported", b.supported.join(", "));
+        if (Array.isArray(b.planned) && b.planned.length) row("Planned", b.planned.join(", "));
+        if (b.url) {
+          if (/^https?:\/\//.test(b.url)) rowLink("Product page", b.url);
+          else row("Product page", b.url);
+        }
+
+        if (Array.isArray(b.modules) && b.modules.length) {
+          const h = document.createElement("div"); h.className = "bd-section"; h.textContent = "Modules";
+          body.appendChild(h);
+          for (const m of b.modules) {
+            const mod = document.createElement("div"); mod.className = "bd-mod";
+            const nm = document.createElement("div"); nm.className = "bd-mod-name";
+            nm.textContent = m.type || "?";
+            if (m.id && m.id !== m.type) {
+              const idEl = document.createElement("span"); idEl.className = "bd-mod-id";
+              idEl.textContent = "  (" + m.id + ")"; nm.appendChild(idEl);
+            }
+            mod.appendChild(nm);
+            const ctrls = m.controls && typeof m.controls === "object" ? m.controls : null;
+            if (ctrls) {
+              for (const [k, v] of Object.entries(ctrls)) {
+                const c = document.createElement("div"); c.className = "bd-ctrl";
+                const code = document.createElement("code"); code.textContent = k + " = " + v;
+                c.appendChild(code); mod.appendChild(c);
+              }
+            }
+            body.appendChild(mod);
+          }
+        }
+
+        // Collapsible raw JSON — the exact entry, for developers.
+        const raw = document.createElement("details"); raw.className = "bd-raw";
+        const sum = document.createElement("summary"); sum.textContent = "Raw JSON";
+        const pre = document.createElement("pre"); pre.textContent = JSON.stringify(b, null, 2);
+        raw.append(sum, pre); body.appendChild(raw);
+
+        dlg.showModal();
+      }
+      searchEl.oninput = render;
+      summaryEl.addEventListener("click", () => setExpanded(expandEl.hidden));
+      clearEl.addEventListener("click", () => pickBoard(""));   // generic / no board
+
+      // Re-render when a Detect narrows the picker: applyDetectedChip swaps out
+      // #rp-board's <option>s, so observe its child list. The grid then filters
+      // to the detected family (allowedNames), and updateSummary picks up any
+      // auto-selected single match.
+      const rpBoard = document.getElementById("rp-board");
+      if (rpBoard) {
+        new MutationObserver(() => {
+          showAll = false;   // a fresh detect is a new context — re-apply the filter
+          // Take the picker's value verbatim — an empty string means it cleared the
+          // selection (detected family with multiple matches → generic mode), and
+          // `|| selected` would wrongly keep the stale board in the summary.
+          selected = installPicker.getSelectedBoard();
+          updateSummary();
+          render();
+        }).observe(rpBoard, { childList: true });
+      }
+
+      updateSummary();   // reflect any restored pick in the collapsed summary
+      render();
+    })();
diff --git a/docs/moonmodules/core/AudioModule.md b/docs/moonmodules/core/AudioModule.md
index 96fc114..0fc50b4 100644
--- a/docs/moonmodules/core/AudioModule.md
+++ b/docs/moonmodules/core/AudioModule.md
@@ -68,7 +68,7 @@ Audio-reactive lighting is a long-standing idea in the LED-controller world (WLE
 - **Analog line-in.** Long held to "only the original ESP32," but the field has moved: **[DedeHai](https://github.com/DedeHai) got analog input working on the S3**, and **Troy got it working in his ParrotRadio project**. Troy flags a *testing-confidence* nuance worth recording: he considers his own ParrotRadio analog path **better exercised** — he was actually recording and playing audio back through it and chasing down real issues — whereas an unlistened-to analog path elsewhere may not be as accurate as it looks, "if nobody's ever listened to it." So if projectMM adopts analog line-in, **validate by listening**, not just by watching the level meter move.
 - **I²C-configured codecs** (e.g. the **ES8311**): the right move is explicitly **not** to hand-roll each codec's register config (which is what Troy did in WLED). Espressif ships an **[`esp_codec_dev`](https://components.espressif.com/components/espressif/esp_codec_dev) "codecs" component** for IDF that already carries the option tables for many codecs; pulling it in would support "a bunch more codecs for free" and let users configure them for their own hardware. If something Troy hand-rolled turns out to be missing from the component, the codec class is extensible — but he doubts anything is. This is the [*Industry standards, our own code*](../../../CLAUDE.md#principles) call applied to codec bring-up: take Espressif's component rather than a bespoke per-codec config.
 
-Troy also has **DSP boards on his desk** — essentially I²S front-ends "waaaaay beyond the regular codecs" — a class of source recorded here so the line-in / codec work leaves room for it rather than only the simple cases. All of the above is **source-seam** work: it widens what feeds the pipeline, leaving the DC-blocker / RMS / FFT / band analysis untouched. Tracked under [backlog § sensor input](../../backlog/backlog.md#sensor-input-on-raspberry-pi-5--microphone-imu-line-in-post-10-multi-commit).
+Troy also has **DSP boards on his desk** — essentially I²S front-ends "waaaaay beyond the regular codecs" — a class of source recorded here so the line-in / codec work leaves room for it rather than only the simple cases. All of the above is **source-seam** work: it widens what feeds the pipeline, leaving the DC-blocker / RMS / FFT / band analysis untouched. Tracked under [backlog](../../backlog/README.md).
 
 ## Adaptive noise gate: forward-looking
 
@@ -95,7 +95,7 @@ Five design constraints come with it, and they are the load-bearing part: (1) sa
 
 ### Does our per-band floor already cover part of this?
 
-Partly, and that overlap is the key to sequencing. The backlogged [per-band noise-floor](../../backlog/backlog.md#sensors-and-audio-reactive-input) learns each band's idle baseline and subtracts it, so a *steady single-frequency* tone (our bench's ~258 Hz mains hum) gates to dark while the other bands stay live. The proposed time-domain gate answers a *different* question, "is there any sound at all," across the whole signal. They are complementary halves, not competitors: the per-band floor is the **frequency-domain** noise floor, the gate is the **time-domain** one. The per-band floor is also the smaller, already-planned step, so it is the natural first increment, and it is genuinely "part of this idea," not a thing the gate replaces.
+Partly, and that overlap is the key to sequencing. The backlogged [per-band noise-floor](../../backlog/README.md) learns each band's idle baseline and subtracts it, so a *steady single-frequency* tone (our bench's ~258 Hz mains hum) gates to dark while the other bands stay live. The proposed time-domain gate answers a *different* question, "is there any sound at all," across the whole signal. They are complementary halves, not competitors: the per-band floor is the **frequency-domain** noise floor, the gate is the **time-domain** one. The per-band floor is also the smaller, already-planned step, so it is the natural first increment, and it is genuinely "part of this idea," not a thing the gate replaces.
 
 ### How to decompose it: cherry-pick, step by step
 
@@ -108,7 +108,7 @@ The whole proposal is more than one increment. Taken apart, most of its value la
 
 Each step is its own commit, host-tested red-first, and leaves the system working; none requires touching `AudioBands.h` or the effect consumers. Steps 1–2 deliver most of the benefit (a self-calibrating floor in both domains) with almost no timing cost; 3–4 are polish to layer on only if the bench says they earn their place.
 
-**What it eventually retires:** the `floor` knob's role as a hard squelch. `floor` would become the *display* noise-floor only (the dB-window bottom in `magToByte`), while the learned gate decides "is there sound." That is a clean subtraction, but it is the *end* of the path, not the first step. Tracked under [backlog § audio follow-ups](../../backlog/backlog.md#sensors-and-audio-reactive-input).
+**What it eventually retires:** the `floor` knob's role as a hard squelch. `floor` would become the *display* noise-floor only (the dB-window bottom in `magToByte`), while the learned gate decides "is there sound." That is a clean subtraction, but it is the *end* of the path, not the first step. Tracked under [backlog](../../backlog/README.md).
 
 ## Tests
 
diff --git a/docs/moonmodules/core/Control.md b/docs/moonmodules/core/Control.md
index edc721b..eed36ef 100644
--- a/docs/moonmodules/core/Control.md
+++ b/docs/moonmodules/core/Control.md
@@ -28,7 +28,7 @@ Each `controls_.addX(name, var, …)` call (signatures in `Control.h`) binds one
 Notes on the non-obvious ones (the rest are self-describing):
 
 - **Password** serializes XOR-obfuscated + base64 over `/api/state`, not plaintext — a first line of defence, trivially reversible by design (the XOR key is shared with `app.js`), not encryption.
-- **Int16** is for coordinate-style values where negatives are legal — e.g. a Layer's `startX`/`endX` dragged outside the visible grid by a modifier. Default bounds are the full int16 range; pass explicit bounds for a tighter one. The UI renders it as a slider (an unbounded int16 falls back to a ±percentage slider for Layer positions).
+- **Int16** is for coordinate-style values where negatives are legal. Default bounds are the full int16 range; pass explicit bounds for a tighter one. The UI renders it as a slider (an unbounded int16 falls back to a ±percentage slider).
 - **Pin** is a GPIO number — `int8_t` (one byte; a GPIO never exceeds ~54), `−1` = unused/default. Distinct from Int16 so the UI renders a plain **number input** (a GPIO has no meaningful range to drag) and to keep the byte. `min`/`max` are the valid-GPIO span, used only as a server-side write-clamp. [NetworkModule](NetworkModule.md)'s eth pin controls are the first users; LED-driver pins follow.
 - **ReadOnlyInt** stores 1 byte + a unit suffix instead of a ~10-byte string — see [coding-standards § Prefer integers](../../coding-standards.md#prefer-integers-store-values-in-their-native-shape). [NetworkModule](NetworkModule.md)'s `rssi` (`-58 dBm`) and `txPower` (`19 dBm`) are the first users.
 - **IPv4** stores 4 bytes but converts to/from the dotted-quad string at the JSON boundary (`parseDottedQuad`/`formatDottedQuad` in `Control.h`, used by API, persistence, and scenario set-control). Used for [NetworkModule](NetworkModule.md)'s static-IP fields.
diff --git a/docs/moonmodules/core/FirmwareUpdateModule.md b/docs/moonmodules/core/FirmwareUpdateModule.md
index 7666168..491eba5 100644
--- a/docs/moonmodules/core/FirmwareUpdateModule.md
+++ b/docs/moonmodules/core/FirmwareUpdateModule.md
@@ -8,13 +8,14 @@ A thin status surface for OTA flashing. The flash itself is driven by `POST /api
 
 | Name | Type | Description |
 |---|---|---|
-| `version` | read-only string | Semver from library.json (`MM_VERSION`), plus the release channel in parentheses when the build was published under one: `1.0.0-rc2 (latest)`, `1.0.0 (v1.0.0)`. The channel (`MM_RELEASE`) is burned in by `release.yml` via `build_esp32.py --release <tag>`; a local / dev build has no channel and shows the bare semver. Semver answers *what code*; the channel answers *which release this device was flashed from* — a moving `latest` build and a tagged release can share a semver but differ in channel. Desktop builds show the bare semver today (the desktop packager doesn't set the channel). |
+| `version` | read-only string | Pure semver (`MM_VERSION`). A stable release is a clean `X.Y.Z` (e.g. `2.0.0`); a moving `latest` build is a monotonic prerelease `<core>-dev.<N>` (e.g. `2.1.0-dev.7`, where `N` is the commit count since the last `vX.Y.Z` tag — see `scripts/build/compute_version.py`), so successive `latest` builds are orderable (semver.org §9/§11); a local/dev build carries library.json's bare `<core>-dev`. The prerelease suffix marks a not-yet-released build; a clean `X.Y.Z` is a stable release. The release channel is derivable from the version (prerelease suffix → not stable), so it is not mixed into this string — the version stays a clean, machine-comparable semver, which the UI's "update available" check compares against the newest GitHub release (stable, and the moving `latest` for devices already on a `-dev` build). |
 | `build` | read-only string | Build date/time (`MM_BUILD_DATE`). |
 | `firmware` | read-only string | Build-time firmware variant key from `src/core/build_info.h` (`MM_FIRMWARE_NAME`): `esp32`, `esp32-eth`, `esp32-16mb`, `esp32s3-n16r8`, … for the shipped firmware variants (the full list is the `FIRMWARES` dict in `build_esp32.py`); `desktop-macos-arm64` / `desktop-windows-x64` for packaged desktop binaries; `desktop-dev` for unpackaged local desktop builds. A device carrying the legacy `esp32-eth-wifi` key OTA-maps to `esp32`. Identifies which release asset matches the device — the same key appears in the firmware filenames published by `release.yml`. The compiled binary; the physical hardware it runs on is SystemModule's `deviceModel` control. `install-picker.js`'s `isCompatible()` reads this string. |
 | `firmwarePartition` | progress (used/total) | Running app image size / total firmware (app) partition size — how full the partition is. Named distinctly from the `firmware` string control so a `controls.find(c => c.name === "firmware")` caller resolves the string, not this progress value. |
-| `update_status` | read-only string | One of: `idle`, `starting`, `downloading`, `flashing`, `rebooting`, `error: <reason>`. |
 | `update_pct` | progress (bytes/total) | Live byte counters rendered as "X KB / Y KB"; `total` is 0 until `esp_https_ota_get_image_size` reports it just after the TLS handshake. The name is historical (it predates the percent→bytes migration); the wire shape is bytes. |
 
+The OTA flash phase (`idle`, `starting`, `downloading`, `flashing`, `rebooting`, `error: <reason>`) is not a control — it surfaces through the module's shared status slot (`MoonModule::setStatus()`), the same per-module banner every module uses (NetworkModule's IP line, DevicesModule's sweep count). An `error:` prefix maps to `Severity::Error`; `idle` clears the banner; everything else is neutral `Severity::Status`.
+
 ## Wire contract
 
 ### `POST /api/firmware/url`
@@ -27,12 +28,12 @@ Request body:
 
 Response:
 
-- `202 Accepted` `{"ok":true}` — task spawned; UI polls `update_status` for progress.
+- `202 Accepted` `{"ok":true}` — task spawned; UI watches the module status slot + `update_pct` for progress.
 - `400` — missing URL, or URL doesn't start with `http://` / `https://`.
 - `500` — task failed to spawn (rare; out of memory).
 - `501` — platform doesn't support OTA (desktop returns this; `if constexpr (mm::platform::hasOta)`).
 
-The route returns immediately. Real progress streams via `update_status` + `update_pct` over the same WebSocket the UI uses for everything else.
+The route returns immediately. Real progress streams via the module status slot + `update_pct` over the same WebSocket the UI uses for everything else.
 
 ### Compatibility
 
@@ -58,7 +59,7 @@ The status buffer surfaces any failure with the prefix `error: ` followed by the
 - `error: ota finish <ESP-IDF error name>` — commit / boot-pointer-flip failure.
 - `error: task create failed` — `xTaskCreate` returned non-`pdPASS` (out of memory). No retry; reboot.
 
-After an error, `update_status` stays on the error message until the next `/api/firmware/url` POST clears it back to `"starting"`. `update_pct` is left at the last value.
+After an error, the status slot stays on the error message until the next `/api/firmware/url` POST clears it back to `"starting"`. `update_pct` is left at the last value.
 
 ## Prior art
 
diff --git a/docs/moonmodules/light/BlendMap.md b/docs/moonmodules/light/BlendMap.md
index 2f592a0..11779a4 100644
--- a/docs/moonmodules/light/BlendMap.md
+++ b/docs/moonmodules/light/BlendMap.md
@@ -1,10 +1,14 @@
 # BlendMap
 
-`blendMap` is a free function that reads a Layer's buffer and writes mapped output into a destination buffer, called by the Drivers container each frame. The destination is cleared first, so physical cells with no source (a sparse layout's lattice gaps) stay black.
+`blendMap` is a free function that reads a Layer's buffer and writes mapped output into a destination buffer, called by the [Drivers](Drivers.md) container for each enabled layer each frame. It takes a blend op (`Overwrite` / `Alpha` / `Additive`), an `opacity` (0–255), and a `clearFirst` flag — the bottom (first-composited) layer passes `clearFirst=true` so physical cells with no source (a sparse layout's lattice gaps) stay black; layers above pass `false` to accumulate onto the frame below.
 
-The LUT picks one of two paths: when each physical light is written at most once (every current layout/modifier — mirror, shuffle, sparse box→driver), it overwrite-copies source→destination (no read-back, no clamp, ~4× faster); when sources can overlap a destination (multi-layer composition), it additively blends with clamping. Physical indices are bounds-checked so an out-of-range LUT entry can't overrun the buffer.
+The combine math is integer-only (the hot-path per-light rule), with one tight specialised loop per op chosen once per layer:
 
-Configurable per-layer blend modes (beyond additive) land with multi-layer composition — a [backlog](../../backlog/backlog.md) item.
+- **Overwrite** (the default / bottom layer): plain copy, no read-back. For a dense grid (no LUT) it's a `memcpy`; for a single-write LUT (mirror, shuffle, sparse box→driver) it copies source→destination per mapped light. A non-overwriting LUT (one that folds several logical lights onto one physical cell) routes through the additive accumulate path so the overlaps sum-with-clamp rather than last-writer-win.
+- **Additive**: `dst = clamp(dst + src·opacity)` — sum with saturation at 255, opacity scaling the source.
+- **Alpha** (over): `dst = (src·α + dst·(255−α)) / 255` — the textbook 8-bit alpha-over, division by 255 via the fast `(x + (x>>8) + 1) >> 8` reciprocal. Full opacity (255) collapses to a plain overwrite (no blend cost).
+
+A dense-grid layer has no LUT, so its buffer blends 1:1 (source index = physical index, no lookup); a layer with a LUT maps each logical light to its physical destination(s) first. Physical indices come from the LUT, which is built in-range from the shared Layouts, so they address the buffer in bounds by construction. The per-Layer `blendMode`/`opacity` controls that select the op live on [Layer](Layer.md#blendmode--opacity-controls); Drivers reads them and the layer stack order.
 
 ## Source
 
diff --git a/docs/moonmodules/light/Drivers.md b/docs/moonmodules/light/Drivers.md
index b35355e..eb6447e 100644
--- a/docs/moonmodules/light/Drivers.md
+++ b/docs/moonmodules/light/Drivers.md
@@ -10,10 +10,14 @@ Top-level container for one or more drivers. The consumer side of the pipeline 
 
 The shared output buffer is necessary because blend+map writes to arbitrary physical positions (via LUT) — the output is not filled sequentially. A driver cannot read chunk-by-chunk until the full buffer is populated.
 
-Exception: when memory is tight AND mapping is 1:1 unshuffled (single layer, grid layout, no serpentine), Drivers can skip its own buffer and let drivers read directly from the layer's buffer at the cost of parallelism. See [architecture.md § Parallelism](../../architecture.md#parallelism).
+Exception: when exactly one layer is enabled AND its mapping is 1:1 unshuffled (no LUT — grid layout, no serpentine), Drivers skips its own buffer and lets drivers read directly from the layer's buffer (the zero-copy fast path, at the cost of parallelism). See [architecture.md § Parallelism](../../architecture.md#parallelism).
 
 It uses the same `Buffer` type a Layer does, sized by the Layouts container.
 
+## Multi-layer composition
+
+When two or more layers are enabled, Drivers composites them into the shared output buffer each frame, in [Layers](Layers.md) container order (bottom→top, via `forEachEnabledLayer`). The bottom layer clears and overwrites the buffer; each layer above blends onto the accumulated frame per its own `blendMode` and `opacity` (the inert per-Layer controls — see [Layer](Layer.md#blendmode--opacity-controls)). Drivers owns the orchestration because only it sees the stack order and the output buffer; the layers carry only the parameters. The per-pixel blend math lives in [BlendMap](BlendMap.md) (integer-only, per the hot-path rule). The per-frame cost scales with the enabled-layer count; a full-opacity overwrite/additive layer pays no alpha arithmetic. With a single enabled layer there is no composite: the fast path above applies (no-LUT → zero-copy; with a LUT → one blend+map pass into the output buffer).
+
 ## Output correction
 
 The Drivers container owns the shared output-correction state and exposes two controls; each *physical* driver child (ArtNet today, future LED drivers) applies it per-light as it reads the source buffer. Preview ignores it (shows the raw logical buffer).
@@ -23,7 +27,7 @@ The Drivers container owns the shared output-correction state and exposes two co
 | `brightness` | uint8 (0–255) | Global brightness. Scales every channel through a 256-entry LUT (`(v × brightness) / 255`). Changing it rebuilds only the LUT on the cheap `onUpdate` tier — no pipeline realloc, so the slider is fluent. Gamma / white-balance fold into this LUT later as a per-channel R/G/B split. |
 | `lightPreset` | select | The physical wire format: channel order and whether the light is RGBW. Options: `RGB`, `RBG`, `GRB`, `GBR`, `BRG`, `BGR`, `RGBW`, `GRBW`. Defaults to `GRB` — the WS2812/SK6812 wire order, so a strip shows correct colours out of the box (PreviewDriver reads the RGB source buffer directly and is unaffected). RGBW presets make each driver emit 4 channels per light with white derived as `min(R,G,B)` from the (brightness-scaled) RGB. |
 
-The state lives on `Correction` (`src/light/drivers/Correction.h`): a brightness LUT, channel-order table, output channel count, derive-white flag. `Drivers::onUpdate` rebuilds it on a `brightness`/`lightPreset` change and hands each child a `const Correction*`. Every driver currently sees the same blended output of the active layer; per-driver layer assignment is a [backlog](../../backlog/backlog.md) item that lands with multi-layer composition.
+The state lives on `Correction` (`src/light/drivers/Correction.h`): a brightness LUT, channel-order table, output channel count, derive-white flag. `Drivers::onUpdate` rebuilds it on a `brightness`/`lightPreset` change and hands each child a `const Correction*`. Every driver sees the same composited output; per-driver layer assignment (different drivers reading different layers) is a [backlog](../../backlog/README.md) item.
 
 ## Prior art
 
diff --git a/docs/moonmodules/light/Layer.md b/docs/moonmodules/light/Layer.md
index 2d5c75a..243f316 100644
--- a/docs/moonmodules/light/Layer.md
+++ b/docs/moonmodules/light/Layer.md
@@ -11,13 +11,9 @@ A `Layer` MoonModule (role `ModuleRole::Layer`, child of the [Layers](Layers.md)
 - **Effects** (ordered list) — write lights into buffer. No hard-coded max — dynamic list (heap-allocated, grown as needed).
 - **Modifiers** (ordered list) — transform LUT or light values. Same dynamic list approach.
 
-## start/end controls
+## blendMode / opacity controls
 
-Each Layer carries six `int16_t` controls — `startX`, `startY`, `startZ`, `endX`, `endY`, `endZ` — that select a region of the shared Layouts **expressed as percentages of the physical extent on each axis**. Defaults are `start = 0, end = 100` (the full layout). Percentages are resilient to physical layout changes: a `startX = 25` Layer stays at the same relative position when the panel resizes from 64×64 to 128×128, rather than ending up at the wrong absolute pixel.
-
-Negative values and values > 100 are legal: a future modifier could drag a Layer in or out of the visible area by shifting start/end past 0% or 100% (e.g. `startX = -50` means the Layer extends 50% off the left edge of the layout). `ControlType::Int16` is the wire type so negative values round-trip correctly through `/api/state`, `/api/types`, and persistence.
-
-Today (single-Layer pipeline) `rebuildLUT()` ignores the controls — the values are persisted state, not yet wired. They surface in the UI now so the surface stays stable when the composition follow-up activates them. **Rounding rule (when activated):** `start` percentages round toward the lower pixel (floor), `end` percentages round toward the higher pixel (ceiling). This guarantees a non-zero region on small panels (e.g. `start = 33, end = 66` on a 4-wide axis produces pixels 1..3 inclusive, not 1..2 or 2..2). Spec: [architecture.md § Layers and Layer](../../architecture.md#layers-and-layer).
+Two controls govern how this Layer composites onto the layers below it: `blendMode` (a select — `alpha` over, or `additive` sum-with-clamp) and `opacity` (`uint8`, 0 = invisible, 255 = full). They are **inert on the Layer** — the Layer never reads them; it just carries them so they travel through add / delete / reorder with no separate synchronised list. The [Drivers](Drivers.md) container reads each enabled Layer's two values plus the [Layers](Layers.md) container's child order and does the actual compositing (bottom layer overwrites, each layer above blends per its mode + opacity). The bottom (first-composited) Layer's `blendMode`/`opacity` are moot — nothing sits under it. The blend math itself lives in [BlendMap](BlendMap.md). Precedent for "value here, logic in Drivers": the per-X `Correction` data Drivers applies.
 
 ## Key operations
 
@@ -55,7 +51,7 @@ See [EffectBase § Dimensions and auto-extrusion](EffectBase.md#dimensions-and-a
 
 ## Status
 
-The Layer's status line (the `MoonModule` status slot) shows the **logical** box the effects render into — `"<w>×<h>×<d>"`, the dimensions a modifier and the start/end region carving reshape. This differs from the physical bounding box shown on the [Layouts](Layouts.md#status) container: a Mirror-XY modifier on a 128×128 physical layout renders into a 64×64 logical box (the half that gets folded), so the Layer reads `64×64×1` while Layouts reads `128×128×1`. The gap between the two is the modifier's effect, made visible.
+The Layer's status line (the `MoonModule` status slot) shows the **logical** box the effects render into — `"<w>×<h>×<d>"`, the dimensions its modifiers reshape. This differs from the physical bounding box shown on the [Layouts](Layouts.md#status) container: a Mirror-XY modifier on a 128×128 physical layout renders into a 64×64 logical box (the half that gets folded), so the Layer reads `64×64×1` while Layouts reads `128×128×1`. The gap between the two is the modifier's effect, made visible.
 
 The same slot carries memory-degradation warnings (`Severity::Warning`/`Error`) when a build can't fit: `"modifier LUT skipped — not enough memory"`, `"sparse LUT build failed — not enough memory"`, `"buffer reduced — not enough memory"`, `"buffer allocation failed — not enough memory"`. A warning wins over the neutral box line — when the Layer is degraded, that's what the user needs to see. Recomputed on every rebuild (`onBuildState`), not per tick.
 
diff --git a/docs/moonmodules/light/Layers.md b/docs/moonmodules/light/Layers.md
index 0295462..c0eefe6 100644
--- a/docs/moonmodules/light/Layers.md
+++ b/docs/moonmodules/light/Layers.md
@@ -8,9 +8,9 @@ Top-level container for one or more layers. Each layer renders independently int
 
 ## Why a container
 
-Multi-layer composition (alpha-blend, additive, layered overlays) needs a place to walk every layer in order and merge their buffers before drivers consume the result. Layers is that place. Today the boot pipeline creates **one layer inside Layers**, so the container is a thin pass-through: `loop()` runs the single child and returns; behaviour is byte-identical to the previous single-layer pipeline.
+Multi-layer composition (alpha-blend, additive, layered overlays) needs a place to walk every layer in order so drivers can merge their buffers before consuming the result. Layers is that place. With one layer inside it the container is a thin pass-through: `loop()` runs the single child and returns; behaviour is byte-identical to the single-layer pipeline.
 
-The container owns no buffer: each layer owns its own, and the Drivers container owns the composed output. It wires the shared Layouts into every child so each can size its buffer. While a single layer is active, `activeLayer()` (the first enabled child) is what Drivers reads; multi-layer blending — where Layers iterates and Drivers composites across all of them — is a [backlog](../../backlog/backlog.md) item.
+The container owns no buffer: each layer owns its own, and the Drivers container owns the composited output. It wires the shared Layouts into every child so each can size its buffer. Two queries serve the Drivers compositor: `activeLayer()` (the first enabled child) answers physical dimensions and is the source for the single-layer fast path, and `forEachEnabledLayer(cb)` walks the enabled children in container order (bottom→top) — the order Drivers blends them, with `cb(layer, isFirst)` marking the bottom layer that clears the buffer. `enabledLayerCount()` lets Drivers pick the fast path (one enabled layer → hand its buffer straight to the driver) versus the composite path (≥2 → blend into the output buffer). The blend modes and the value-on-Layer / logic-in-Drivers split are documented on [Layer](Layer.md#blendmode--opacity-controls) and [Drivers](Drivers.md).
 
 ## Prior art
 
diff --git a/docs/moonmodules/light/drivers/LcdLedDriver.md b/docs/moonmodules/light/drivers/LcdLedDriver.md
index 9b0f4b6..38e29db 100644
--- a/docs/moonmodules/light/drivers/LcdLedDriver.md
+++ b/docs/moonmodules/light/drivers/LcdLedDriver.md
@@ -36,7 +36,7 @@ Full case list in the generated [unit tests § LcdLedDriver](../../../tests/unit
 
 - **Encoder (CI, host):** byte-exact 3-slot triplets — transpose across lanes, MSB-first, the unequal-lane idle-LOW rule, GRB via Correction, RGBW rows.
 - **Driver (CI, host):** lane slicing (including unequal leds-per-lane), frame-byte math (RGBW growth, alignment rounding), bad-pin status + recovery, the exactly-8-pins rule, the empty-default idle (no GPIO claimed until pins are set), zero-grid robustness, teardown.
-- **`loopbackTxPin` control (CI, host):** the conditional control — bound always, shown only while `loopbackTest` is on. The lane-0 override mechanism is shared with the Parlio driver (same `ParallelLedDriver` base) and hardware-verified there; the LCD hardware path itself is exercised by the loopback self-test above. The catalog-add path is verified on the sibling RMT/Parlio drivers (S3 boards currently default to RMT — LcdLed needs all 8 lanes, see the [backlog 1..8-pin LCD note](../../../backlog/backlog.md)).
+- **`loopbackTxPin` control (CI, host):** the conditional control — bound always, shown only while `loopbackTest` is on. The lane-0 override mechanism is shared with the Parlio driver (same `ParallelLedDriver` base) and hardware-verified there; the LCD hardware path itself is exercised by the loopback self-test above. The catalog-add path is verified on the sibling RMT/Parlio drivers (S3 boards currently default to RMT — LcdLed needs all 8 lanes).
 - **Hardware:** the loopback self-test above (jumper), and tick-scaling across grid sizes proves frames really clock out.
 
 ## Prior art
diff --git a/docs/moonmodules/light/drivers/NetworkSendDriver.md b/docs/moonmodules/light/drivers/NetworkSendDriver.md
index 39a3da6..fe0f9a0 100644
--- a/docs/moonmodules/light/drivers/NetworkSendDriver.md
+++ b/docs/moonmodules/light/drivers/NetworkSendDriver.md
@@ -27,11 +27,11 @@ E1.31 framing facts an integrator needs: CID is stable per device (derived from
 ## Interop notes
 
 - **Universe rule (both ends):** buffer offset = (universe − `universe_start`) × 510, and the sender emits from `universe_start` verbatim — no hidden 1-based adjustment for E1.31. Strict sACN gear reserves universe 0, so set `universe_start ≥ 1` on **both** ends when talking to it; the matching default of 0 on our own receiver keeps device↔device pairs aligned out of the box.
-- **Unicast or broadcast; not multicast.** The destination can be a single device (unicast) or the limited-broadcast address `255.255.255.255` (the default), which sprays the frame to every device on the LAN — the platform socket sets `SO_BROADCAST` so this works for all three protocols. The standard Art-Net convention is broadcast; a device↔device pair works out of the box with no IP typed. E1.31 multicast (group 239.255.x.x) is not implemented — the platform has no IGMP join; MoonLight ships without it too. See the backlog entry for the planned work.
+- **Unicast or broadcast; not multicast.** The destination can be a single device (unicast) or the limited-broadcast address `255.255.255.255` (the default), which sprays the frame to every device on the LAN — the platform socket sets `SO_BROADCAST` so this works for all three protocols. The standard Art-Net convention is broadcast; a device↔device pair works out of the box with no IP typed. E1.31 multicast (group 239.255.x.x) is not implemented — the platform has no IGMP join; MoonLight ships without it too.
 
 ## Synchronous send (blocks the render tick)
 
-The whole frame goes out inline in `loop()` — ~35 ms over Ethernet / ~90 ms over WiFi at 128×128 with ArtNet (DDP proportionally less). The dedicated send task that decouples the wire from the render tick is a backlog item gated on PSRAM ([backlog](../../../backlog/backlog.md)). FPS limiting plus the all-universes-in-one-burst shape is what receivers expect.
+The whole frame goes out inline in `loop()` — ~35 ms over Ethernet / ~90 ms over WiFi at 128×128 with ArtNet (DDP proportionally less). The dedicated send task that decouples the wire from the render tick is a backlog item gated on PSRAM ([backlog](../../../backlog/README.md)). FPS limiting plus the all-universes-in-one-burst shape is what receivers expect.
 
 ## Cross-domain wiring
 
diff --git a/docs/moonmodules/light/modifiers/RegionModifier.md b/docs/moonmodules/light/modifiers/RegionModifier.md
new file mode 100644
index 0000000..97d2abd
--- /dev/null
+++ b/docs/moonmodules/light/modifiers/RegionModifier.md
@@ -0,0 +1,44 @@
+# Region Modifier
+
+Static modifier. Carves the layer down to a sub-rectangle of the physical bounding box: the effect renders only inside the region, everything outside is dark. The region is given as **percentages of the physical extent on each axis**, so it survives a physical resize — a `0..50` region stays the left half whether the panel is 64 or 128 wide. Default `0..100` on every axis is the full box (an identity carve).
+
+A Layer applies only its **first enabled modifier**, so today a Layer uses *either* Region *or* one other modifier (Multiply, …) — never both at once. Region and Multiply are independent, so stacking them (occupy a region *and* tile/mirror within it — Region then Multiply) is planned via [modifier chaining](../../../backlog/README.md).
+
+## Controls
+
+- `startX` / `startY` / `startZ` (Int16, default 0) — region start, as a percentage of physical width / height / depth.
+- `endX` / `endY` / `endZ` (Int16, default 100) — region end, as a percentage of physical width / height / depth.
+
+`Int16` (not a 0–100 slider) so negative and >100 values round-trip through `/api/state`, `/api/types`, and persistence; the carve math clamps them into the box.
+
+## Region math
+
+Per axis, **half-open** `[startPixel, endPixel)`:
+
+- `startPixel = floor(start% / 100 · extent)`, clamped to `[0, extent-1]`.
+- `endPixel = ceil(end% / 100 · extent)`, **exclusive**, clamped to `[startPixel+1, extent]`.
+- region size = `endPixel − startPixel` (always ≥ 1).
+
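+Half-open is what makes abutting regions **tile exactly** whenever the shared boundary lands on a whole pixel: a `0..50` and a `50..100` layer split a 128-wide axis into pixels `0..63` and `64..127` — no overlap, no gap. (When the boundary is fractional, the lower region's `ceil` and the upper region's `floor` both claim the straddled pixel, so the two regions share that one pixel.) `start` floors and `end` ceils so a small panel never rounds to an empty region (`start 33 / end 66` on a 4-wide axis → `floor(1.32)=1` .. `ceil(2.64)=3` → pixels 1, 2). Default `end 100` on a `W`-wide axis → `ceil(W)=W` → the full width.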
+
+## Effect on the pipeline
+
+- **Logical dimensions = the region size** — `logicalDimensions()` reports the carved rectangle, so the Layer's render buffer (and the Layer status line `w×h×d`) shrinks to the region. The effect only ever renders the region; the rest of the layer has no logical source and stays dark. This is the same "the box is smaller than the physical box" mechanism a Mirror modifier uses.
+- **1:1 mapping with a start offset** — `mapToPhysical()` translates a region-local cell `(lx,ly,lz)` to the box cell `(lx+startPixelX, ly+startPixelY, lz+startPixelZ)`, a single destination. Because the logical box is already the region size, every region cell is in-bounds; no per-cell drop is needed. `maxMultiplier()` is 1 — it never fans out.
+- **Fast path**: the cheapest carve is *no modifier at all* — then `Layer::rebuildLUT` keeps its identity-memcpy / sparse fast path with zero carving cost. The default is to not add a RegionModifier; a full-region `0..100` one is correct but not the absolute cheapest, so full-coverage layers simply omit it.
+
+## Cross-domain wiring
+
+A Layer applies its first enabled modifier during `rebuildLUT`. Region is a normal `ModifierBase` (no contract change) — it expresses carving entirely through the existing `logicalDimensions()` + `mapToPhysical()` virtuals, the same two the LUT builder already calls. See [architecture.md § Layers and Layer](../../../architecture.md#layers-and-layer).
+
+## Tests
+
+[Unit tests: RegionModifier](../../../tests/unit-tests.md#regionmodifier) — the region math (full box, exact half, abutting-tile, small-panel rounding, ≥1-pixel floor, out-of-range clamp, degenerate axes) and the coordinate offset mapping. [Unit tests: Layer](../../../tests/unit-tests.md#layer) adds the integration case: a RegionModifier shrinks the Layer's logical box to the region and the LUT maps only region cells.
+
+## Prior art
+
+The crop / region node of any compositor (After Effects' crop, a shader scissor rect): restrict rendering to a rectangle, the rest is transparent. MoonLight has no single "region" modifier — its layers map through the same coordinate-transform mechanism, which is the lineage for expressing this as a modifier rather than a Layer control.
+
+## Source
+
+[RegionModifier.h](../../../../src/light/modifiers/RegionModifier.h)
diff --git a/docs/performance.md b/docs/performance.md
index a3a022c..7eab440 100644
--- a/docs/performance.md
+++ b/docs/performance.md
@@ -250,6 +250,10 @@ Absolute tick at each step (the diff vs the prior row is that subsystem's cost):
 
 **Expected, and confirmed everywhere:** audio is a small fixed per-tick cost; idle discovery is free; output drivers are cheap at a capped 64-LED output (none dominates the render path). The modifier's +~190µs at 16² is the one notable per-frame add — explained below (it's the blend+map, and it *pays for itself* at large grids).
 
+**Multi-layer composition** (the `Drivers` composite loop): a single enabled Layer is the pass-through fast path (the driver reads the Layer's buffer directly — zero composite cost, the figures above). Each *additional* enabled Layer adds one `blendMap` pass over the physical buffer (integer alpha-over or additive, branch-resolved once per layer), so N enabled layers cost ≈ N × the per-layer write — linear in layer count, same shape as the per-effect sweep. The RegionModifier adds nothing unless present (no modifier = the identity fast path).
+
+**Branch re-verification (2026-06-25, multi-layer + RegionModifier):** the live perf scenarios (`scenario_perf_light` / `_full` / `_modifier_swap`) were re-run on all three boards on this branch's firmware. The per-effect and per-modifier numbers match the tables here within run-to-run variance — the new composite/RegionModifier code does not regress the single-layer pipeline (it's opt-in: a one-layer tree runs the same path as before).
+
 ### Effect compute — light vs heavy bracket, across grid sizes (render-only)
 
 Tick µs; FPS in parens for the 16K row:
@@ -267,7 +271,7 @@ Tick µs; FPS in parens for the 16K row:
 | 64² (4K) | 13,547 | 11,235 | 4,358 |
 | 128² (16K) | 62,316 (16 FPS) | 50,555 (20 FPS) | 17,433 (57 FPS) |
 
-All curves scale **~linear in pixel count** (no superlinear blowup → no realloc/fragmentation pathology). The heavy effect is the 16K bottleneck on every board, and the board ranking is P4 ≫ S3 > classic on heavy compute (the P4's 400MHz dual-core is ~3× the S3). **Surprise worth noting:** at light-16K the *classic* (4,360µs) beats the S3 (7,949µs) — the S3's PSRAM-resident buffer has higher access latency than the classic's internal RAM for the cheap Checkerboard inner loop, and classic's uint16 LUT is half the size; on the heavy effect the compute dominates and the S3 pulls ahead again. See the [NoiseEffect cost backlog item](backlog/backlog.md) for the fixed-point / strided-sampling ideas.
+All curves scale **~linear in pixel count** (no superlinear blowup → no realloc/fragmentation pathology). The heavy effect is the 16K bottleneck on every board, and the board ranking is P4 ≫ S3 > classic on heavy compute (the P4's 400MHz dual-core is ~3× the S3). **Surprise worth noting:** at light-16K the *classic* (4,360µs) beats the S3 (7,949µs) — the S3's PSRAM-resident buffer has higher access latency than the classic's internal RAM for the cheap Checkerboard inner loop, and classic's uint16 LUT is half the size; on the heavy effect the compute dominates and the S3 pulls ahead again. Fixed-point / strided-sampling ideas are on the [backlog](backlog/README.md).
 
 ### MultiplyModifier — compute down, memory up (Noise effect)
 
diff --git a/docs/tests/scenario-tests.md b/docs/tests/scenario-tests.md
index edf05b8..ee139e8 100644
--- a/docs/tests/scenario-tests.md
+++ b/docs/tests/scenario-tests.md
@@ -23,9 +23,9 @@ Baseline: the render pipeline runs with no audio module present.
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | — / 100,000-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 32,258-125,000 | — / unlimited | — / unlimited |
 
-- `pc-macos`: observed 2026-06-12 → 2026-06-14
+- `pc-macos`: observed 2026-06-12 → 2026-06-25
 
 #### `measure-audio-added` (measure)  📏
 
@@ -41,9 +41,9 @@ Pipeline still renders with the (idle, unconfigured) mic added.
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | — / 100,000-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 34,483-125,000 | — / unlimited | — / unlimited |
 
-- `pc-macos`: observed 2026-06-12 → 2026-06-16
+- `pc-macos`: observed 2026-06-12 → 2026-06-25
 
 #### `measure-pins-configured` (measure)  📏
 
@@ -61,9 +61,9 @@ All three mic pins set via the sequential install-fan-out order: pipeline still
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | — / 90,909-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 32,258-125,000 | — / unlimited | — / unlimited |
 
-- `pc-macos`: observed 2026-06-13 → 2026-06-14
+- `pc-macos`: observed 2026-06-13 → 2026-06-25
 
 #### `measure-consumer-live` (measure)  📏
 
@@ -79,9 +79,9 @@ Pipeline renders with the producer + consumer both wired.
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | — / 83,333-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 30,303-125,000 | — / unlimited | — / unlimited |
 
-- `pc-macos`: observed 2026-06-12 → 2026-06-16
+- `pc-macos`: observed 2026-06-12 → 2026-06-25
 
 #### `measure-after-mic-removed` (measure)  📏
 
@@ -97,9 +97,9 @@ Mic gone, consumer remains: pipeline keeps rendering on silent audio (buffer non
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | — / 83,333-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 31,250-125,000 | — / unlimited | — / unlimited |
 
-- `pc-macos`: observed 2026-06-12 → 2026-06-16
+- `pc-macos`: observed 2026-06-12 → 2026-06-25
 
 #### `measure-back-to-baseline` (measure)  📏
 
@@ -115,9 +115,9 @@ Both audio modules gone: back to the pipeline-only baseline, still rendering.
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | — / 90,909-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 40,000-125,000 | — / unlimited | — / unlimited |
 
-- `pc-macos`: observed 2026-06-12 → 2026-06-17
+- `pc-macos`: observed 2026-06-12 → 2026-06-25
 
 ## DevicesModule
 
@@ -171,14 +171,16 @@ Set grid height to 128 (alongside default width 128). Measures the heaviest conf
 | `esp32` | — / 4.5 | — / 83KB | — / 48KB |
 | `esp32-eth` | — / 10.7-10.8 | — / 132KB | — / 48KB-52KB |
 | `esp32-eth-wifi` | ≥ 10.0 / 12.4 | ≥ 103KB / 93KB | — / 48KB |
-| `esp32p4-eth` | — / 739-880 | — / 33218KB | — / 376KB |
+| `esp32p4-eth` | — / 739-880 | — / 33206KB-33218KB | — / 376KB |
+| `esp32s3-n16r8` | — / 106-217 | — / 8315KB-8321KB | — / 104KB-108KB |
 | `pc-macos` | ≥ 8,333 / 3,534-10,526 | unlimited / unlimited | — / unlimited |
 | `pc-windows` | — / 3,413-4,566 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-02
 - `esp32-eth`: observed 2026-06-02
 - `esp32-eth-wifi`: contract set 2026-06-02 "initial contract" · observed 2026-06-02
-- `esp32p4-eth`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-22
 - `pc-macos`: contract set 2026-06-02 "initial contract" · observed 2026-06-02 → 2026-06-03
 - `pc-windows`: observed 2026-06-07
 
@@ -193,14 +195,16 @@ Shrink to 128x64. Measured: tick/heap captured so the runner reports the realloc
 | `esp32` | — / 11.1 | — / 63KB | — / 17KB |
 | `esp32-eth` | — / 26.4-26.5 | — / 114KB | — / 48KB |
 | `esp32-eth-wifi` | ≥ 22.2 / 31.8 | ≥ 83KB / 75KB | — / 24KB |
-| `esp32p4-eth` | — / 1,527-1,739 | — / 33226KB | — / 376KB |
+| `esp32p4-eth` | — / 1,527-1,739 | — / 33214KB-33226KB | — / 376KB |
+| `esp32s3-n16r8` | — / 415-787 | — / 8324KB-8331KB | — / 100KB-112KB |
 | `pc-macos` | ≥ 16,667 / 4,695-21,739 | unlimited / unlimited | — / unlimited |
 | `pc-windows` | — / 7,299-10,638 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-02
 - `esp32-eth`: observed 2026-06-02
 - `esp32-eth-wifi`: contract set 2026-06-02 "initial contract" · observed 2026-06-02
-- `esp32p4-eth`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-22
 - `pc-macos`: contract set 2026-06-02 "initial contract" · observed 2026-06-02 → 2026-06-08
 - `pc-windows`: observed 2026-06-07
 
@@ -215,14 +219,16 @@ Grow back to 128x128. Measured: confirms the heap can return to the heavy baseli
 | `esp32` | — / 4.0 | — / 83KB | — / 52KB |
 | `esp32-eth` | — / 10.4 | — / 132KB | — / 48KB |
 | `esp32-eth-wifi` | ≥ 10.0 / 12.2 | ≥ 103KB / 93KB | — / 52KB |
-| `esp32p4-eth` | — / 762-875 | — / 33218KB | — / 376KB |
+| `esp32p4-eth` | — / 762-875 | — / 33206KB-33218KB | — / 376KB |
+| `esp32s3-n16r8` | — / 132-251 | — / 8312KB-8322KB | — / 100KB-112KB |
 | `pc-macos` | ≥ 8,333 / 3,257-10,204 | unlimited / unlimited | — / unlimited |
 | `pc-windows` | — / 3,436-4,608 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-02
 - `esp32-eth`: observed 2026-06-02
 - `esp32-eth-wifi`: contract set 2026-06-02 "initial contract" · observed 2026-06-02
-- `esp32p4-eth`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-22
 - `pc-macos`: contract set 2026-06-02 "initial contract" · observed 2026-06-02 → 2026-06-03
 - `pc-windows`: observed 2026-06-07
 
@@ -314,10 +320,10 @@ Multiply modifier active — pipeline live, LUT folds the grid.
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32-eth` | — / 1,580-7,752 | — / 172KB-225KB | — / 76KB-108KB |
-| `pc-macos` | — / 76,923-166,667 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 50,000-166,667 | — / unlimited | — / unlimited |
 
 - `esp32-eth`: observed 2026-06-07 → 2026-06-08
-- `pc-macos`: observed 2026-06-07 → 2026-06-11
+- `pc-macos`: observed 2026-06-07 → 2026-06-21
 
 #### `checkerboard` (measure)  📏
 
@@ -331,10 +337,10 @@ Checkerboard modifier active — masks half the lights; pipeline stays live (dri
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32-eth` | — / 769-990 | — / 170KB-225KB | — / 76KB-108KB |
-| `pc-macos` | — / 17,544-58,824 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 15,873-58,824 | — / unlimited | — / unlimited |
 
 - `esp32-eth`: observed 2026-06-07 → 2026-06-08
-- `pc-macos`: observed 2026-06-07 → 2026-06-11
+- `pc-macos`: observed 2026-06-07 → 2026-06-25
 
 #### `multiply-2` (measure)  📏
 
@@ -348,10 +354,10 @@ Back to Multiply — replace round-trips cleanly, pipeline live again.
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32-eth` | — / 1,587-2,278 | — / 169KB-225KB | — / 76KB-108KB |
-| `pc-macos` | — / 66,667-166,667 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 45,455-166,667 | — / unlimited | — / unlimited |
 
 - `esp32-eth`: observed 2026-06-07 → 2026-06-08
-- `pc-macos`: observed 2026-06-07 → 2026-06-11
+- `pc-macos`: observed 2026-06-07 → 2026-06-25
 
 ### scenario_perf_full
 
@@ -376,14 +382,14 @@ Bare minimum at 16²: Grid + Layer + Checkerboard, no output driver, audio/disco
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 7,752 | — / 134KB | — / 108KB |
-| `esp32p4-eth` | — / 14,925-15,873 | — / 33243KB-33244KB | — / 376KB |
-| `esp32s3-n16r8` | — / 7,519-8,197 | — / 8340KB | — / 104KB |
-| `pc-macos` | — / — | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 14,925-17,241 | — / 33226KB-33244KB | — / 376KB |
+| `esp32s3-n16r8` | — / 5,376-9,009 | — / 8340KB-8346KB | — / 104KB-112KB |
+| `pc-macos` | — / 1,000,000-— | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-no-audio` (measure)  📏
 
@@ -395,14 +401,14 @@ Bare minimum at 16²: Grid + Layer + Checkerboard, no output driver, audio/disco
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 8,621 | — / 134KB | — / 108KB |
-| `esp32p4-eth` | — / 18,519-18,868 | — / 33243KB-33244KB | — / 376KB |
-| `esp32s3-n16r8` | — / 9,009-9,091 | — / 8338KB-8340KB | — / 104KB |
-| `pc-macos` | — / — | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 18,182-18,868 | — / 33228KB-33244KB | — / 376KB |
+| `esp32s3-n16r8` | — / 8,065-9,901 | — / 8338KB-8346KB | — / 104KB-112KB |
+| `pc-macos` | — / 1,000,000-— | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-quiet` (measure)  📏
 
@@ -416,14 +422,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 8,621 | — / 131KB | — / 108KB |
-| `esp32p4-eth` | — / 17,544-17,857 | — / 33243KB | — / 376KB |
-| `esp32s3-n16r8` | — / 8,929-9,091 | — / 8337KB-8340KB | — / 100KB-104KB |
-| `pc-macos` | — / — | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 17,544-18,519 | — / 33226KB-33243KB | — / 376KB |
+| `esp32s3-n16r8` | — / 8,696-9,901 | — / 8337KB-8346KB | — / 100KB-112KB |
+| `pc-macos` | — / 1,000,000-— | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-modifier` (measure)  📏
 
@@ -435,14 +441,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 3,175 | — / 130KB | — / 108KB |
-| `esp32p4-eth` | — / 10,204-10,417 | — / 33241KB | — / 376KB |
-| `esp32s3-n16r8` | — / 3,425-3,968 | — / 8336KB-8338KB | — / 104KB |
-| `pc-macos` | — / — | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 9,434-10,638 | — / 33224KB-33241KB | — / 376KB |
+| `esp32s3-n16r8` | — / 3,413-4,237 | — / 8336KB-8344KB | — / 104KB-112KB |
+| `pc-macos` | — / 1,000,000-— | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-preview` (measure)  📏
 
@@ -455,14 +461,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 8,696 | — / 123KB | — / 108KB |
-| `esp32p4-eth` | — / 15,873-17,857 | — / 33243KB | — / 376KB |
-| `esp32s3-n16r8` | — / 8,475-8,772 | — / 8335KB-8340KB | — / 100KB-104KB |
-| `pc-macos` | — / — | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 15,873-17,857 | — / 33228KB-33243KB | — / 376KB |
+| `esp32s3-n16r8` | — / 8,065-9,434 | — / 8335KB-8346KB | — / 92KB-112KB |
+| `pc-macos` | — / 200,000-— | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-network` (measure)  📏
 
@@ -474,14 +480,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 7,194 | — / 131KB | — / 108KB |
-| `esp32p4-eth` | — / 14,925-17,544 | — / 33240KB | — / 376KB |
-| `esp32s3-n16r8` | — / 7,092-8,065 | — / 8334KB-8337KB | — / 84KB-100KB |
-| `pc-macos` | — / — | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 14,493-17,544 | — / 33226KB-33240KB | — / 376KB |
+| `esp32s3-n16r8` | — / 7,092-8,065 | — / 8334KB-8344KB | — / 84KB-112KB |
+| `pc-macos` | — / 1,000,000-— | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-rmt` (measure)  📏
 
@@ -494,14 +500,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 6,579 | — / 106KB | — / 84KB |
-| `esp32p4-eth` | — / 17,241-17,857 | — / 33219KB | — / 376KB |
-| `esp32s3-n16r8` | — / 8,333-8,475 | — / 8307KB-8315KB | — / 84KB-104KB |
-| `pc-macos` | — / — | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 15,873-17,857 | — / 33200KB-33219KB | — / 376KB |
+| `esp32s3-n16r8` | — / 8,333-9,259 | — / 8307KB-8321KB | — / 84KB-112KB |
+| `pc-macos` | — / 1,000,000-— | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-lcd` (measure)  📏
 
@@ -514,14 +520,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 8,403 | — / 126KB | — / 108KB |
-| `esp32p4-eth` | — / 16,129-17,544 | — / 33243KB | — / 376KB |
-| `esp32s3-n16r8` | — / 7,042-8,403 | — / 8336KB-8338KB | — / 92KB-104KB |
-| `pc-macos` | — / — | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 16,129-17,857 | — / 33225KB-33243KB | — / 376KB |
+| `esp32s3-n16r8` | — / 7,042-9,259 | — / 8336KB-8345KB | — / 92KB-112KB |
+| `pc-macos` | — / 1,000,000-— | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-24
 
 #### `measure-parlio` (measure)  📏
 
@@ -534,14 +540,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 8,475 | — / 135KB | — / 108KB |
-| `esp32p4-eth` | — / 15,873-17,544 | — / 33243KB | — / 376KB |
-| `esp32s3-n16r8` | — / 7,692-8,475 | — / 8338KB | — / 104KB |
-| `pc-macos` | — / — | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 15,873-17,857 | — / 33225KB-33243KB | — / 376KB |
+| `esp32s3-n16r8` | — / 7,692-9,434 | — / 8338KB-8346KB | — / 104KB-112KB |
+| `pc-macos` | — / 1,000,000-— | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-24
 
 #### `measure-light-16` (measure)  📏
 
@@ -556,14 +562,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 6,711 | — / 134KB | — / 108KB |
-| `esp32p4-eth` | — / 16,393-18,868 | — / 33243KB | — / 376KB |
-| `esp32s3-n16r8` | — / 8,403-9,091 | — / 8336KB-8337KB | — / 100KB |
-| `pc-macos` | — / — | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 15,385-18,868 | — / 33226KB-33243KB | — / 376KB |
+| `esp32s3-n16r8` | — / 8,403-9,901 | — / 8336KB-8346KB | — / 100KB-112KB |
+| `pc-macos` | — / 1,000,000-— | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-24
 
 #### `measure-light-32` (measure)  📏
 
@@ -576,14 +582,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 2,801 | — / 134KB | — / 108KB |
-| `esp32p4-eth` | — / 7,463-7,519 | — / 33241KB | — / 376KB |
-| `esp32s3-n16r8` | — / 3,049-3,367 | — / 8331KB-8338KB | — / 100KB |
-| `pc-macos` | — / 1,000,000 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 7,246-7,519 | — / 33225KB-33241KB | — / 376KB |
+| `esp32s3-n16r8` | — / 3,049-3,597 | — / 8331KB-8343KB | — / 100KB-112KB |
+| `pc-macos` | — / 333,333-1,000,000 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-24
 
 #### `measure-light-64` (measure)  📏
 
@@ -596,14 +602,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 872 | — / 125KB | — / 108KB |
-| `esp32p4-eth` | — / 2,008-2,212 | — / 33232KB | — / 376KB |
-| `esp32s3-n16r8` | — / 917-998 | — / 8312KB-8330KB | — / 88KB-104KB |
-| `pc-macos` | — / 250,000 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 2,008-2,212 | — / 33218KB-33232KB | — / 376KB |
+| `esp32s3-n16r8` | — / 917-1,011 | — / 8312KB-8334KB | — / 88KB-112KB |
+| `pc-macos` | — / 12,658-250,000 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-24
 
 #### `measure-light-128` (measure)  📏
 
@@ -616,14 +622,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 229 | — / 89KB | — / 62KB |
-| `esp32p4-eth` | — / 515-559 | — / 33196KB | — / 376KB |
-| `esp32s3-n16r8` | — / 126-128 | — / 8291KB-8294KB | — / 100KB-104KB |
-| `pc-macos` | — / 58,824-62,500 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 515-573 | — / 33182KB-33196KB | — / 376KB |
+| `esp32s3-n16r8` | — / 126-134 | — / 8291KB-8298KB | — / 100KB-112KB |
+| `pc-macos` | — / 5,348-62,500 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-24
 
 #### `measure-heavy-16` (measure)  📏
 
@@ -637,14 +643,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 990 | — / 136KB | — / 108KB |
-| `esp32p4-eth` | — / 2,899-3,311 | — / 33243KB | — / 376KB |
-| `esp32s3-n16r8` | — / 1,252-1,355 | — / 8342KB | — / 108KB |
-| `pc-macos` | — / 250,000-333,333 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 2,899-3,311 | — / 33229KB-33243KB | — / 376KB |
+| `esp32s3-n16r8` | — / 1,148-1,361 | — / 8342KB-8346KB | — / 108KB-112KB |
+| `pc-macos` | — / 62,500-333,333 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-heavy-32` (measure)  📏
 
@@ -657,14 +663,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 312 | — / 134KB | — / 108KB |
-| `esp32p4-eth` | — / 799-893 | — / 33241KB | — / 376KB |
-| `esp32s3-n16r8` | — / 353-356 | — / 8339KB-8340KB | — / 108KB |
-| `pc-macos` | — / 62,500-71,429 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 799-893 | — / 33227KB-33241KB | — / 376KB |
+| `esp32s3-n16r8` | — / 290-356 | — / 8339KB-8343KB | — / 108KB-112KB |
+| `pc-macos` | — / 15,152-71,429 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-heavy-64` (measure)  📏
 
@@ -677,14 +683,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 73.8 | — / 125KB | — / 108KB |
-| `esp32p4-eth` | — / 222-229 | — / 33232KB | — / 376KB |
-| `esp32s3-n16r8` | — / 89.0-89.8 | — / 8330KB-8331KB | — / 108KB |
-| `pc-macos` | — / 14,085-16,129 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 196-229 | — / 33218KB-33232KB | — / 376KB |
+| `esp32s3-n16r8` | — / 87.9-90.3 | — / 8330KB-8334KB | — / 108KB-112KB |
+| `pc-macos` | — / 2,924-16,129 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17 → 2026-06-19
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-21
 
 #### `measure-heavy-128` (measure)  📏
 
@@ -697,14 +703,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 16.0 | — / 89KB | — / 62KB |
-| `esp32p4-eth` | — / 55.5-57.4 | — / 33196KB | — / 376KB |
-| `esp32s3-n16r8` | — / 19.8-20.3 | — / 8295KB | — / 108KB |
-| `pc-macos` | — / 2,915-3,247 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 55.5-57.4 | — / 33182KB-33196KB | — / 376KB |
+| `esp32s3-n16r8` | — / 19.6-20.8 | — / 8293KB-8298KB | — / 104KB-112KB |
+| `pc-macos` | — / 1,094-3,247 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17 → 2026-06-19
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-mod-16` (measure)  📏
 
@@ -718,14 +724,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 2,193 | — / 135KB | — / 108KB |
-| `esp32p4-eth` | — / 6,135-6,494 | — / 33241KB | — / 376KB |
-| `esp32s3-n16r8` | — / 2,597 | — / 8340KB | — / 108KB |
-| `pc-macos` | — / 1,000,000 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 6,098-6,494 | — / 33224KB-33241KB | — / 376KB |
+| `esp32s3-n16r8` | — / 2,193-2,618 | — / 8340KB-8344KB | — / 108KB-112KB |
+| `pc-macos` | — / 333,333-1,000,000 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-mod-32` (measure)  📏
 
@@ -738,14 +744,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 553 | — / 130KB | — / 108KB |
-| `esp32p4-eth` | — / 1,821-1,876 | — / 33235KB | — / 376KB |
-| `esp32s3-n16r8` | — / 636 | — / 8329KB | — / 100KB |
-| `pc-macos` | — / 250,000-333,333 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 1,631-1,876 | — / 33218KB-33235KB | — / 376KB |
+| `esp32s3-n16r8` | — / 600-710 | — / 8329KB-8337KB | — / 100KB-112KB |
+| `pc-macos` | — / 90,909-333,333 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-mod-64` (measure)  📏
 
@@ -758,14 +764,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 144 | — / 111KB | — / 96KB |
-| `esp32p4-eth` | — / 461-486 | — / 33208KB | — / 376KB |
-| `esp32s3-n16r8` | — / 153 | — / 8307KB | — / 108KB |
-| `pc-macos` | — / 62,500-71,429 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 438-486 | — / 33194KB-33208KB | — / 376KB |
+| `esp32s3-n16r8` | — / 153-162 | — / 8307KB-8311KB | — / 108KB-112KB |
+| `pc-macos` | — / 23,256-71,429 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-mod-128` (measure)  📏
 
@@ -778,14 +784,14 @@ Quiet baseline: render-only, audio + discovery off. The cleanest render floor; t
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 35.1 | — / 36KB | — / 26KB |
-| `esp32p4-eth` | — / 98.6-102 | — / 33103KB | — / 376KB |
-| `esp32s3-n16r8` | — / 33.7 | — / 8202KB | — / 108KB |
-| `pc-macos` | — / 14,286-15,873 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 98.2-102 | — / 33089KB-33103KB | — / 376KB |
+| `esp32s3-n16r8` | — / 29.5-35.6 | — / 8202KB-8205KB | — / 108KB-112KB |
+| `pc-macos` | — / 5,263-16,129 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17 → 2026-06-18
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 ### scenario_perf_light
 
@@ -812,14 +818,14 @@ Bare minimum: Grid(16²) + Layer + Checkerboard (light effect). No modifier, no
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 6,173-8,772 | — / 125KB-131KB | — / 108KB |
-| `esp32p4-eth` | — / 13,889-18,519 | — / 33243KB-33244KB | — / 376KB |
-| `esp32s3-n16r8` | — / 7,143-8,850 | — / 8316KB-8335KB | — / 80KB-100KB |
-| `pc-macos` | — / — | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 13,699-18,519 | — / 33228KB-33244KB | — / 376KB |
+| `esp32s3-n16r8` | — / 6,711-8,850 | — / 8316KB-8339KB | — / 80KB-104KB |
+| `pc-macos` | — / 1,000,000-— | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-24
 
 #### `measure-with-modifier` (measure)  📏
 
@@ -833,13 +839,13 @@ Cost of the modifier + LUT over the minimal pipeline. Heap delta vs measure-mini
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 3,077-3,289 | — / 131KB-135KB | — / 108KB |
-| `esp32p4-eth` | — / 9,615-10,204 | — / 33241KB-33242KB | — / 376KB |
-| `esp32s3-n16r8` | — / 3,922-4,032 | — / 8330KB-8331KB | — / 96KB |
+| `esp32p4-eth` | — / 9,615-10,204 | — / 33226KB-33242KB | — / 376KB |
+| `esp32s3-n16r8` | — / 3,922-4,032 | — / 8330KB-8335KB | — / 96KB-100KB |
 | `pc-macos` | — / — | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
 - `pc-macos`: observed 2026-06-17
 
 #### `measure-with-preview` (measure)  📏
@@ -851,13 +857,13 @@ PreviewDriver is the pre-wired apparatus — it survives clear_children and is a
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 3,247-3,289 | — / 132KB-133KB | — / 108KB |
-| `esp32p4-eth` | — / 10,638-10,753 | — / 33241KB | — / 376KB |
-| `esp32s3-n16r8` | — / 4,115-4,149 | — / 8330KB-8333KB | — / 96KB-100KB |
+| `esp32p4-eth` | — / 10,526-10,753 | — / 33226KB-33241KB | — / 376KB |
+| `esp32s3-n16r8` | — / 4,115-4,202 | — / 8330KB-8334KB | — / 96KB-100KB |
 | `pc-macos` | — / — | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
 - `pc-macos`: observed 2026-06-17
 
 #### `measure-heavy-16` (measure)  📏
@@ -870,14 +876,14 @@ PreviewDriver is the pre-wired apparatus — it survives clear_children and is a
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 1,905-3,268 | — / 131KB | — / 108KB |
-| `esp32p4-eth` | — / 5,556-6,494 | — / 33241KB | — / 376KB |
-| `esp32s3-n16r8` | — / 2,463-2,469 | — / 8333KB | — / 100KB |
-| `pc-macos` | — / 1,000,000 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 5,556-6,494 | — / 33224KB-33241KB | — / 376KB |
+| `esp32s3-n16r8` | — / 2,463-2,506 | — / 8332KB-8333KB | — / 88KB-100KB |
+| `pc-macos` | — / 333,333-1,000,000 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-heavy-32` (measure)  📏
 
@@ -890,14 +896,14 @@ PreviewDriver is the pre-wired apparatus — it survives clear_children and is a
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 539-826 | — / 130KB | — / 108KB |
-| `esp32p4-eth` | — / 1,876-1,880 | — / 33235KB | — / 376KB |
-| `esp32s3-n16r8` | — / 562-655 | — / 8330KB-8333KB | — / 100KB-104KB |
-| `pc-macos` | — / 250,000-333,333 | — / unlimited | — / unlimited |
+| `esp32p4-eth` | — / 1,818-1,880 | — / 33221KB-33235KB | — / 376KB |
+| `esp32s3-n16r8` | — / 562-715 | — / 8330KB-8333KB | — / 100KB-104KB |
+| `pc-macos` | — / 90,909-333,333 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
-- `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
+- `esp32s3-n16r8`: observed 2026-06-17 → 2026-06-22
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
 
 #### `measure-heavy-64` (measure)  📏
 
@@ -910,14 +916,48 @@ PreviewDriver is the pre-wired apparatus — it survives clear_children and is a
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32` | — / 151-227 | — / 111KB | — / 88KB-96KB |
-| `esp32p4-eth` | — / 485-491 | — / 33208KB | — / 376KB |
+| `esp32p4-eth` | — / 473-491 | — / 33195KB-33208KB | — / 376KB |
 | `esp32s3-n16r8` | — / 146-157 | — / 8305KB-8307KB | — / 96KB-108KB |
-| `pc-macos` | — / 62,500-71,429 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 22,727-71,429 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-17
-- `esp32p4-eth`: observed 2026-06-17
+- `esp32p4-eth`: observed 2026-06-17 → 2026-06-22
 - `esp32s3-n16r8`: observed 2026-06-17
-- `pc-macos`: observed 2026-06-17
+- `pc-macos`: observed 2026-06-17 → 2026-06-25
+
+## Layers
+
+### scenario_Layers_composition
+
+`test/scenarios/light/scenario_Layers_composition.json` — Multi-layer composition end-to-end: Layouts→Grid, TWO Layers under one Layers container (bottom Checkerboard, top Rainbow), Drivers→NetworkSendDriver. Proves the Drivers composite loop builds, allocates its output buffer, blends both enabled layers and feeds the result to the driver without crashing, and gates the bounded FPS so the N-pass composite cost is tracked. The exact alpha/additive blend math and the disable-drops-to-single-layer path are pinned by the unit tests (unit_BlendMap, unit_Layers_container); construct-mode set_control can't apply controls (built post-scheduler), so this scenario uses each Layer's default blend (alpha, full opacity) and asserts wired liveness + tick, not per-byte blend output.
+
+**Mode**: `construct` · **Also touches**: Layer, GridLayout, RainbowEffect, CheckerboardEffect, Drivers, NetworkSendDriver
+
+#### `add-artnet` (add_module)  📏
+
+Add NetworkSendDriver and run the bounded FPS measurement over the two-layer composite (min_pct gates on hardware; skipped with a WARN in the desktop runner).
+
+**Setup** (preceding non-measured steps):
+- `add-layout-group` (add_module) — Top-level Layouts container.
+- `add-grid` (add_module) — 128x128 GridLayout under Layouts (above host clock resolution so the composite tick is measurable).
+- `add-layers-group` (add_module) — Top-level Layers container — the multi-layer composition host.
+- `add-bottom-layer` (add_module) — Bottom Layer (composited first — clears + overwrites the output buffer). RGB.
+- `add-bottom-effect` (add_module) — A Checkerboard base as the bottom layer's effect.
+- `add-top-layer` (add_module) — Top Layer (composited second — blends onto the bottom with its default blend). RGB.
+- `add-top-effect` (add_module) — Rainbow as the top layer's effect — composited over the Checkerboard base.
+- `add-driver-group` (add_module) — Top-level Drivers container wired to the Layers container (composites all enabled layers into its output buffer).
+
+**Bounds**:
+- FPS ≥ 80% of baseline
+- FPS × lights ≥ 294,912
+
+**Performance** (contract / observed) — tick stored, FPS shown:
+
+| Board | FPS | heap | block |
+|---|---|---|---|
+| `pc-macos` | — / 6,135-10,417 | — / unlimited | — / unlimited |
+
+- `pc-macos`: observed 2026-06-25
 
 ## Layouts
 
@@ -939,11 +979,11 @@ Baseline: a single 64x64 grid layout drives the pipeline.
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32-eth` | — / 41,667 | — / 224KB | — / 108KB |
-| `pc-macos` | — / 29,412-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 25,000-125,000 | — / unlimited | — / unlimited |
 | `pc-windows` | — / 32,258-37,037 | — / unlimited | — / unlimited |
 
 - `esp32-eth`: observed 2026-06-08
-- `pc-macos`: observed 2026-06-05
+- `pc-macos`: observed 2026-06-05 → 2026-06-25
 - `pc-windows`: observed 2026-06-07
 
 #### `measure-two-layouts` (measure)  📏
@@ -961,11 +1001,11 @@ Pipeline still renders with two layouts wired (buffer non-null, fps measurable).
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32-eth` | — / 37,037 | — / 223KB | — / 108KB |
-| `pc-macos` | — / 21,739-111,111 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 11,905-111,111 | — / unlimited | — / unlimited |
 | `pc-windows` | — / 16,393-23,810 | — / unlimited | — / unlimited |
 
 - `esp32-eth`: observed 2026-06-08
-- `pc-macos`: observed 2026-06-05 → 2026-06-11
+- `pc-macos`: observed 2026-06-05 → 2026-06-25
 - `pc-windows`: observed 2026-06-07
 
 #### `measure-after-replace` (measure)  📏
@@ -983,11 +1023,11 @@ Pipeline still renders after replacing a grid with a sphere (different layout ty
 | Board | FPS | heap | block |
 |---|---|---|---|
 | `esp32-eth` | — / 38,462 | — / 223KB | — / 108KB |
-| `pc-macos` | — / 5,747-100,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 3,690-100,000 | — / unlimited | — / unlimited |
 | `pc-windows` | — / 5,848-9,009 | — / unlimited | — / unlimited |
 
 - `esp32-eth`: observed 2026-06-08
-- `pc-macos`: observed 2026-06-05 → 2026-06-11
+- `pc-macos`: observed 2026-06-05 → 2026-06-25
 - `pc-windows`: observed 2026-06-07
 
 #### `measure-after-remove` (measure)  📏
@@ -1042,14 +1082,14 @@ Set NoiseEffect.scale=4 and measure baseline FPS (mirror on). Effect controls do
 | `esp32-eth` | — / 10.5-10.6 | — / 133KB | — / 48KB-50KB |
 | `esp32-eth-wifi` | ≥ 10.0 / 12.2 | ≥ 103KB / 94KB | — / 48KB |
 | `esp32p4-eth` | — / 4,926-6,250 | — / 33238KB | — / 376KB |
-| `pc-macos` | ≥ 8,333 / 4,505-10,309 | unlimited / unlimited | — / unlimited |
+| `pc-macos` | ≥ 8,333 / 3,165-10,309 | unlimited / unlimited | — / unlimited |
 | `pc-windows` | — / 4,000-4,405 | — / unlimited | — / unlimited |
 
 - `esp32`: observed 2026-06-02
 - `esp32-eth`: observed 2026-06-02
 - `esp32-eth-wifi`: contract set 2026-06-02 "initial contract" · observed 2026-06-02
 - `esp32p4-eth`: observed 2026-06-17
-- `pc-macos`: contract set 2026-06-02 "initial contract" · observed 2026-06-02 → 2026-06-07
+- `pc-macos`: contract set 2026-06-02 "initial contract" · observed 2026-06-02 → 2026-06-25
 - `pc-windows`: observed 2026-06-07
 
 #### `disable-mirrorX` (set_control)  📏
@@ -1179,10 +1219,10 @@ Add NetworkSendDriver and run the bounded FPS measurement (mirror + LUT path mus
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | ≥ 8,333 / 4,065-1,000,000 | unlimited / unlimited | — / unlimited |
+| `pc-macos` | ≥ 8,333 / 3,676-1,000,000 | unlimited / unlimited | — / unlimited |
 | `pc-windows` | — / 3,953-4,444 | — / unlimited | — / unlimited |
 
-- `pc-macos`: contract set 2026-06-02 "initial contract" · observed 2026-06-02 → 2026-06-05
+- `pc-macos`: contract set 2026-06-02 "initial contract" · observed 2026-06-02 → 2026-06-25
 - `pc-windows`: observed 2026-06-07
 
 ## NetworkModule
@@ -1332,9 +1372,9 @@ Baseline: the pipeline renders with one driver (Preview) wired.
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | — / 90,909-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 29,412-125,000 | — / unlimited | — / unlimited |
 
-- `pc-macos`: observed 2026-06-13 → 2026-06-16
+- `pc-macos`: observed 2026-06-13 → 2026-06-24
 
 #### `measure-two-drivers` (measure)  📏
 
@@ -1350,9 +1390,9 @@ Pipeline renders with both drivers wired.
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | — / 100,000-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 17,857-125,000 | — / unlimited | — / unlimited |
 
-- `pc-macos`: observed 2026-06-13 → 2026-06-16
+- `pc-macos`: observed 2026-06-13 → 2026-06-22
 
 #### `measure-three-drivers` (measure)  📏
 
@@ -1368,9 +1408,9 @@ Pipeline renders with three drivers wired.
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | — / 100,000-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 38,462-125,000 | — / unlimited | — / unlimited |
 
-- `pc-macos`: observed 2026-06-13 → 2026-06-16
+- `pc-macos`: observed 2026-06-13 → 2026-06-25
 
 #### `measure-after-first-remove` (measure)  📏
 
@@ -1386,9 +1426,9 @@ One ArtNet gone, Preview + ArtNet2 remain: pipeline keeps rendering (buffer non-
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | — / 100,000-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 30,303-125,000 | — / unlimited | — / unlimited |
 
-- `pc-macos`: observed 2026-06-13 → 2026-06-16
+- `pc-macos`: observed 2026-06-13 → 2026-06-24
 
 #### `measure-back-to-one-driver` (measure)  📏
 
@@ -1404,6 +1444,6 @@ Both added drivers gone, back to the single Preview baseline, still rendering 
 
 | Board | FPS | heap | block |
 |---|---|---|---|
-| `pc-macos` | — / 100,000-125,000 | — / unlimited | — / unlimited |
+| `pc-macos` | — / 38,462-125,000 | — / unlimited | — / unlimited |
 
-- `pc-macos`: observed 2026-06-13 → 2026-06-15
+- `pc-macos`: observed 2026-06-13 → 2026-06-24
diff --git a/docs/tests/unit-tests.md b/docs/tests/unit-tests.md
index b95a4f3..5f96101 100644
--- a/docs/tests/unit-tests.md
+++ b/docs/tests/unit-tests.md
@@ -48,9 +48,19 @@ Unit tests are the fastest tier in the [test strategy](../testing.md): they run
 - Identity mapping (logical N → physical N) leaves every byte unchanged.
 - One logical light routed to multiple physical positions copies the colour to each (mirror-style mappings work).
 - A paged LUT (forced via the maxAllocBlock test cap) must produce a byte-identical dst to a single-alloc LUT with the same mapping. Paging is an allocation detail; blendMap output must not depend on it. This is the end-to-end pin for the no-PSRAM-fragmentation fix.
-- An additive (overwrites=false) LUT folding two sources onto one physical light adds and clamps at 255 (no overflow). overwrites=false is the opt-in for the rare overlap case (future multi-layer compositing); the default copy path would instead overwrite, so this pins the additive contract explicitly.
+- An additive (overwrites=false) LUT folding two sources onto one physical light adds and clamps at 255 (no overflow). overwrites=false is the opt-in for the within-layer overlap case, where the default copy path would instead overwrite. A full-opacity Overwrite op still routes through this additive accumulate, so this test pins that contract explicitly (it is the regression target after the multi-layer rewrite).
 - The default (overwrites=true) path plain-copies: two sources mapped to the same physical means the LAST writer wins, no addition. Pins the fast path.
 - Sparse overwrite mapping clears untouched physical cells. A sphere-style layout maps only a subset of the physical box to a source; the rest must end up black, not retain stale data from a previous frame. Pre-fills dst dirty and asserts unmapped cells are zeroed — fails if BlendMap's dst.clear() is removed (the regression target).
+- Alpha-over at half opacity: dst = (src*α + dst*(255-α)) / 255. With dst=200, src=100, α=128 → 100*128 + 200*127 = 12800 + 25400 = 38200; 38200/255 ≈ 149.8 ≈ 150.
+- Alpha at full opacity collapses to overwrite (src replaces dst exactly).
+- Alpha at opacity 0 is a no-op (dst unchanged) — the invisible-layer case.
+- Additive with opacity scales the source before adding, then clamps. dst=100, src=200, opacity=128 → add 200*128/255 ≈ 100 → 200.
+- clearFirst=false preserves dst cells the source doesn't touch — the mechanic that lets a top layer blend onto the bottom layer's already-composited frame.
+- No-LUT alpha-over at half opacity: dst = div255(src*α + dst*(255-α)). dst=200, src=100, α=128 → div255(100*128 + 200*127) = div255(38200) = 149.
+- No-LUT alpha at full opacity collapses to a plain copy (overwrite).
+- No-LUT alpha at opacity 0 is a no-op (the invisible top layer).
+- No-LUT additive with opacity scales the source, adds it, then clamps at 255. dst=100, src=200, opacity=128 → 100 + div255(200*128) = 100 + 100 = 200.
+- No-LUT additive at full opacity saturates: 200 + 100 = 300 → clamp 255.
 
 ## Buffer
 
@@ -110,6 +120,9 @@ Unit tests are the fastest tier in the [test strategy](../testing.md): they run
 - The core regression: a control bound with a non-zero value, overlaid with a JSON that does NOT contain its key, must keep its value — not snap to 0.
 - A present key still applies (the fix must not break the normal load path).
 - A present key whose value IS 0 must apply the 0 (don't confuse "present 0" with "absent"). Guards against an over-eager fix that skipped on value rather than key.
+- _a per-control validator accepts a valid value and rejects bad input_
+- Length boundary of the deviceModel validator (accepts 1..31). Uses a buffer wider than the validator's limit so the 32-char value reaches the validator intact (parseString truncates to bufSize-1, so the buffer must exceed 32 for the validator's own length check — not parse truncation — to be what rejects it). The scratch buffer in applyControlValue is sized to bufSize, so a long value isn't truncated before validation.
+- _a Text control with no validator accepts anything that fits_
 
 `test/unit/core/unit_Control_list.cpp`
 
@@ -178,7 +191,7 @@ Unit tests are the fastest tier in the [test strategy](../testing.md): they run
 - Companion to the wiredByCode case above: when the JSON describes a different type at the position where a code-wired child lives, the position-replacement must NOT kill the code-wired child. Stop reconciliation at that index instead and let the next save re-write the file with the actual tree shape. When the saved JSON wants a different type at the position where a code-wired child lives, reconciliation stops at that index instead of destroying the wired child.
 - Round-trip persistence with children: write a Layer subtree that contains both controls and child modules with controls of their own, then read the file back as text and verify it parses as valid JSON. Regresses the missing-comma bug between each child's "N.type" field and that child's first control (e.g. "0.type":"X""0.foo":1 instead of "0.type":"X","0.foo":1). Saving a Layer with multiple children produces valid JSON — comma separators between child `N.type` and the child's first control field are present.
 - Singleton survives probe lifecycle: /api/types factory-creates a probe of every registered type (including FilesystemModule) to capture defaults, then deletes it. The probe's destructor must NOT clear the singleton — otherwise every save path (noteDirty, debounced loop1s, flushPending on reboot) silently no-ops for the rest of the device's life. The fix is to register the singleton in setScheduler(), not in the constructor. This test catches that singleton-clear regression. /api/types factory-creates a temporary FilesystemModule probe; its destruction must NOT clear the static singleton (otherwise every later save silently no-ops).
-- Regression: Int16 controls (GridLayout's width/height/depth, Layer's start/end) round-tripped through the filesystem load path were clamped to c.min/c.max, which default to 0,0 because ControlDescriptor.min/max are uint8_t and can't represent an int16 range. Every Int16 control loaded as 0 — so a 128×128 grid became 0×0×0 after restart and the whole pipeline allocated no buffers. Int16 controls (GridLayout width/height, Layer start/end) preserve their saved value across load — no zero-clamping from uint8 min/max bounds.
+- Int16 controls preserve their saved value across a filesystem load — the load path does not clamp them to `c.min`/`c.max` (which are `uint8_t` and so default to 0,0, a range that can't represent an int16). Without this a 128×128 grid would reload as 0×0×0 and the pipeline would allocate no buffers; the test pins the round-trip so an Int16 value survives unclamped.
 
 ## FireEffect
 
@@ -188,6 +201,12 @@ Unit tests are the fastest tier in the [test strategy](../testing.md): they run
 - With sparking at max, the buffer contains non-zero pixels within 50 frames (sparks emerge and propagate).
 - Disabling the effect releases its heat buffer back (dynamicBytes drops to 0).
 
+## FirmwareUpdateModule
+
+`test/unit/core/unit_FirmwareUpdateModule.cpp`
+
+- The `firmware` control is always present and non-empty (either a real firmware key from build_info.h or the fallback "unknown"). The firmware card owns firmware identity (version/build/firmware) + the partition usage.
+
 ## GameOfLifeEffect
 
 `test/unit/light/unit_GameOfLifeEffect.cpp`
@@ -209,11 +228,22 @@ Unit tests are the fastest tier in the [test strategy](../testing.md): they run
 *Also touches: Layouts.*
 
 - A 4×4×1 grid yields 16 lights iterated row-major: x sweeps fastest, then y, then z.
+- Serpentine reverses x on odd rows (boustrophedon), so the strip snakes back and forth: driver index advances linearly while the emitted x zigzags. Even rows L→R, odd rows R→L. The COORDINATE is always the true (x,y) — only the index→position order changes, which is what makes the mapping non-identity.
 - A 3D 2×2×2 grid yields 8 lights with z-plane separation (indices 0-3 at z=0, 4-7 at z=1).
 - A single-light grid (1×1×1) is a valid layout: one coordinate at (0,0,0).
 - Layouts with a single child delegates totalLightCount and forEachCoord to that child directly.
 - Two child layouts produce contiguous physical indices: the second layout's coords are offset by the first's lightCount.
 
+## HttpServerModule
+
+`test/unit/core/unit_HttpServerModule_apply.cpp`
+
+- _apply-core: applyAddModule adds a child, idempotent on the id_
+- _apply-core: applySetControl writes a value, rejects out-of-range / unknown_
+- _apply-core: applyClearChildren empties a container (replaceChildren)_
+- _apply-core: applyOp dispatches each op type and tolerates bad input_
+- A per-control validator (like SystemModule.deviceModel's printable-ASCII rule) is enforced THROUGH the apply-core — so the APPLY_OP `set` the installer pushes over serial is guarded exactly like an HTTP write, with no per-transport special-casing. This is the point of moving validation onto the control: one backend check, every path.
+
 ## ImprovFrame
 
 `test/unit/core/unit_ImprovFrame.cpp`
@@ -233,6 +263,21 @@ Unit tests are the fastest tier in the [test strategy](../testing.md): they run
 - Every defined ImprovFrameType (CurrentState, ErrorState, Rpc, RpcResponse) round-trips through builder + parser cleanly.
 - After FrameReady the parser returns to Magic0 and parses the next frame on the same instance without reset.
 
+## ImprovOpReassembler
+
+`test/unit/core/unit_ImprovOpReassembler.cpp`
+
+- _a single-frame op (seq 0, last 1) is Ready with the exact bytes_
+- _a multi-chunk op reassembles in order and NUL-terminates_
+- _a duplicate chunk is rejected and resets the buffer_
+- _an out-of-order chunk (skipped seq) is rejected_
+- _a non-zero opening seq (no fresh start) is rejected_
+- _overflow past the buffer (minus the NUL) is rejected, not truncated_
+- _exactly buffer-minus-one bytes fits (boundary)_
+- _seq 0 mid-stream abandons a partial op and starts fresh_
+- _an empty final chunk still completes (last with zero bytes)_
+- _reset() drops a partial op_
+
 ## JsonUtil
 
 `test/unit/core/unit_JsonUtil_parse.cpp`
@@ -274,6 +319,7 @@ Unit tests are the fastest tier in the [test strategy](../testing.md): they run
 `test/unit/light/unit_Layer_sparse_mapping.cpp`
 
 - Dense grid: every box cell is a light, so no LUT — the identity/memcpy fast path is preserved exactly (the grid short-circuit).
+- Serpentine grid: dense (every box cell is a light, so the count check alone would pick the identity fast path) but SHUFFLED (driver index i != box cell i). isNaturalOrder() measures that from the coords and routes it through the box->driver LUT instead. This is the lever for exercising the non-identity mapping path without a sparse layout or a modifier.
 - Sparse sphere: a LUT is built; its destinations are driver indices in [0, lightCount), and the render buffer stays the dense bounding box.
 - Sphere + Mirror: the modifier's box-coordinate destinations are translated into driver-index space; no destination escapes [0, lightCount).
 - REGRESSION: a high fan-out Multiply (8×8×4 = 256) on a 128×128 grid must build a NON-EMPTY LUT that covers every physical light. The maxDest estimate (logicalCount × maxMultiplier) is computed in 64-bit; before that fix it overflowed uint16 on no-PSRAM boards (256 × 256 = 65536 wraps to 0), sized the LUT to ~nothing, and blanked the display. Here we assert the LUT actually maps the full light set, in range — the symptom that black-screened the device.
@@ -302,6 +348,9 @@ Unit tests are the fastest tier in the [test strategy](../testing.md): they run
 
 - A Layers container with one child Layer must produce the same output as that Layer used directly (no-op container).
 - With two child Layers, each one's loop() runs and writes its own buffer (the container iterates all enabled children).
+- Multi-layer composition: Drivers blends ≥2 enabled Layers into its own output buffer and hands THAT to drivers (not a single Layer's buffer). Bottom layer overwrites; top layer blends per its blendMode/opacity. This is the end-to-end pin for the composite loop in Drivers::loop.
+- Disabling the top layer drops cleanly to the single (bottom) layer — no crash, the driver now sees the bottom layer's content. Pins the robustness path.
+- Drivers' composition/output-buffer allocation contract (architecture.md § Adaptive allocation). The driver output buffer exists ONLY when the pipeline must blend into physical space; otherwise the lone layer's buffer is handed to drivers directly (zero-copy). dynamicBytes() reflects outputBuffer_.bytes(), so it's 0 ⇔ no buffer. Pins all three cases in one place: (1) one identity (no-LUT) layer → NO output buffer (zero-copy); (2) two enabled layers → output buffer (must composite); (3) one layer WITH a LUT → output buffer (must map logical→physical).
 - activeLayer() returns the first enabled child, or the only child if all are disabled (so dimensions stay queryable during boot/toggle-off).
 - If the container holds only non-Layer children, activeLayer() returns nullptr (the role-guard skips, never miscasts).
 
@@ -566,9 +615,17 @@ Unit tests are the fastest tier in the [test strategy](../testing.md): they run
 - A sphere sends its SHELL lights (210), not the dense 9x9x9 box (729).
 - Per-frame 0x02 RGB count matches the coordinate-table count.
 - A small grid sends every light at its grid position (stride 1, exact).
-- A large layout is index-downsampled (stride > 1) so the payload fits the send-buffer cap — but at REAL positions, not a padded box.
+- A large layout is SPATIALLY downsampled (a regular per-axis lattice, not every-Nth-flat-index) so the payload fits the send-buffer cap without the diagonal moiré that linear stride produced on a grid whose width didn't divide the stride. The wire "stride" field carries the per-axis lattice/downscale factor (colour k still maps 1:1 to coord k).
+- A SPARSE layout under the cap must NOT be downsampled for its big BOUNDING BOX alone: the lattice bound is the layout's LIGHT count, not its box cell count, so a sphere whose shell fits the cap sends every light at stride 1 (a radius-8 sphere → ~812 shell lights, well under the 4096 display cap, in a 17³≈4913-cell box). (A genuinely huge sparse layout above the cap downsamples like any other — the cap is about points streamed, not box size.)
 - Default fps is the rate-limited preview stream rate.
+- Regression: a coordinate table dropped under backpressure must be RETRIED, and colour frames withheld until it lands — otherwise the device sends 0x02 frames the browser skips (count mismatch) and the preview freezes for the whole session. Drives loop() (where the coord-pending logic lives) with a broadcaster that drops every 0x03, then lets it through.
 - Regression: deleting the active Layer must not leave a driver holding a dangling layer_ pointer. Previously Drivers::passBufferToDrivers early-returned when the active Layer was null, leaving PreviewDriver's layer_ pointing at the freed Layer; the next onBuildState read layer_->layouts() on freed memory and crashed the device (LoadProhibited → boot loop, since the broken tree persists). Now passBufferToDrivers clears the drivers' layer_/sourceBuffer_ to null, a safe idle state. This drives the real path: Drivers bound to a Layers CONTAINER (self-healing), the Layer removed, then buildState re-resolves activeLayer()=null.
+- Coordinates are sent ONLY when the geometry changes or a new client connects — never per-frame and never on a timer (a periodic full-table rebuild would starve the tick). A new client (clientGeneration bump) re-sends immediately so a page refresh shows the preview at once. Driven through loop() with a frozen clock for determinism.
+- A full-res RGB frame is sent through the RESUMABLE buffered path (sendBufferedFrame), whose body is the DRIVER (consumer) buffer itself — no copy. For a dense identity grid that's the Layer's dense box buffer; for a sparse/mapped layout it's the LUT-mapped output buffer (the real lights), the same buffer the LED drivers consume — NOT the dense box.
+- Sparse layout: the buffered send streams the LUT-mapped DRIVER buffer (only the real lights, in driver order), exactly like the LED drivers — NOT the dense bounding box. So coordCount == the shell count and the frame is sent whole at full res through the resumable path.
+- Dense-grid CLOSED-FORM downsample, exact colour placement: a 200×1 strip pinned over a small cap strides in x only, so the kept lights are columns 0,s,2s,… The colour pass must read each from its dense buffer index (closed-form x for a 1-row grid) and pack them in the SAME order as the coord table — no forEachCoord. Painting a known colour at a kept column and finding it at the matching frame position pins the index math + the lattice order.
+- ADAPTIVE FRAME RATE: while a buffered send is still draining (a slow link), loop() must NOT start a new frame — it waits for bufferedSendIdle(). So the effective rate self-limits to the link.
+- USE-AFTER-FREE GUARD: a geometry rebuild (resize) frees+reallocs the producer buffer, so any in-flight buffered send (which holds a pointer into it) MUST be cancelled in onBuildState before the buffer goes away — else drainPreviewSend would read freed memory.
 
 ## RainbowEffect
 
@@ -698,7 +755,6 @@ Unit tests are the fastest tier in the [test strategy](../testing.md): they run
 - deviceName is the single network identity, so SystemModule keeps it a valid hostname. A live edit to an invalid value ("My Room!") is coerced on the next loop1s tick (mm::sanitizeHostname), the same path mDNS/AP/DHCP read — so they never see spaces.
 - An all-invalid name collapses to empty after sanitising; the MAC fallback then fills it, so deviceName is never empty (mDNS/AP/DHCP always have a name to register).
 - An already-valid name is left untouched (idempotent) — a normal user name survives.
-- The `firmware` control is always present and non-empty (either a real firmware key from build_info.h or the fallback "unknown").
 - The `bootReason` control is populated from platform::resetReason; on desktop it reports "OK".
 - SystemModule accepts user-added Peripheral children (sensors/actuators the user solders on); the role string drives the type-picker filter + add policy.
 - Regression: SystemModule overrides setup() and loop1s(); both must chain to MoonModule's base so a Peripheral child's setup()/loop1s() actually fire. Without the chain a sensor would never init or poll (the "children miss callbacks" trap from history/decisions.md). loop20ms() isn't overridden, so the base default already propagates it.
diff --git a/esp32/main/CMakeLists.txt b/esp32/main/CMakeLists.txt
index 1d234cb..362864a 100644
--- a/esp32/main/CMakeLists.txt
+++ b/esp32/main/CMakeLists.txt
@@ -69,6 +69,14 @@ if(MM_RELEASE)
     # #ifndef "" default.
     target_compile_definitions(${COMPONENT_LIB} PRIVATE MM_RELEASE=${MM_RELEASE})
 endif()
+if(MM_VERSION)
+    # Same quoting note again. The computed semver (compute_version.py): the core
+    # for a stable tag, <core>-dev.<N> for a moving latest build. Only the release
+    # pipeline sets it; a local build falls through to build_info.h's #ifndef
+    # default (library.json). Overrides the header's #ifndef so the binary, the
+    # release asset names, and the manifest all carry the same version.
+    target_compile_definitions(${COMPONENT_LIB} PRIVATE MM_VERSION=${MM_VERSION})
+endif()
 if(MM_ETH_ONLY)
     target_compile_definitions(${COMPONENT_LIB} PRIVATE MM_NO_WIFI)
 endif()
diff --git a/library.json b/library.json
index 9c16d76..8f844fa 100644
--- a/library.json
+++ b/library.json
@@ -1,5 +1,5 @@
 {
   "name": "projectMM",
-  "version": "2.0.0",
+  "version": "2.1.0-dev",
   "description": "Multi-platform LED/DMX lighting system"
 }
diff --git a/scripts/build/build_esp32.py b/scripts/build/build_esp32.py
index 5aead96..3ef1b2c 100644
--- a/scripts/build/build_esp32.py
+++ b/scripts/build/build_esp32.py
@@ -43,7 +43,7 @@
 # *build-time* cost only: the linker dead-strips the unused code, so they add ~0
 # bytes of flash to esp32p4-eth (our coprocessorWifi() is the empty stub there, so
 # no esp_hosted symbol is referenced — confirmed: their .text size is 0x0 in the
-# .map). Left as-is rather than fought; see docs/backlog/backlog.md.
+# .map). Left as-is rather than fought; see docs/backlog/.
 ETH_ONLY_EXCLUDE = ["esp_wifi", "wpa_supplicant", "esp_coex"]
 
 # Firmware catalogue. Each entry describes one shipping firmware variant.
@@ -288,12 +288,17 @@ def idf_cmd(idf_path: Path) -> list[str]:
     return [python_exe, str(idf_path / "tools" / "idf.py")]
 
 
-def firmware_cmake_args(firmware: str, release: str = "") -> list[str]:
+def firmware_cmake_args(firmware: str, release: str = "", version: str = "") -> list[str]:
     """Extra -D cache args for the requested firmware.
 
     `release` is the release-channel tag (e.g. "latest", "v1.0.0") to burn
     into the binary as MM_RELEASE. Empty for local builds — SystemModule
     then shows the bare semver with no channel suffix.
+
+    `version` overrides MM_VERSION with the pipeline-computed semver
+    (compute_version.py): the core for a stable tag, `<core>-dev.<N>` for a
+    moving `latest` build. Empty for local builds — build_info.h's #ifndef
+    default (library.json) applies.
     """
     spec = FIRMWARES[firmware]
     fragments = ";".join(spec["fragments"])
@@ -307,6 +312,9 @@ def firmware_cmake_args(firmware: str, release: str = "") -> list[str]:
     # local build needs no flag.
     if release:
         args.append(f'-DMM_RELEASE="{release}"')
+    # Same for the computed version — empty leaves build_info.h's library.json default.
+    if version:
+        args.append(f'-DMM_VERSION="{version}"')
     if spec["eth_only"]:
         # Drop the WiFi components from the link, and tell our code to compile
         # out the WiFi paths (MM_ETH_ONLY → esp32/main/CMakeLists.txt).
@@ -378,6 +386,20 @@ def stale_feature_cache(build_dir: Path, extra: list[str]) -> str | None:
         if wanted != cached:
             return (f"{flag} {'set' if cached else 'unset'} in cache but "
                     f"firmware wants it {'set' if wanted else 'unset'}")
+    # Value flags (not just present/absent): MM_VERSION / MM_RELEASE carry a string
+    # that changes per build. CMake keeps the OLD cached value when the same dir is
+    # reused, so a changed --version would silently build the stale version (it's a
+    # compile-time define, like the feature flags above). Detect a value mismatch and
+    # force a clean reconfigure so the binary never lies about its version.
+    for flag in ("MM_VERSION", "MM_RELEASE"):
+        wanted = next((a[len(f"-D{flag}="):] for a in extra
+                       if a.startswith(f"-D{flag}=")), None)
+        if wanted is None:
+            continue  # not passed this build — leave the cache alone
+        m = re.search(rf"^{flag}:[^=]*=(.*)$", text, re.MULTILINE)
+        cached = m.group(1) if m else None
+        if cached is not None and cached != wanted:
+            return f"{flag} cached as {cached!r} but this build wants {wanted!r}"
     return None
 
 
@@ -406,6 +428,11 @@ def main():
                         help="Release-channel tag to burn into the binary as "
                              "MM_RELEASE (e.g. 'latest', 'v1.0.0'). Set by the "
                              "release workflow; omit for local builds.")
+    parser.add_argument("--version", default="",
+                        help="Override MM_VERSION with the pipeline-computed semver "
+                             "(see compute_version.py): core for a stable tag, "
+                             "'<core>-dev.<N>' for latest. Omit for local builds "
+                             "(library.json applies).")
     args = parser.parse_args()
 
     firmware = resolve_firmware(args)
@@ -459,9 +486,9 @@ def main():
     #   rm -rf build/esp32-esp32p4-eth-wifi && idf.py -B <dir> -DSDKCONFIG=<dir>/sdkconfig \
     #     -DSDKCONFIG_DEFAULTS="..." set-target esp32p4 && (same) build
     # but this wrapper does not yet reproduce it reliably — tracked in
-    # docs/backlog/backlog.md (ESP32-P4 round 3). Until fixed, build this variant
+    # docs/backlog/ (ESP32-P4 round 3). Until fixed, build this variant
     # with the manual sequence above.
-    extra = firmware_cmake_args(firmware, args.release)
+    extra = firmware_cmake_args(firmware, args.release, args.version)
 
     # Guard against a build dir configured for a different feature set (a stale
     # MM_NO_ETH / MM_ETH_ONLY in CMakeCache that a plain reconfigure won't clear).
diff --git a/scripts/build/compute_version.py b/scripts/build/compute_version.py
new file mode 100644
index 0000000..0dfc2da
--- /dev/null
+++ b/scripts/build/compute_version.py
@@ -0,0 +1,118 @@
+#!/usr/bin/env python3
+"""Compute the semver string a build should carry, per build type.
+
+`library.json` holds the in-development version with a `-dev` prerelease suffix
+(e.g. `2.1.0-dev`). That's right for a local build, but a *published* build needs
+a precise, comparable version:
+
+  - Stable release (a `vX.Y.Z` tag): the CORE semver, suffix dropped — `2.1.0`.
+    (The release ritual already bumps library.json to the core before tagging;
+    this just normalises in case the suffix lingers.)
+  - Moving `latest` build (every push to main): a MONOTONIC prerelease —
+    `<core>-dev.<N>` where N = commits since the last stable `vX.Y.Z` tag
+    (git-describe style). Successive `latest` builds get `…-dev.6`, `…-dev.7`, …
+    which semver §11 orders numerically, so a device can tell it's behind the
+    newest `latest`. Without N, every `latest` build claims the same version.
+
+N counts since the last `v*` tag specifically — NOT `git describe`'s nearest tag,
+which would pick the moving `latest` tag and give a meaningless count. With no
+`v*` tag yet, N falls back to the total commit count from the root.
+
+The same string is burned into the binary (-DMM_VERSION), the release asset names
+(firmware-<F>-v<V>.bin), and the ESP Web Tools manifest, so all three agree.
+
+Usage:
+  compute_version.py --tag latest              # auto → latest → <core>-dev.<N>, e.g. 2.1.0-dev.6
+  compute_version.py --tag v2.1.0              # auto → stable → core, e.g. 2.1.0
+  compute_version.py --tag v2.1.0-rc1          # auto → stable → the RC semver, e.g. 2.1.0-rc1
+  compute_version.py --channel local           # library.json verbatim, e.g. 2.1.0-dev
+
+The release workflow passes only `--tag`; the channel is derived from it (the one
+place that mapping lives), so the build and release jobs can't disagree.
+"""
+
+import argparse
+import json
+import subprocess
+import sys
+from pathlib import Path
+
+ROOT = Path(__file__).resolve().parent.parent.parent
+LIBRARY_JSON = ROOT / "library.json"
+
+
+def core_version(version: str) -> str:
+    """Return the MAJOR.MINOR.PATCH core: the text before the first `-` or `+`."""
+    return version.partition("-")[0].partition("+")[0]
+
+
+def commits_since_last_stable() -> int:
+    """Commits since the last stable `vX.Y.Z` tag (skips `latest` and `vX.Y.Z-rcN` tags).
+
+    Falls back to the total commit count when no stable `v*` tag exists yet.
+    """
+    try:
+        last = subprocess.run(  # --exclude: a prerelease tag must not restart the -dev.<N> count
+            ["git", "describe", "--tags", "--abbrev=0", "--match", "v*", "--exclude", "v*-*"],
+            cwd=ROOT, capture_output=True, text=True, check=True,
+        ).stdout.strip()
+        rng = f"{last}..HEAD"
+    except subprocess.CalledProcessError:
+        rng = "HEAD"  # no stable v* tag reachable — count from the root
+    out = subprocess.run(
+        ["git", "rev-list", "--count", rng],
+        cwd=ROOT, capture_output=True, text=True, check=True,
+    ).stdout.strip()
+    return int(out)
+
+
+def channel_for_tag(tag: str) -> str:
+    """Map a release tag to its build channel — the one place that mapping is defined.
+
+    Exactly `latest` is the moving prerelease channel; any other tag (or none) is stable.
+    """
+    if tag == "latest":
+        return "latest"
+    return "stable"
+
+
+def compute(channel: str, tag: str = "") -> str:
+    """Return the version string for `channel`, based on library.json's `version`.
+
+    stable → the tag's own semver when it has a prerelease part (`v2.1.0-rc1` →
+    `2.1.0-rc1`, so an RC never claims to be the final release), else the core;
+    latest → `<core>-dev.<N>`; any other channel → library.json verbatim.
+    """
+    in_tree = json.loads(LIBRARY_JSON.read_text(encoding="utf-8"))["version"]
+    base = core_version(in_tree)
+    if channel == "latest":
+        return f"{base}-dev.{commits_since_last_stable()}"
+    if channel != "stable":
+        return in_tree  # local: library.json verbatim
+    # Drop the leading v; a prerelease identifier (rc, beta, …) is carried through.
+    bare = tag[1:] if tag.startswith("v") else tag
+    return bare if "-" in bare else base
+
+
+def main() -> int:
+    """Print the version for --channel/--tag on stdout; returns the exit status (0)."""
+    parser = argparse.ArgumentParser(
+        description=__doc__, formatter_class=argparse.RawDescriptionHelpFormatter)
+    parser.add_argument(
+        "--channel", choices=["stable", "latest", "local", "auto"], default="auto",
+        help="auto (default) → derive from --tag (latest tag → latest, else stable); "
+             "stable → core semver (or the tag's prerelease semver for an -rc tag); "
+             "latest → <core>-dev.<N>; local → library.json verbatim")
+    parser.add_argument(
+        "--tag", default="",
+        help="The release tag (e.g. latest, v2.1.0, v2.1.0-rc1). With --channel auto it "
+             "selects the channel; for a prerelease tag on the stable channel, its semver "
+             "is used verbatim instead of the core.")
+    args = parser.parse_args()
+    channel = channel_for_tag(args.tag) if args.channel == "auto" else args.channel
+    print(compute(channel, args.tag))
+    return 0
+
+
+if __name__ == "__main__":
+    sys.exit(main())
diff --git a/scripts/build/generate_build_info.py b/scripts/build/generate_build_info.py
index 5eb15de..a627950 100644
--- a/scripts/build/generate_build_info.py
+++ b/scripts/build/generate_build_info.py
@@ -4,7 +4,12 @@
 Writes a single header carrying every compile-time identity fact the runtime
 exposes through SystemModule:
 
-  MM_VERSION       — semver, from library.json. Auto-generated section.
+  MM_VERSION       — semver. Defaults to library.json (local/dev builds), but
+                     the release pipeline overrides it with a -D flag (same
+                     mechanism as MM_RELEASE / MM_FIRMWARE_NAME) so a published
+                     build carries a precise version: the core semver for a
+                     stable release, or a monotonic `<core>-dev.<N>` for a
+                     moving `latest` build (see scripts/build/compute_version.py).
   MM_BUILD_DATE    — __DATE__ " " __TIME__, evaluated by the compiler.
   MM_FIRMWARE_NAME — set by the build system as a -D flag (see
                      scripts/build/build_esp32.py firmware_cmake_args() and
@@ -38,7 +43,14 @@
 // Auto-generated from library.json by scripts/build/generate_build_info.py
 // -- do not edit by hand. Regenerated when library.json changes.
 
+// MM_VERSION defaults to the in-tree library.json semver, but the release
+// pipeline overrides it with -DMM_VERSION="<computed>" (compute_version.py):
+// the core semver for a stable tag, or `<core>-dev.<N>` for a moving `latest`
+// build so successive latest builds are orderable. #ifndef so a local build
+// needs no flag.
+#ifndef MM_VERSION
 #define MM_VERSION    "{version}"
+#endif
 #define MM_BUILD_DATE __DATE__ " " __TIME__
 
 // Compile-time identity from build flags. The build script that knows the
diff --git a/scripts/build/setup_esp_idf.py b/scripts/build/setup_esp_idf.py
index b580f65..cbf34d0 100644
--- a/scripts/build/setup_esp_idf.py
+++ b/scripts/build/setup_esp_idf.py
@@ -20,7 +20,7 @@
 # the clone), but it warns loudly when the installed IDF differs — a silent
 # `git pull` or a fresh shallow clone landing on a newer dev-branch commit is
 # exactly what turns a green build red with no code change (see
-# docs/backlog/backlog.md "ESP-IDF version pinning"). To pin: in ~/esp/esp-idf,
+# docs/backlog/, "ESP-IDF version pinning"). To pin: in ~/esp/esp-idf,
 # `git fetch && git checkout <commit>`. Migrating off this dev snapshot to a
 # stable tag (v6.1 lands 2026-07-31) is a deliberate re-test pass, not a pull.
 PINNED_IDF_COMMIT = "d1b91b79b5ff12d9d4b21fe1cf5406ab6044b8ff"
diff --git a/scripts/build/verify_version.py b/scripts/build/verify_version.py
index f31cc2d..9151010 100644
--- a/scripts/build/verify_version.py
+++ b/scripts/build/verify_version.py
@@ -8,9 +8,16 @@
 Tag → version mapping: strip a leading 'v'. Both `v1.0.0` and `1.0.0` are
 accepted as the tag, but the in-tree version is the bare semver.
 
-The `latest` tag is a moving prerelease published on every merge to main,
-not a semver release — library.json keeps the last real release's version.
-The script accepts it and skips the equality check.
+Release ritual (develop-on-a-prerelease, the standard semver flow): between
+releases, library.json carries the NEXT version with a `-dev` prerelease suffix
+(e.g. `2.1.0-dev`), so a moving/`latest` build self-reports a clean prerelease
+semver. Cutting the stable release drops the suffix: tag `v2.1.0` releases what
+was `2.1.0-dev`. So the check compares the tag's semver to library.json's CORE
+version (the part before any `-prerelease` suffix) — `v2.1.0` ↔ `2.1.0-dev`
+passes (same core), while a wrong core like `v2.2.0` ↔ `2.1.0-dev` still fails.
+
+The `latest` tag is the moving prerelease channel published on every merge to
+main, not a semver release — the script accepts it and skips the equality check.
 
 Inputs:
   GITHUB_REF_NAME  — the tag, set by GitHub Actions on a `push: tags` event
@@ -59,11 +66,17 @@ def main() -> int:
         print(f"verify_version: 'version' missing from {LIBRARY_JSON}.")
         return 2
 
-    if tag_version != in_tree:
+    # Compare the CORE semver (drop any `-prerelease` / `+build` suffix from the
+    # in-tree version) so the release ritual works: cutting `v2.1.0` releases the
+    # in-development `2.1.0-dev`. A mismatched core (e.g. `v2.2.0` vs `2.1.0-dev`)
+    # still fails. The tag itself is a real release, so it carries no suffix.
+    in_tree_core = in_tree.split("-")[0].split("+")[0]
+    if tag_version != in_tree_core:
         print(
-            f"verify_version: tag '{tag}' (version {tag_version}) "
-            f"does not match library.json version '{in_tree}'.\n"
-            f"Bump library.json to {tag_version}, commit, retag, push."
+            f"verify_version: tag '{tag}' (version {tag_version}) does not match "
+            f"library.json core version '{in_tree_core}' (from '{in_tree}').\n"
+            f"To release, set library.json version to {tag_version} (drop the "
+            f"-dev suffix), commit, retag, push."
         )
         return 1
 
diff --git a/src/core/Control.h b/src/core/Control.h
index d7249e0..df1558b 100644
--- a/src/core/Control.h
+++ b/src/core/Control.h
@@ -81,9 +81,8 @@ enum class ControlType : uint8_t {
     Uint8,
     Uint16,
     Int16,      // signed 16-bit. For coordinate-style controls where negative
-                // values are legal — e.g. a Layer's start/end dragged out of the
-                // visible area by a future modifier. (The light domain's grid
-                // coordinate type is int16 for this reason.)
+                // values are legal. (The light domain's grid coordinate type is
+                // int16 for this reason.)
     Pin,        // a GPIO number (int8_t storage, -1 = unused/default). Distinct
                 // from Int16 so the UI renders a plain number input, not a slider:
                 // a GPIO has no meaningful range to drag, and pins span 0..~52
diff --git a/src/core/FirmwareUpdateModule.h b/src/core/FirmwareUpdateModule.h
index e6063f7..4728c0b 100644
--- a/src/core/FirmwareUpdateModule.h
+++ b/src/core/FirmwareUpdateModule.h
@@ -58,17 +58,19 @@ class FirmwareUpdateModule : public MoonModule {
         // first WS state push surfaces a coherent "idle" / 0 pair.
         std::strncpy(statusStr_, g_otaStatus, sizeof(statusStr_) - 1);
         statusStr_[sizeof(statusStr_) - 1] = '\0';
+        publishStatus();
         bytesRead_ = g_otaBytesRead;
         totalSnap_ = g_otaBytesTotal;
 
-        // Firmware identity (static for this build). version = semver + release channel when the
-        // pipeline burned one in ("1.0.0-rc2 (latest)"); kRelease is "" on local/dev builds, where
-        // we show the bare semver (build_info.h's MM_VERSION vs MM_RELEASE split).
-        if (kRelease[0] != 0) {
-            std::snprintf(versionStr_, sizeof(versionStr_), "%s (%s)", kVersion, kRelease);
-        } else {
-            std::snprintf(versionStr_, sizeof(versionStr_), "%s", kVersion);
-        }
+        // Firmware identity (static for this build). version is PURE SEMVER (kVersion: library.json
+        // or the pipeline's MM_VERSION): "2.0.0" on a stable release, or a prerelease like "2.1.0-dev.7" on a
+        // moving/dev build (semver.org §9 — the prerelease suffix is how a not-yet-released build is
+        // expressed). The release channel is derivable from the version itself (a prerelease suffix
+        // means "not a stable release"), so it is NOT mixed into the string; kRelease stays the
+        // separate build-channel tag (which git tag this binary shipped under) without polluting the
+        // machine-comparable version. This keeps `version` a clean semver the UI's update check can
+        // compare against the newest GitHub release.
+        std::snprintf(versionStr_, sizeof(versionStr_), "%s", kVersion);
         std::snprintf(buildStr_, sizeof(buildStr_), "%s", kBuildDate);
         std::snprintf(firmwareStr_, sizeof(firmwareStr_), "%s", kFirmwareName);
     }
@@ -85,7 +87,11 @@ class FirmwareUpdateModule : public MoonModule {
             controls_.addProgress("firmwarePartition", firmwareSizeVal_, totalFlashVal_);
         }
 
-        controls_.addReadOnly("update_status", statusStr_, sizeof(statusStr_));
+        // OTA status goes through MoonModule::setStatus() (the per-module status
+        // slot every module shares), not a bespoke read-only control — same
+        // choice DevicesModule made. The error-prefixed states map to
+        // Severity::Error; everything else is neutral. See publishStatus().
+        //
         // Total is captured by value into the descriptor's `aux`; we re-bind
         // (via markDirty → HttpServerModule rebuildControls) when totalSnap_
         // changes. Initially 0; the UI shows "0KB / 0KB" until esp_https_ota
@@ -99,6 +105,7 @@ class FirmwareUpdateModule : public MoonModule {
         // read shows as a brief mid-update glimpse — visually harmless.
         std::strncpy(statusStr_, g_otaStatus, sizeof(statusStr_) - 1);
         statusStr_[sizeof(statusStr_) - 1] = '\0';
+        publishStatus();
         bytesRead_ = g_otaBytesRead;
         // Re-bind on total transition. Only fires once per OTA (and once on
         // any later OTA the user starts — we deliberately don't reset the
@@ -112,12 +119,28 @@ class FirmwareUpdateModule : public MoonModule {
         }
     }
 
+    // Point the shared status slot at our owned buffer, choosing the severity
+    // from the status text: the platform OTA task prefixes every failure with
+    // "error: " (see platform_esp32_ota.cpp); the gate below matches its first
+    // 6 chars ("error:", no trailing space). "idle" is the quiescent state and
+    // reads better as no banner than as an info banner, so it clears the slot.
+    // setStatus doesn't copy — statusStr_ outlives every call, so the pointer stays valid.
+    void publishStatus() {
+        if (std::strcmp(statusStr_, "idle") == 0) {
+            clearStatus();
+        } else {
+            setStatus(statusStr_,
+                      std::strncmp(statusStr_, "error:", 6) == 0 ? Severity::Error
+                                                                 : Severity::Status);
+        }
+    }
+
 private:
     char     statusStr_[64] = "idle";
     uint32_t bytesRead_     = 0;
     uint32_t totalSnap_     = 0;
     // Firmware identity (static for this build) + the running app-partition usage.
-    char     versionStr_[32] = {};   // semver + " (channel)" — e.g. "1.0.0-rc2 (latest)"
+    char     versionStr_[32] = {};   // pure semver — e.g. "2.0.0" or "2.1.0-dev.7"
     char     buildStr_[24]   = {};
     char     firmwareStr_[24] = {};  // build variant name, e.g. "esp32s3-n16r8"
     uint32_t firmwareSizeVal_ = 0;   // bytes used in the app partition
diff --git a/src/core/HttpServerModule.cpp b/src/core/HttpServerModule.cpp
index cd7e3d8..3d95d9d 100644
--- a/src/core/HttpServerModule.cpp
+++ b/src/core/HttpServerModule.cpp
@@ -129,6 +129,7 @@ void HttpServerModule::handleConnection(platform::TcpConnection& conn) {
         if (std::strcmp(path, "/") == 0) serveFile(conn, "index.html", "text/html");
         else if (std::strcmp(path, "/app.js") == 0) serveFile(conn, "app.js", "application/javascript");
         else if (std::strcmp(path, "/install-picker.js") == 0) serveFile(conn, "install-picker.js", "application/javascript");
+        else if (std::strcmp(path, "/semver.js") == 0) serveFile(conn, "semver.js", "application/javascript");
         else if (std::strcmp(path, "/preview3d.js") == 0) serveFile(conn, "preview3d.js", "application/javascript");
         else if (std::strcmp(path, "/style.css") == 0) serveFile(conn, "style.css", "text/css");
         else if (std::strcmp(path, "/moonlight-logo.png") == 0) serveFile(conn, "moonlight-logo.png", "image/png");
@@ -300,6 +301,7 @@ void HttpServerModule::serveFile(platform::TcpConnection& conn, const char* file
     if (std::strcmp(filename, "index.html") == 0) { data = ui::indexHtml; dataLen = ui::indexHtmlLen; gzipped = true; }
     else if (std::strcmp(filename, "app.js") == 0) { data = ui::appJs; dataLen = ui::appJsLen; gzipped = true; }
     else if (std::strcmp(filename, "install-picker.js") == 0) { data = ui::installPickerJs; dataLen = ui::installPickerJsLen; gzipped = true; }
+    else if (std::strcmp(filename, "semver.js") == 0) { data = ui::semverJs; dataLen = ui::semverJsLen; gzipped = true; }
     else if (std::strcmp(filename, "preview3d.js") == 0) { data = ui::preview3dJs; dataLen = ui::preview3dJsLen; gzipped = true; }
     else if (std::strcmp(filename, "style.css") == 0) { data = ui::styleCss; dataLen = ui::styleCssLen; gzipped = true; }
     else if (std::strcmp(filename, "moonlight-logo.png") == 0) { data = ui::logoPng; dataLen = ui::logoPngLen; }
diff --git a/src/light/drivers/Drivers.h b/src/light/drivers/Drivers.h
index 36c0b1f..5709039 100644
--- a/src/light/drivers/Drivers.h
+++ b/src/light/drivers/Drivers.h
@@ -161,18 +161,30 @@ class Drivers : public MoonModule {
         // was cleared and rebuilt via the API is picked up here (self-healing).
         // setLayer() pins a Layer directly and leaves layers_ null — skip then.
         if (layers_) layer_ = layers_->activeLayer();
-        // Output buffer needed if any layer has a LUT (currently single layer).
-        // Multi-layer: check all layers, allocate if at least one has a LUT.
-        // If allocation fails (no contiguous heap large enough — a real risk on
-        // ESP32 without PSRAM when the Layer pipeline has fragmented DRAM),
-        // outputBuffer_ stays with data_=nullptr. loop() must check that before
-        // calling blendMap, otherwise blendMap will dereference a null
-        // outputBuffer_.data() and panic with LoadProhibited. Same defensive
-        // pattern Layer::allocateBuffer uses for its pixel buffer.
-        if (layer_ && layer_->lut().hasLUT()) {
-            if (!outputBuffer_.allocate(layer_->physicalLightCount(), layer_->channelsPerLight())) {
+        // The output (composition) buffer is needed when we must blend into a
+        // physical-space buffer rather than hand a driver a Layer's logical buffer
+        // directly: whenever ≥2 layers composite, OR a single layer has a LUT
+        // (logical≠physical). A lone no-LUT layer needs no output buffer (drivers
+        // read its buffer directly — the zero-copy fast path).
+        // If allocation fails (no contiguous heap — a real risk on no-PSRAM ESP32
+        // with fragmented DRAM), outputBuffer_ stays data_=nullptr; loop() checks
+        // that before blending (else a null deref panics — same defensive pattern
+        // Layer::allocateBuffer uses). Sized from the first enabled layer (`out`):
+        // every layer composites into the same physical space, so its
+        // physicalLightCount() / channelsPerLight() is the composite extent.
+        // Output selection keys off an *enabled* source layer, never the disabled
+        // fallback activeLayer() may return (which exists only so geometry stays
+        // queryable while every layer is toggled off). With no enabled layer there
+        // is nothing to emit, so no output buffer — drivers go idle (see
+        // passBufferToDrivers). A pinned setLayer() (layers_ null) is always treated
+        // as the live source.
+        Layer* const out = layers_ ? layers_->firstEnabledLayer() : layer_;
+        const uint8_t enabled = layers_ ? layers_->enabledLayerCount() : (layer_ ? 1 : 0);
+        const bool needOutput = out && (enabled > 1 || out->lut().hasLUT());
+        if (needOutput) {
+            if (!outputBuffer_.allocate(out->physicalLightCount(), out->channelsPerLight())) {
                 std::printf("  DEGRADE  Drivers::outputBuffer_ allocate failed for %u lights\n",
-                            static_cast<unsigned>(layer_->physicalLightCount()));
+                            static_cast<unsigned>(out->physicalLightCount()));
                 outputBuffer_.free();   // leaves data_=nullptr, bytes()=0
             }
         } else {
@@ -184,15 +196,39 @@ class Drivers : public MoonModule {
     }
 
     void loop() override {
-        // outputBuffer_.data() can be null if onBuildState failed to claim
-        // a contiguous block (heap fragmentation). Skip the blend in that case
-        // — drivers run on raw Layer buffer or simply have nothing to send.
-        if (layer_ && layer_->lut().hasLUT() && outputBuffer_.data()) {
-            blendMap(layer_->buffer(), outputBuffer_, layer_->lut(), layer_->channelsPerLight());
+        // Composite into outputBuffer_ when one is allocated (≥2 enabled layers,
+        // or a single layer with a LUT — see onBuildState). A null data_ means
+        // onBuildState couldn't claim a block (heap fragmentation): skip the blend;
+        // drivers then read the raw Layer buffer / send nothing.
+        if (outputBuffer_.data() && layers_ && layers_->enabledLayerCount() > 1) {
+            // Multi-layer composite: blend each enabled layer in container order.
+            // The first (bottom) layer clears + overwrites; each subsequent layer
+            // blends onto the accumulated frame per its own blendMode + opacity.
+            // blendMap resolves the op/opacity branch once per layer (a tight
+            // specialized loop each — no-LUT layers blend 1:1, LUT layers map),
+            // and a full-opacity additive/overwrite layer pays no alpha math, so
+            // cost scales with enabled-layer count only.
+            layers_->forEachEnabledLayer([&](Layer* L, bool first) {
+                BlendOp op = first ? BlendOp::Overwrite : L->blendOp();
+                uint8_t op_opacity = first ? 255 : L->opacity;
+                blendMap(L->buffer(), outputBuffer_, L->lut(), L->channelsPerLight(),
+                         op, op_opacity, /*clearFirst=*/first);
+            });
+        } else if (Layer* out = layers_ ? layers_->firstEnabledLayer() : layer_;
+                   outputBuffer_.data() && out && out->lut().hasLUT()) {
+            // Single layer with a LUT (the only enabled one, or a pinned setLayer):
+            // map its logical buffer into physical space. The original fast path.
+            // `out` is the enabled source, never activeLayer()'s disabled fallback;
+            // the outputBuffer_.data() guard already excludes the all-disabled case
+            // (needOutput is false then), this keeps the source choice explicit.
+            blendMap(out->buffer(), outputBuffer_, out->lut(), out->channelsPerLight());
         }
-        // Option A: parent work first (blendMap), then chain to base to tick
-        // children on the freshly-blended buffer. Per-child enabled gating and
-        // timing accumulation live in MoonModule::tickChildren.
+        // (A lone enabled no-LUT layer skips the above — drivers read its logical
+        // buffer directly, the zero-copy path set in passBufferToDrivers.)
+        //
+        // Option A: parent work first (blend), then chain to base to tick children
+        // on the freshly-composited buffer. Per-child enabled gating + timing live
+        // in MoonModule::tickChildren.
         MoonModule::loop();
     }
 
@@ -209,12 +245,28 @@ class Drivers : public MoonModule {
         // dangling layer_ pointing at the freed Layer — PreviewDriver then read
         // layer_->layouts() on freed memory and crashed (LoadProhibited). A
         // driver with a null layer/buffer is a well-defined idle state.
-        Buffer* buf = layer_ ? (layer_->lut().hasLUT() ? &outputBuffer_ : &layer_->buffer())
-                             : nullptr;
+        // Drivers read the composed outputBuffer_ when we composite (≥2 enabled
+        // layers) or when the single layer needs a LUT map; otherwise the lone
+        // no-LUT layer's buffer is handed directly (zero-copy fast path). Mirrors
+        // the same decision loop() makes (outputBuffer_ is allocated iff this).
+        // The source is the first *enabled* layer, never the disabled fallback
+        // activeLayer() returns when all layers are off — with no enabled layer
+        // buf stays null and every driver idles (its last frame is not re-sent).
+        // A pinned setLayer() (layers_ null) is always the live source.
+        Layer* const out = layers_ ? layers_->firstEnabledLayer() : layer_;
+        const bool composing = layers_ && layers_->enabledLayerCount() > 1;
+        Buffer* buf = out ? ((composing || out->lut().hasLUT()) ? &outputBuffer_
+                                                               : &out->buffer())
+                          : nullptr;
         for (uint8_t i = 0; i < childCount(); i++) {
             auto* drv = static_cast<DriverBase*>(child(i));
             drv->setSourceBuffer(buf);
-            drv->setLayer(layer_);  // null when no active Layer; drivers must tolerate it
+            // Geometry uses layer_ (activeLayer()'s fallback — valid even when every
+            // layer is disabled) so a PreviewDriver keeps its width/height/depth and
+            // coordinate table; buf above uses the enabled source only, so output
+            // still idles (no stale frame) when nothing is enabled. layer_ is null
+            // only when no Layer is registered at all (the documented idle state).
+            drv->setLayer(layer_);
             drv->setCorrection(&correction_);  // physical drivers apply it; Preview ignores
         }
     }
diff --git a/src/light/layers/BlendMap.h b/src/light/layers/BlendMap.h
index a342435..0dee148 100644
--- a/src/light/layers/BlendMap.h
+++ b/src/light/layers/BlendMap.h
@@ -7,27 +7,76 @@
 
 namespace mm {
 
-// Reads from logical buffer (src), writes to physical buffer (dst) via LUT.
-// Two paths chosen by MappingLUT::overwrites(): when true (every current
-// layout/modifier — each physical light written at most once), it overwrite-
-// copies src→dst (fast, no read-back); when false, it additively blends with
-// clamping (for multi-layer composition where sources overlap on a destination).
-// Either way dst is cleared first so physical cells with no source stay black.
-inline void blendMap(const Buffer& src, Buffer& dst, const MappingLUT& lut, uint8_t channelsPerLight) {
+// How a layer's pixels combine into the destination during composition.
+//   Overwrite — dst = src (replace; the first/bottom layer, fastest)
+//   Alpha     — dst = (src*opacity + dst*(255-opacity)) / 255  (opacity-weighted over)
+//   Additive  — dst = clamp(dst + src*opacity/255)      (adds light, never dims)
+enum class BlendOp : uint8_t { Overwrite, Alpha, Additive };
+
+// Fast 8-bit "divide by 255" via the (x + (x>>8) + 1) >> 8 trick — no real divide on the
+// hot path. Equals floor(x/255) for x in 0..65025 (255*255), the most any blend feeds it.
+inline uint8_t div255(uint16_t x) { return static_cast<uint8_t>((x + (x >> 8) + 1) >> 8); }
+
+// Reads from logical buffer (src), writes/blends to physical buffer (dst) via LUT.
+//
+// `op` + `opacity` decide how each light combines into dst; `clearFirst` clears dst
+// first on the LUT path only (bottom layer of a composite — physical cells with no
+// source stay black; later layers blend ONTO the accumulated frame). The no-LUT identity
+// path never clears; it touches only min(src, dst) bytes. A single layer uses the defaults
+// (op=Overwrite, opacity=255, clearFirst=true): the pre-composition fast path (memcpy / copy).
+//
+// The op/opacity branch is resolved ONCE here, before the per-light loop, so each
+// path is a tight specialized loop with no per-pixel mode check (hot-path rule).
+inline void blendMap(const Buffer& src, Buffer& dst, const MappingLUT& lut,
+                     uint8_t channelsPerLight,
+                     BlendOp op = BlendOp::Overwrite, uint8_t opacity = 255,
+                     bool clearFirst = true) {
+    // No LUT = identity map (dense grid, logical index == physical index — the
+    // common case). Blend 1:1, src byte i → dst byte i, no LUT lookup. The
+    // first/bottom full-opacity overwrite is a plain memcpy (the fast path);
+    // a composited layer above it blends per op/opacity straight over dst.
     if (!lut.hasLUT()) {
-        std::memcpy(dst.data(), src.data(), src.bytes());
+        const size_t n = src.bytes() < dst.bytes() ? src.bytes() : dst.bytes();
+        const uint8_t* s = src.data();
+        uint8_t* d = dst.data();
+        if (op == BlendOp::Overwrite && opacity == 255) {
+            std::memcpy(d, s, n);
+            return;
+        }
+        const bool full = (opacity == 255);
+        if (op == BlendOp::Additive) {
+            for (size_t i = 0; i < n; i++) {
+                uint16_t sv = full ? s[i] : div255(static_cast<uint16_t>(s[i]) * opacity);
+                uint16_t sum = static_cast<uint16_t>(d[i]) + sv;
+                d[i] = sum > 255 ? 255 : static_cast<uint8_t>(sum);
+            }
+        } else {  // Alpha (over)
+            const uint16_t inv = static_cast<uint16_t>(255 - opacity);
+            for (size_t i = 0; i < n; i++) {
+                d[i] = full ? s[i]
+                            : div255(static_cast<uint16_t>(s[i]) * opacity +
+                                     static_cast<uint16_t>(d[i]) * inv);
+            }
+        }
         return;
     }
 
-    // Clear first so physical cells with no source (sparse layouts — a sphere's
-    // lattice gaps) stay black.
-    dst.clear();
-    nrOfLightsType logCount = lut.logicalCount();
+    if (clearFirst) dst.clear();   // bottom layer: cells with no source stay black
+    const nrOfLightsType logCount = lut.logicalCount();
+    const bool full = (opacity == 255);
 
-    if (lut.overwrites()) {
-        // Each destination is written by at most one source (mirror, shuffle,
-        // sparse box→driver), so plain-copy — no read-back, no clamp. This is
-        // ~4× the additive path and is the case every current layout takes.
+    // Overwrite is the default op (single layer / bottom of a composite). It
+    // defers to the LUT's own overwrites() flag: a mapping where each physical
+    // cell is written once (mirror, shuffle, sparse box→driver) plain-copies;
+    // a mapping that folds several logical lights onto one physical cell
+    // (overwrites()=false) additively accumulates *within the layer* with clamp.
+    // (Cross-layer Additive/Alpha are the explicit ops below.) So a full-opacity
+    // Overwrite on a non-overwriting LUT routes to the additive accumulate path.
+    const bool effectiveAdditive = (op == BlendOp::Additive) ||
+                                   (op == BlendOp::Overwrite && !lut.overwrites());
+
+    // --- Plain overwrite (replace) — single-write LUT; copy, no read-back. ---
+    if (op == BlendOp::Overwrite && full && lut.overwrites()) {
         for (nrOfLightsType li = 0; li < logCount; li++) {
             const uint8_t* srcLight = src.data() + static_cast<size_t>(li) * channelsPerLight;
             lut.forEachDestination(li, [&](nrOfLightsType physIdx) {
@@ -38,15 +87,32 @@ inline void blendMap(const Buffer& src, Buffer& dst, const MappingLUT& lut, uint
         return;
     }
 
-    // Additive blend with clamping — for a map that folds multiple sources onto
-    // one destination (e.g. future multi-layer compositing).
+    // --- Additive with clamp; opacity scales the source. full-opacity skips the scale. ---
+    if (effectiveAdditive) {
+        for (nrOfLightsType li = 0; li < logCount; li++) {
+            const uint8_t* srcLight = src.data() + static_cast<size_t>(li) * channelsPerLight;
+            lut.forEachDestination(li, [&](nrOfLightsType physIdx) {
+                uint8_t* dstLight = dst.data() + static_cast<size_t>(physIdx) * channelsPerLight;
+                for (uint8_t c = 0; c < channelsPerLight; c++) {
+                    uint16_t s = full ? srcLight[c] : div255(static_cast<uint16_t>(srcLight[c]) * opacity);
+                    uint16_t sum = static_cast<uint16_t>(dstLight[c]) + s;
+                    dstLight[c] = sum > 255 ? 255 : static_cast<uint8_t>(sum);
+                }
+            });
+        }
+        return;
+    }
+
+    // --- Alpha (over): dst = src*α + dst*(255-α). full-opacity collapses to overwrite. ---
+    const uint16_t inv = static_cast<uint16_t>(255 - opacity);
     for (nrOfLightsType li = 0; li < logCount; li++) {
         const uint8_t* srcLight = src.data() + static_cast<size_t>(li) * channelsPerLight;
         lut.forEachDestination(li, [&](nrOfLightsType physIdx) {
             uint8_t* dstLight = dst.data() + static_cast<size_t>(physIdx) * channelsPerLight;
             for (uint8_t c = 0; c < channelsPerLight; c++) {
-                uint16_t sum = static_cast<uint16_t>(dstLight[c]) + srcLight[c];
-                dstLight[c] = sum > 255 ? 255 : static_cast<uint8_t>(sum);
+                if (full) { dstLight[c] = srcLight[c]; continue; }
+                dstLight[c] = div255(static_cast<uint16_t>(srcLight[c]) * opacity +
+                                     static_cast<uint16_t>(dstLight[c]) * inv);
             }
         });
     }
diff --git a/src/light/layers/Layer.h b/src/light/layers/Layer.h
index a0bf056..68b5c2d 100644
--- a/src/light/layers/Layer.h
+++ b/src/light/layers/Layer.h
@@ -4,6 +4,7 @@
 #include "light/layouts/Layouts.h"
 #include "light/effects/EffectBase.h"
 #include "light/layers/MappingLUT.h"
+#include "light/layers/BlendMap.h"   // BlendOp, for blendOp()
 #include "light/modifiers/ModifierBase.h"
 #include "platform/platform.h"
 
@@ -17,49 +18,33 @@ class Layer : public MoonModule {
     ModuleRole role() const override { return ModuleRole::Layer; }
     const char* acceptsChildRoles() const override { return "effect,modifier"; }
 
-    // start/end carve a region of the shared Layouts into this Layer's buffer,
-    // expressed as **percentages of the physical extent on each axis**.
-    // `start = 0, end = 100` is the full layout — the defaults below — and is
-    // byte-identical to the pre-Layers pipeline. Percentages are resilient to
-    // physical layout changes: a `startX = 25` Layer stays at the same
-    // relative position when the panel resizes from 64×64 to 128×128, rather
-    // than ending up at the wrong absolute pixel.
-    //
-    // Negative values and values > 100 are legal: a future modifier could drag
-    // a Layer in or out of the visible area by shifting start/end past 0% or
-    // 100% (e.g. `startX = -50` means the Layer extends 50% off the left edge
-    // of the layout). ControlType::Int16 is the wire type so negative values
-    // round-trip correctly through /api/state, /api/types, and persistence.
-    // `lengthType` (int16_t) is reused so the type matches width/height/depth
-    // — the *semantics* (percent vs pixel) live in the field name and spec.
-    //
-    // Spec: docs/architecture.md § Layers and Layer.
-    // NOTE: start/end are not yet read in onBuildState/rebuildLUT — they don't
-    // affect the buffer size today, so Layer doesn't override controlChangeTriggersBuildState.
-    // When they become functional (carving a sub-region → different buffer size), add
-    // `bool controlChangeTriggersBuildState(const char*) const override { return true; }` so a
-    // start/end change triggers the pipeline rebuild.
-    lengthType startX = 0;
-    lengthType startY = 0;
-    lengthType startZ = 0;
-    lengthType endX = 100;
-    lengthType endY = 100;
-    lengthType endZ = 100;
+
+    // Composition parameters — INERT on the Layer (it never reads them; a Layer
+    // can't know its position in the stack or what's beneath it). The Drivers
+    // container reads each enabled Layer's blendMode + opacity and composites the
+    // layers in container order into the physical buffer (see Drivers::loop). The
+    // value lives here so it travels with the Layer through add/delete/reorder —
+    // no separate, sync-prone blend list on Drivers. The bottom (first-composited)
+    // layer's blendMode is moot: it fills the cleared buffer regardless.
+    uint8_t blendMode = 0;     // index into kBlendModeOptions; 0 = alpha (over)
+    uint8_t opacity = 255;     // 0 = invisible, 255 = full
 
     void onBuildControls() override {
-        // Names match the field names; the percent semantic lives in the spec
-        // (Layer.md § start/end controls) and is reflected in the comment above.
-        controls_.addInt16("startX", startX);
-        controls_.addInt16("startY", startY);
-        controls_.addInt16("startZ", startZ);
-        controls_.addInt16("endX",   endX);
-        controls_.addInt16("endY",   endY);
-        controls_.addInt16("endZ",   endZ);
+        static constexpr const char* kBlendModeOptions[] = {"alpha", "additive"};
+        controls_.addSelect("blendMode", blendMode, kBlendModeOptions, 2);
+        controls_.addUint8("opacity", opacity, 0, 255);
         // Cascade to children (effects and modifiers) — preserves the default
         // base behaviour we just overrode.
         MoonModule::onBuildControls();
     }
 
+    // How this Layer composites when stacked above another (read by Drivers).
+    // Maps the blendMode select index to the BlendMap op. Index order must match
+    // kBlendModeOptions above.
+    BlendOp blendOp() const {
+        return blendMode == 1 ? BlendOp::Additive : BlendOp::Alpha;
+    }
+
     void setLayouts(Layouts* lg) { layouts_ = lg; }
     // The active Layouts, for consumers that need per-light coordinates (e.g.
     // PreviewDriver builds its coordinate table from layouts()->forEachCoord).
diff --git a/src/light/layers/Layers.h b/src/light/layers/Layers.h
index 92420b0..528f759 100644
--- a/src/light/layers/Layers.h
+++ b/src/light/layers/Layers.h
@@ -9,12 +9,13 @@ namespace mm {
 
 // Top-level container for one or more `Layer` children. Each child Layer
 // renders into its own buffer using the shared `Layouts` instance for physical
-// topology. `Drivers` composes the resulting buffers (today's "first wins"
-// placeholder, alpha-blend / additive in the composition follow-up).
+// topology. `Drivers` composites the resulting buffers in container order
+// (bottom→top) per each Layer's blendMode + opacity.
 //
 // With one child Layer this is a thin pass-through: loop() runs the child
-// Layer's loop() in order; behaviour matches the previous single-Layer
-// pipeline byte-for-byte. The container itself owns no buffer.
+// Layer's loop() in order; behaviour matches the single-Layer pipeline
+// byte-for-byte (Drivers takes its single-layer fast path). The container
+// itself owns no buffer — the composite buffer lives in Drivers.
 class Layers : public MoonModule {
 public:
     const char* acceptsChildRoles() const override { return "layer"; }
@@ -60,9 +61,10 @@ class Layers : public MoonModule {
         }
     }
 
-    // Single-Layer placeholder until composition lands: hand `Drivers` the
-    // first enabled Layer to read for buffer + dimensions. Returns nullptr
-    // when no Layer is registered (drivers handle that gracefully today).
+    // The first enabled Layer, else a registered-but-disabled one as fallback —
+    // `Drivers` reads it for physical dimensions only (every layer composites into
+    // the same physical space). Output source selection uses firstEnabledLayer().
+    // Returns nullptr when no Layer is registered (drivers handle that gracefully).
     // Non-Layer children are skipped — same guard as setLayouts above.
     Layer* activeLayer() const {
         MoonModule* fallback = nullptr;
@@ -75,6 +77,45 @@ class Layers : public MoonModule {
         return static_cast<Layer*>(fallback);  // nullptr if no Layer children
     }
 
+    // The first *enabled* Layer, or nullptr when none is enabled. Distinct from
+    // activeLayer(), which falls back to a disabled registered Layer so geometry
+    // (width/height/depth) stays queryable while everything is toggled off. Output
+    // selection must use *this* one: handing a disabled layer's stale buffer to the
+    // drivers would keep emitting its last frame instead of going idle.
+    Layer* firstEnabledLayer() const {
+        for (uint8_t i = 0; i < childCount(); i++) {
+            MoonModule* c = child(i);
+            if (!c || c->role() != ModuleRole::Layer || !c->enabled()) continue;
+            return static_cast<Layer*>(c);
+        }
+        return nullptr;
+    }
+
+    // Count of enabled Layer children — Drivers uses it to pick the single-layer
+    // fast path (==1) vs the composite path (>1), and to know if anything renders.
+    uint8_t enabledLayerCount() const {
+        uint8_t n = 0;
+        for (uint8_t i = 0; i < childCount(); i++) {
+            MoonModule* c = child(i);
+            if (c && c->role() == ModuleRole::Layer && c->enabled()) n++;
+        }
+        return n;
+    }
+
+    // Walk enabled Layers in container (composition) order — the order Drivers
+    // blends them, bottom (first) to top (last). `cb(layer, isFirst)`: isFirst
+    // marks the bottom layer (clears the buffer; the rest blend onto it).
+    template <typename Fn>
+    void forEachEnabledLayer(Fn cb) const {
+        bool first = true;
+        for (uint8_t i = 0; i < childCount(); i++) {
+            MoonModule* c = child(i);
+            if (!c || c->role() != ModuleRole::Layer || !c->enabled()) continue;
+            cb(static_cast<Layer*>(c), first);
+            first = false;
+        }
+    }
+
 private:
     Layouts* layouts_ = nullptr;
 };
diff --git a/src/light/modifiers/RegionModifier.h b/src/light/modifiers/RegionModifier.h
new file mode 100644
index 0000000..df88bf1
--- /dev/null
+++ b/src/light/modifiers/RegionModifier.h
@@ -0,0 +1,106 @@
+#pragma once
+
+#include "light/modifiers/ModifierBase.h"
+
+namespace mm {
+
+// Carves the layer down to a sub-region of the physical bounding box: the effect
+// renders only into the region, everything outside is dark. The region is given
+// as PERCENTAGES of the physical extent on each axis (start 0 / end 100 = the
+// full box, an identity carve), so it survives a physical resize — a 0..50 region
+// stays the left half whether the panel is 64 or 128 wide.
+//
+// It is a region *crop*, the textbook crop/region node of any compositor: it
+// resizes the logical box to the region (logicalDimensions) and maps each
+// region-local cell 1:1 to its box cell at the region's start offset
+// (mapToPhysical). Because the logical box is already the region size, every
+// region cell is in-bounds — the "drop outside" is achieved by the smaller box,
+// exactly as a Mirror shrinks the box to the half it folds. Never fans out
+// (maxMultiplier == 1), same 1:1 family as CheckerboardModifier.
+//
+// Rounding rule (spec: docs/moonmodules/light/RegionModifier.md): HALF-OPEN
+// [startPixel, endPixel). start% floors to the lower pixel; end% ceils to an
+// EXCLUSIVE pixel. Abutting regions never gap, and tile exactly when the boundary
+// lands on a pixel edge (0..50 + 50..100 on a 128-wide axis → 0..63 and 64..127);
+// otherwise both cover the boundary pixel (5-wide axis → 0..2 and 2..4). Clamped to
+// ≥1 pixel and to the box. (start 33 / end 66 on a 4-wide axis → floor(1.32)=1 ..
+// ceil(2.64)=3 → pixels 1..2, width 2; end 100 on a W-wide axis → ceil(W)=W → full
+// width.) Negative / >100 percentages are legal on the wire (Int16) but clamp here.
+//
+// Fast path: the cheapest carve is *no modifier* — then Layer::rebuildLUT takes
+// its identity/memcpy path with zero carving cost. Adding a full-region (0/100)
+// RegionModifier is correct but not free; the default is to not add one.
+class RegionModifier : public ModifierBase {
+public:
+    lengthType startX = 0,   startY = 0,   startZ = 0;
+    lengthType endX   = 100, endY   = 100, endZ   = 100;
+
+    nrOfLightsType maxMultiplier() const override { return 1; }  // 1:1 inside, never fans out
+
+    void onBuildControls() override {
+        // Int16 so negative / >100 percentages round-trip; the carve math clamps.
+        controls_.addInt16("startX", startX);
+        controls_.addInt16("startY", startY);
+        controls_.addInt16("startZ", startZ);
+        controls_.addInt16("endX",   endX);
+        controls_.addInt16("endY",   endY);
+        controls_.addInt16("endZ",   endZ);
+    }
+
+    void logicalDimensions(lengthType physW, lengthType physH, lengthType physD,
+                           lengthType& logW, lengthType& logH, lengthType& logD) const override {
+        logW = axisCount(startX, endX, physW);
+        logH = axisCount(startY, endY, physH);
+        logD = axisCount(startZ, endZ, physD);
+    }
+
+    void mapToPhysical(lengthType lx, lengthType ly, lengthType lz,
+                       lengthType physW, lengthType physH, lengthType physD,
+                       nrOfLightsType* outPhysicals, nrOfLightsType& outCount,
+                       nrOfLightsType maxOut) const override {
+        outCount = 0;
+        if (maxOut == 0) return;
+        // Region-local → box coordinate: add each axis's start-pixel offset. lx/ly/lz
+        // are already bounded by the region size logicalDimensions reported, so the
+        // result is always in-box; no per-cell drop needed.
+        const lengthType bx = lx + axisStart(startX, physW);
+        const lengthType by = ly + axisStart(startY, physH);
+        const lengthType bz = lz + axisStart(startZ, physD);
+        outPhysicals[0] = static_cast<nrOfLightsType>(bz) * static_cast<nrOfLightsType>(physW) * static_cast<nrOfLightsType>(physH) +
+                          static_cast<nrOfLightsType>(by) * static_cast<nrOfLightsType>(physW) +
+                          static_cast<nrOfLightsType>(bx);
+        outCount = 1;
+    }
+
+private:
+    // First pixel of the region on an axis: floor(start% · extent), clamped to
+    // [0, extent-1]. Shared by logicalDimensions (via axisCount) and mapToPhysical
+    // so the two can't drift.
+    static lengthType axisStart(lengthType startPct, lengthType extent) {
+        if (extent <= 0) return 0;
+        long p = (static_cast<long>(startPct) * extent) / 100;   // floor for non-negative; clamps below anyway
+        if (p < 0) p = 0;
+        if (p > extent - 1) p = extent - 1;
+        return static_cast<lengthType>(p);
+    }
+
+    // Region size on an axis (half-open): count = endPixel - startPixel, where
+    // endPixel is ceil(end% · extent) treated as EXCLUSIVE, clamped to
+    // [startPixel+1, extent] so the region is ≥1 pixel and stays in the box.
+    // Spec example: start 33 / end 66 on extent 4 → s=floor(1.32)=1,
+    // endExcl=ceil(2.64)=3 → count = 3-1 = 2 (pixels 1,2). Default end 100 on
+    // extent W → ceil(W)=W → count = W (full width). 0..50 then 50..100 on 128 →
+    // 0..64 and 64..128 exclusive → 64 + 64, tiling exactly.
+    static lengthType axisCount(lengthType startPct, lengthType endPct, lengthType extent) {
+        if (extent <= 0) return 0;
+        const lengthType s = axisStart(startPct, extent);
+        // Ceiling division of (endPct * extent) / 100, for non-negative endPct.
+        long num = static_cast<long>(endPct) * extent;
+        long e = num <= 0 ? 0 : (num + 99) / 100;   // ceil, EXCLUSIVE end pixel
+        if (e < s + 1) e = s + 1;                    // ≥1-pixel region
+        if (e > extent) e = extent;                  // never past the box
+        return static_cast<lengthType>(e - s);
+    }
+};
+
+} // namespace mm
diff --git a/src/main.cpp b/src/main.cpp
index 1a1ccc6..9361914 100644
--- a/src/main.cpp
+++ b/src/main.cpp
@@ -27,6 +27,7 @@
 #include "light/modifiers/CheckerboardModifier.h"
 #include "light/modifiers/RandomMapModifier.h"
 #include "light/modifiers/RotateModifier.h"
+#include "light/modifiers/RegionModifier.h"
 #include "light/drivers/NetworkSendDriver.h"
 #include "light/drivers/PreviewDriver.h"
 // LED drivers are compiled in per chip, gated on the SOC peripheral the driver
@@ -105,6 +106,7 @@ static void registerModuleTypes() {
     mm::ModuleFactory::registerType<mm::CheckerboardModifier>("CheckerboardModifier", "light/modifiers/CheckerboardModifier.md");
     mm::ModuleFactory::registerType<mm::RandomMapModifier>("RandomMapModifier", "light/modifiers/RandomMapModifier.md");
     mm::ModuleFactory::registerType<mm::RotateModifier>("RotateModifier", "light/modifiers/RotateModifier.md");
+    mm::ModuleFactory::registerType<mm::RegionModifier>("RegionModifier", "light/modifiers/RegionModifier.md");
     mm::ModuleFactory::registerType<mm::NetworkSendDriver>("NetworkSendDriver", "light/drivers/NetworkSendDriver.md");
     mm::ModuleFactory::registerType<mm::PreviewDriver>("PreviewDriver", "light/drivers/PreviewDriver.md");
     // Register only the LED drivers this chip's silicon can run (see the gated
diff --git a/src/ui/app.js b/src/ui/app.js
index 15c2980..b3bc430 100644
--- a/src/ui/app.js
+++ b/src/ui/app.js
@@ -5,6 +5,7 @@
 // default; entry-point is the WS init at the bottom — no ordering surprises.
 import { installPicker } from "/install-picker.js";
 import { preview } from "/preview3d.js";
+import { isNewer, parse } from "/semver.js";
 
 // Sections (top to bottom):
 //   1. State + storage
@@ -143,6 +144,7 @@ window.addEventListener("pageshow", (e) => {
 async function init() {
     applyTheme(theme);
     setupStatusBarButtons();
+    setupUpdateBadge();
     try {
         const resp = await fetch("/api/state");
         state = await resp.json();
@@ -567,6 +569,10 @@ function createCard(mod, depth) {
     // device fetches the binary via /api/firmware/url — no browser CORS in
     // the data path. See docs/architecture.md § Firmware vs board.
     if (mod.type === "FirmwareUpdateModule") {
+        // Opening the Firmware card forces a fresh update check (the badge otherwise refreshes
+        // only on the 1 h cache cadence) — so the badge agrees with the picker the user is about
+        // to use. Fire-and-forget; best-effort.
+        checkFirmwareUpdate(true);
         const ownFirmwareKey = (() => {
             // The `firmware` variant key is this module's own control now (moved here from
             // SystemModule), so read it straight off mod — no cross-module lookup.
@@ -985,7 +991,7 @@ function createControl(moduleName, moduleType, ctrl) {
         case "int16": {
             // ctrl.min/ctrl.max are always present (server sends them). Sentinel
             // values INT16_MIN (-32768) / INT16_MAX (32767) mean "unbounded" —
-            // fall back to the percentage range used by Layer start/end controls.
+            // fall back to a ±percentage range.
             const rawMin = Number(ctrl.min ?? -32768);
             const rawMax = Number(ctrl.max ?? 32767);
             const min = rawMin <= -32768 ? -100 : rawMin;
@@ -1112,11 +1118,30 @@ function createControl(moduleName, moduleType, ctrl) {
                 if (i === ctrl.value) o.selected = true;
                 sel.appendChild(o);
             });
-            sel.addEventListener("change", async () => {
+            // Protect the dropdown while the user has it open. A native <select>
+            // popup stays open for several frames (seconds, if deliberating) while
+            // a continuously-refreshed module keeps pushing state over the WS; an
+            // unguarded `sel.value = ctrl.value` patch during that window snaps the
+            // menu back to the old option and visibly closes it — the user never
+            // gets to pick. We mark the select "open" on pointerdown (fires BEFORE
+            // the popup opens, unlike focus, which some browsers delay or skip) and
+            // clear it on change/blur; updateModuleControls skips any select marked
+            // open. pointerdown also stamps the dragTs cooldown as a belt-and-braces
+            // fallback for the post-close frames.
+            sel.dataset.open = "false";
+            const markOpen = () => { sel.dataset.open = "true"; dragTs[key] = Date.now(); };
+            sel.addEventListener("pointerdown", markOpen);
+            sel.addEventListener("focus", markOpen);
+            sel.addEventListener("blur", () => { sel.dataset.open = "false"; });
+            sel.addEventListener("change", () => {
+                sel.dataset.open = "false";
                 dragTs[key] = Date.now();
-                await sendControl(moduleName, ctrl.name, parseInt(sel.value));
-                // Server may rebuild this module's controls (dynamic onBuildControls); refetch
-                setTimeout(refetchState, 200);
+                sendControl(moduleName, ctrl.name, parseInt(sel.value));
+                // No refetch/re-render here: blendMode/opacity-style selects don't
+                // change the control SET, and a control that does (a hidden-flag
+                // flip) is reconciled in place by syncVisibleControls on the next
+                // WS push — so the card (and its expanded state) is preserved.
+                // A full refetchState() rebuilt the DOM and collapsed the card.
             });
             row.appendChild(sel);
             appendResetButton(row, moduleName, ctrl, def, () => { sel.value = def; });
@@ -1552,7 +1577,14 @@ function allModules() {
 function syncVisibleControls(mod) {
     const card = document.querySelector(`.card[data-module="${cssEscape(mod.name)}"]`);
     if (!card) return false;
-    const host = card.querySelector(".card-controls-collapse") || card;
+    // The controls host is THIS card's own collapse wrapper — must be a DIRECT
+    // child (`:scope >`), not any descendant: a container card (e.g. Layers) nests
+    // its child cards (Layer) inside .card-children, and a plain
+    // `card.querySelector(".card-controls-collapse")` would reach down and match
+    // the CHILD's wrapper. That made Layers adopt Layer's control rows as its own,
+    // so both cards saw a control-set mismatch every WS frame and rebuilt each
+    // other's rows in a loop — tearing down (and closing) any open <select>.
+    const host = card.querySelector(":scope > .card-controls-collapse") || card;
 
     const wantNames = mod.controls.filter(c => !c.hidden).map(c => c.name);
     const haveRows = [...host.querySelectorAll(":scope > .control-row[data-key]")];
@@ -1652,7 +1684,14 @@ function updateModuleControls(mod) {
             }
             case "select": {
                 const sel = document.querySelector(`select[data-mid="${mid}"][data-key="${k}"]`);
-                if (sel && Number(sel.value) !== Number(ctrl.value)) sel.value = ctrl.value;
+                // Never overwrite a select the user currently has OPEN (popup
+                // showing) or focused. data-open is set on pointerdown/focus and
+                // cleared on change/blur — more reliable than document.activeElement,
+                // which is ambiguous while a native popup is up (the popup is a
+                // separate OS layer on macOS). The 1s dragTs cooldown is the
+                // additional fallback for the frames right after the popup closes.
+                if (sel && sel.dataset.open !== "true" && sel !== document.activeElement &&
+                    Number(sel.value) !== Number(ctrl.value)) sel.value = ctrl.value;
                 break;
             }
             case "display": {
@@ -2158,6 +2197,175 @@ function updateStatusBar() {
         if (crashed) rebootBtn.title = "Last boot: " + reasonCtrl.value + " (click to reboot)";
         else rebootBtn.title = "Reboot device";
     }
+
+    // Cache-first update check: instant from the localStorage cache, background-fetches only
+    // when stale (>1 h). Fire-and-forget — best-effort, never blocks the status-bar render.
+    checkFirmwareUpdate(false);
+}
+
+// ---------------------------------------------------------------------------
+// 8b. Firmware-update badge
+// ---------------------------------------------------------------------------
+// Browser-side "a newer firmware is out" check, modelled on ESP32-sveltekit's
+// UpdateIndicator (the upstream firmware lineage) — our own code. The device fetches
+// nothing; the browser compares the running version (FirmwareUpdateModule.version, pure
+// semver) against GitHub releases and, when newer AND a compatible .bin exists, shows the
+// status-bar badge. Two channels:
+//   - STABLE: a device compares against the newest stable release (the /latest endpoint
+//     excludes prereleases). Applies to every device.
+//   - DEV (latest): a device already on a prerelease build (-dev.<N>) ALSO compares against
+//     the moving `latest` release, so a stale latest build is nudged to the newest latest.
+//     The `latest` release's tag is "latest" (not a semver), so its version is read from the
+//     release `name` (e.g. 2.1.0-dev.7); the manifest-*.json asset is not CORS-readable here.
+// A stable update wins over a dev update. Cached in localStorage (1 h TTL) so it doesn't
+// slow page load; a fresh check is forced when the Firmware card opens. Best-effort: any
+// failure hides the badge, never throws.
+
+const RELEASES_API = "https://api.github.com/repos/MoonModules/projectMM/releases";
+const UPDATE_TTL_MS = 60 * 60 * 1000;                     // 1 h — best-effort, well under GitHub's rate limit
+const PICKER_RELEASE_KEY = "projectMM.picker.releaseTag"; // install-picker restores from this on init
+
+function safeLocalGet(key) { try { return localStorage.getItem(key); } catch (_) { return null; } }   // null if storage access throws
+function safeLocalSet(key, v) { try { localStorage.setItem(key, v); } catch (_) { /* ignore */ } }    // best-effort write; a throw is swallowed
+
+// In-flight fetches keyed by cache slot. updateStatusBar() calls checkFirmwareUpdate(false)
+// every WS tick (1 Hz); on a cold cache they'd each start a duplicate releases/latest request
+// before the first writes the cache. Share the pending promise so concurrent callers reuse it.
+const inFlightFetches = {};
+
+// A cached JSON fetch: returns the parsed body, re-fetching only when the cache is older than
+// the TTL or `force` is set, and serving stale on a fetch failure. `key` is the cache slot.
+async function cachedJson(url, key, force) {
+    // Resolves to the parsed body, or null when nothing could be fetched or served stale.
+    // Fast path (skipped when `force`): a cache entry younger than the TTL is returned as-is.
+    if (!force) {
+        const raw = safeLocalGet(key);
+        if (raw) {
+            try {
+                const obj = JSON.parse(raw);
+                if (Date.now() - obj.ts < UPDATE_TTL_MS) return obj.data;
+            } catch (_) { /* corrupt entry — fall through to fetch */ }
+        }
+    }
+    // Coalesce concurrent fetches for the same slot onto one request.
+    if (inFlightFetches[key]) return inFlightFetches[key];
+    const p = (async () => {
+        try {
+            const res = await fetch(url, { headers: { accept: "application/json" } });
+            if (!res.ok) throw new Error(`HTTP ${res.status}`);
+            const data = await res.json();
+            safeLocalSet(key, JSON.stringify({ ts: Date.now(), data }));
+            return data;
+        } catch (e) {
+            // console.debug, not warn: a failed update check is routine and not actionable
+            // (device offline, GitHub rate limit), so it stays out of the default console.
+            console.debug("[update] fetch failed:", url, e && e.message ? e.message : e);
+            const raw = safeLocalGet(key);                   // serve stale on failure
+            if (raw) {
+                try {
+                    const obj = JSON.parse(raw);
+                    // Refresh the timestamp so the per-render check doesn't re-attempt a
+                    // failing fetch each time — back off until the next TTL window.
+                    safeLocalSet(key, JSON.stringify({ ts: Date.now(), data: obj.data }));
+                    return obj.data;
+                } catch (_) { /* none */ }
+            }
+            // No stale entry to serve: NEGATIVE-CACHE the failure (data:null) with a fresh
+            // timestamp so the TTL guard above suppresses retries for the back-off window.
+            // Without this, every status-bar render re-runs the failing fetch — an error
+            // storm in the console whenever the device is offline.
+            safeLocalSet(key, JSON.stringify({ ts: Date.now(), data: null }));
+            return null;
+        }
+    })();
+    // Free the slot from a settle callback rather than a `finally` inside the task: the callback
+    // always runs after the assignment below, whereas an inner `finally` runs BEFORE it when the
+    // task ends without ever awaiting (a synchronous throw from `fetch`), parking a dead promise.
+    const release = () => { if (inFlightFetches[key] === p) delete inFlightFetches[key]; };
+    inFlightFetches[key] = p;
+    p.then(release, release);
+    return p;
+}
+
+// Read the device's running version + firmware-variant key off the FirmwareUpdateModule.
+function deviceFirmwareInfo() {
+    if (!(state && state.modules)) return null;
+    // findModule("Firmware") first; otherwise the first module whose type is FirmwareUpdateModule.
+    const mod = findModule("Firmware") || state.modules.find(m => m.type === "FirmwareUpdateModule");
+    if (!mod) return null;
+    const valueOf = (name) => ((mod.controls || []).find(c => c.name === name) || {}).value;
+    const version = valueOf("version"), firmware = valueOf("firmware");
+    return version ? { version, firmware } : null;   // no version → nothing to compare against
+}
+
+// Light the badge for an available update. `tag` is the release the picker should pre-select
+// (a vX.Y.Z stable tag, or "latest"); `label` is what the badge shows.
+function showUpdateBadge(badge, tag, label) {
+    const text = `⬆ ${label}`;
+    const tooltip = `Firmware update available: ${label} — open Firmware to install`;
+    badge.dataset.tag = tag;                         // consumed by the badge click handler
+    Object.assign(badge, { textContent: text, title: tooltip, hidden: false });
+}
+
+// Is there a newer STABLE release than the device's version, with a compatible .bin?
+// Returns the stable tag (e.g. "v2.1.0") or null. /latest excludes prereleases.
+async function stableUpdate(dev, force) {
+    const release = await cachedJson(`${RELEASES_API}/latest`, "projectMM.update.latest.v1", force);
+    const tag = release ? release.tag_name : null;
+    if (!tag) return null;
+    const names = (release.assets || []).map(asset => asset.name);
+    const installable = !dev.firmware || names.includes(`firmware-${dev.firmware}-${tag}.bin`);   // no key → nothing to match
+    return (isNewer(tag, dev.version) && installable) ? tag : null;
+}
+
+// For a device already on a -dev build: is the moving `latest` release newer? Returns its
+// version string (e.g. "2.1.0-dev.7") or null. The latest release's tag is "latest"; its
+// version is published as the release `name` (release.yml), which the GitHub API exposes
+// CORS-readably — unlike the manifest-*.json asset, whose release-asset URL redirects to
+// release-assets.githubusercontent.com (no CORS header), so the device-hosted UI can't read it.
+// We also require the matching firmware .bin asset so the badge never points at a build the
+// device can't install.
+async function devUpdate(dev, force) {
+    if (!dev.firmware) return null;   // no variant key → no asset name to look for
+    const latest = await cachedJson(`${RELEASES_API}/tags/latest`, "projectMM.update.dev.v1", force);
+    const version = latest ? latest.name : null;
+    if (!version) return null;
+    // The moving release names assets by version, not tag: firmware-<fw>-v<version>.bin
+    // (release.yml stages PREFIX="firmware-...-v$V").
+    const wanted = `firmware-${dev.firmware}-v${version}.bin`;
+    return ((latest.assets || []).some(asset => asset.name === wanted) && isNewer(version, dev.version)) ? version : null;
+}
+
+// Show/hide the badge. `force` bypasses the cache (used when the Firmware card opens).
+// Stable update takes precedence; a -dev device additionally checks the latest channel.
+async function checkFirmwareUpdate(force) {
+    const badge = document.getElementById("fw-update-badge");
+    if (!badge) return;
+    try {
+        const dev = deviceFirmwareInfo();   // null when state has no Firmware module/version yet
+        const stableTag = dev ? await stableUpdate(dev, force) : null;
+        if (stableTag) { showUpdateBadge(badge, stableTag, stableTag); return; }
+        // Only a prerelease (-dev…) build follows the moving latest channel, never a stable one.
+        const onPrerelease = !!dev && (parse(dev.version)?.prerelease.length || 0) > 0;
+        const devVer = onPrerelease ? await devUpdate(dev, force) : null;
+        if (devVer) { showUpdateBadge(badge, "latest", `latest (${devVer})`); return; }
+    } catch (e) {
+        // Callers fire-and-forget this promise: a malformed release payload or cache entry must
+        // degrade to "no badge", not surface as an unhandled rejection on every status-bar render.
+        console.debug("[update] check failed:", e && e.message ? e.message : e);
+    }
+    badge.hidden = true;
+}
+
+// Badge click → pre-select the new release in the picker (it restores from PICKER_RELEASE_KEY
+// on init) and open the Firmware card, so the user lands one click from Install.
+function setupUpdateBadge() {
+    const onClick = (ev) => {
+        const tag = ev.currentTarget.dataset.tag;   // release to pre-select, if one is set
+        if (tag) safeLocalSet(PICKER_RELEASE_KEY, tag);
+        selectModule("Firmware");
+    };
+    document.getElementById("fw-update-badge")?.addEventListener("click", onClick);
 }
 
 // ---------------------------------------------------------------------------
diff --git a/src/ui/embed_ui.cmake b/src/ui/embed_ui.cmake
index 0ec169f..0fde741 100644
--- a/src/ui/embed_ui.cmake
+++ b/src/ui/embed_ui.cmake
@@ -52,6 +52,7 @@ gzip_file_hex("index.html" INDEX_HTML)
 gzip_file_hex("app.js" APP_JS)
 gzip_file_hex("style.css" STYLE_CSS)
 gzip_file_hex("install-picker.js" INSTALL_PICKER_JS)
+gzip_file_hex("semver.js" SEMVER_JS)
 gzip_file_hex("preview3d.js" PREVIEW3D_JS)
 file(READ "${UI_DIR}/moonlight-logo.png" LOGO_PNG HEX)
 
@@ -74,6 +75,7 @@ hex_to_c_array("${INDEX_HTML}" "indexHtml" INDEX_ARRAY)
 hex_to_c_array("${APP_JS}" "appJs" APP_ARRAY)
 hex_to_c_array("${STYLE_CSS}" "styleCss" STYLE_ARRAY)
 hex_to_c_array("${INSTALL_PICKER_JS}" "installPickerJs" INSTALL_PICKER_ARRAY)
+hex_to_c_array("${SEMVER_JS}" "semverJs" SEMVER_ARRAY)
 hex_to_c_array("${PREVIEW3D_JS}" "preview3dJs" PREVIEW3D_ARRAY)
 hex_to_c_array("${LOGO_PNG}" "logoPng" LOGO_ARRAY)
 
@@ -81,12 +83,14 @@ string(LENGTH "${INDEX_HTML}" INDEX_HEX_LEN)
 string(LENGTH "${APP_JS}" APP_HEX_LEN)
 string(LENGTH "${STYLE_CSS}" STYLE_HEX_LEN)
 string(LENGTH "${INSTALL_PICKER_JS}" INSTALL_PICKER_HEX_LEN)
+string(LENGTH "${SEMVER_JS}" SEMVER_HEX_LEN)
 string(LENGTH "${PREVIEW3D_JS}" PREVIEW3D_HEX_LEN)
 string(LENGTH "${LOGO_PNG}" LOGO_HEX_LEN)
 math(EXPR INDEX_LEN "${INDEX_HEX_LEN} / 2")
 math(EXPR APP_LEN "${APP_HEX_LEN} / 2")
 math(EXPR STYLE_LEN "${STYLE_HEX_LEN} / 2")
 math(EXPR INSTALL_PICKER_LEN "${INSTALL_PICKER_HEX_LEN} / 2")
+math(EXPR SEMVER_LEN "${SEMVER_HEX_LEN} / 2")
 math(EXPR PREVIEW3D_LEN "${PREVIEW3D_HEX_LEN} / 2")
 math(EXPR LOGO_LEN "${LOGO_HEX_LEN} / 2")
 
@@ -100,6 +104,8 @@ file(APPEND "${OUT}" "constexpr uint8_t styleCss[] = {${STYLE_ARRAY}};\n")
 file(APPEND "${OUT}" "constexpr size_t styleCssLen = ${STYLE_LEN};\n")
 file(APPEND "${OUT}" "constexpr uint8_t installPickerJs[] = {${INSTALL_PICKER_ARRAY}};\n")
 file(APPEND "${OUT}" "constexpr size_t installPickerJsLen = ${INSTALL_PICKER_LEN};\n")
+file(APPEND "${OUT}" "constexpr uint8_t semverJs[] = {${SEMVER_ARRAY}};\n")
+file(APPEND "${OUT}" "constexpr size_t semverJsLen = ${SEMVER_LEN};\n")
 file(APPEND "${OUT}" "constexpr uint8_t preview3dJs[] = {${PREVIEW3D_ARRAY}};\n")
 file(APPEND "${OUT}" "constexpr size_t preview3dJsLen = ${PREVIEW3D_LEN};\n")
 file(APPEND "${OUT}" "constexpr uint8_t logoPng[] = {${LOGO_ARRAY}};\n")
diff --git a/src/ui/index.html b/src/ui/index.html
index d837c43..623ad9f 100644
--- a/src/ui/index.html
+++ b/src/ui/index.html
@@ -15,6 +15,10 @@
         <span id="device-name"></span>
         <span id="sys-stats"></span>
         <span class="spacer"></span>
+        <!-- Shown when a newer GitHub release exists for this device's firmware: a stable one,
+             or for a -dev build the moving `latest` (app.js::checkFirmwareUpdate). Click opens
+             Firmware with that release pre-selected. Hidden by default; never blocks on GitHub. -->
+        <button type="button" id="fw-update-badge" class="fw-update-badge" hidden></button>
         <span id="ws-dot" class="ws-dot disconnected" title="WebSocket"></span>
         <button type="button" id="reboot-btn" class="header-btn" aria-label="Reboot device" title="Reboot device">⏻</button>
         <button type="button" id="theme-toggle" class="header-btn" aria-label="Toggle light/dark theme" title="Toggle light/dark theme">☀</button>
diff --git a/src/ui/semver.js b/src/ui/semver.js
new file mode 100644
index 0000000..61ffc8c
--- /dev/null
+++ b/src/ui/semver.js
@@ -0,0 +1,71 @@
+// projectMM semver — a tiny, dependency-free Semantic Versioning compare.
+//
+// One home for version comparison (the firmware-update check needs it; the install picker can adopt
+// it for its dropdown ordering later). Implements the parts of https://semver.org we use:
+//   §2  version core: MAJOR.MINOR.PATCH (numeric)
+//   §9  pre-release: a `-` then dot-separated identifiers (e.g. 2.1.0-dev, 1.0.0-rc.2)
+//   §10 build metadata: a `+` then identifiers — IGNORED for precedence (per spec)
+//   §11 precedence: compare core numerically; a version WITH a pre-release is LOWER than the same
+//       core without one; otherwise compare pre-release identifiers left-to-right (numeric < non-
+//       numeric, numerics compared as numbers, alphanumerics by ASCII, longer set wins if all equal).
+//
+// Our own code (not a port of `compare-versions`/`semver` npm) — carry the idea forward, write it
+// fresh against our needs. Tested in test/js/semver.test.mjs.
+
+// Parse "v?MAJOR.MINOR.PATCH(-prerelease)?(+build)?" → {major, minor, patch, prerelease: string[]}.
+// Returns null if it isn't a parseable version core (so callers can treat junk as "can't compare").
+// A leading `v` is tolerated (git tags). Build metadata is dropped (it has no precedence).
+export function parse(version) {
+    if (typeof version !== "string") return null;   // non-strings (undefined, numbers) are "can't compare"
+    const s = version.trim().replace(/^v/, "");
+    // core (-prerelease)? (+build)? — dot-separated identifiers must each be NON-EMPTY (§9/§10), so "1.0.0-rc..1" is junk.
+    const m = /^(\d+)\.(\d+)\.(\d+)(?:-([0-9A-Za-z-]+(?:\.[0-9A-Za-z-]+)*))?(?:\+[0-9A-Za-z-]+(?:\.[0-9A-Za-z-]+)*)?$/.exec(s);
+    if (!m) return null;
+    return {
+        major: Number(m[1]),
+        minor: Number(m[2]),
+        patch: Number(m[3]),
+        prerelease: m[4] ? m[4].split(".") : [],
+    };
+}
+
+// Compare two pre-release identifier arrays per §11. Returns -1/0/1.
+function comparePrerelease(a, b) {
+    const isNumeric = (id) => /^\d+$/.test(id);
+    // An empty identifier list means "release", which outranks any pre-release (1.0.0 > 1.0.0-rc.1).
+    if (a.length === 0 || b.length === 0) {
+        return a.length === b.length ? 0 : (a.length === 0 ? 1 : -1);
+    }
+    const shared = Math.min(a.length, b.length);
+    for (let i = 0; i < shared; i++) {
+        const left = a[i], right = b[i];
+        const leftNum = isNumeric(left), rightNum = isNumeric(right);
+        if (leftNum !== rightNum) return leftNum ? -1 : 1;   // a numeric identifier ranks below an alphanumeric one
+        if (leftNum) {                                       // both numeric → compare by value
+            const delta = Number(left) - Number(right);
+            if (delta !== 0) return delta < 0 ? -1 : 1;
+        } else if (left !== right) {                         // both alphanumeric → ASCII order
+            return left < right ? -1 : 1;
+        }
+    }
+    // Every shared identifier tied → the list with more identifiers ranks higher.
+    return Math.sign(a.length - b.length);
+}
+
+// Compare two version strings. Returns -1 (a<b), 0 (a==b), 1 (a>b).
+// An unparseable side is treated as the LOWEST (so a comparison against junk never claims an update).
+export function compare(a, b) {
+    const left = parse(a);
+    const right = parse(b);
+    // Junk sorts lowest: an unparseable side loses, and two unparseable sides tie.
+    if (!left || !right) return left ? 1 : (right ? -1 : 0);
+    // The first differing core field, most significant first, decides the order.
+    const field = ["major", "minor", "patch"].find(k => left[k] !== right[k]);
+    if (field) return left[field] < right[field] ? -1 : 1;
+    return comparePrerelease(left.prerelease, right.prerelease);   // same core → pre-release decides (§11)
+}
+
+// True iff `candidate` is a strictly newer version than `current` (the update-available test).
+export function isNewer(candidate, current) {
+    return compare(candidate, current) > 0;   // equal, older, or an unparseable candidate → false
+}
diff --git a/src/ui/style.css b/src/ui/style.css
index 47ebe5d..4ba5ad7 100644
--- a/src/ui/style.css
+++ b/src/ui/style.css
@@ -97,6 +97,21 @@ body {
 .ws-dot.connected { background: var(--green); }
 .ws-dot.disconnected { background: #888; }
 
+/* Firmware-update badge: shown by app.js when a newer release (stable, or `latest` for a -dev
+   build) exists. Accent-filled pill (attention, not alarm) in the status bar; click opens Firmware. */
+.fw-update-badge {
+    border: 1px solid var(--accent);
+    background: color-mix(in srgb, var(--accent) 18%, transparent);
+    color: var(--accent);
+    font-size: 12px;
+    line-height: 1;
+    padding: 4px 8px;
+    border-radius: 12px;
+    cursor: pointer;
+    white-space: nowrap;
+}
+.fw-update-badge:hover { background: color-mix(in srgb, var(--accent) 30%, transparent); }
+
 .header-btn {
     background: transparent;
     border: 1px solid var(--border);
diff --git a/test/CMakeLists.txt b/test/CMakeLists.txt
index fc0989c..81fc0c8 100644
--- a/test/CMakeLists.txt
+++ b/test/CMakeLists.txt
@@ -60,6 +60,7 @@ add_executable(mm_tests
     unit/light/unit_CheckerboardModifier.cpp
     unit/light/unit_RandomMapModifier.cpp
     unit/light/unit_RotateModifier.cpp
+    unit/light/unit_RegionModifier.cpp
     unit/light/unit_NoiseEffect.cpp
     unit/light/unit_ParticlesEffect.cpp
     unit/light/unit_PlasmaEffect.cpp
diff --git a/test/js/semver.test.mjs b/test/js/semver.test.mjs
new file mode 100644
index 0000000..a17aa6c
--- /dev/null
+++ b/test/js/semver.test.mjs
@@ -0,0 +1,62 @@
+// Semver compare contract — pins the parse + precedence rules src/ui/semver.js implements
+// (semver.org §2/§9/§11). The firmware "update available" badge relies on these: a clean stable
+// release must out-rank a `-dev` build of the same core, and a real bump must register as newer.
+// Run: `node --test test/js`.
+
+import { test } from "node:test";
+import assert from "node:assert/strict";
+import { parse, compare, isNewer } from "../../src/ui/semver.js";
+
+test("parse: core, prerelease, leading v, build metadata", () => {
+    assert.deepEqual(parse("2.0.0"), { major: 2, minor: 0, patch: 0, prerelease: [] });
+    assert.deepEqual(parse("v2.1.0"), { major: 2, minor: 1, patch: 0, prerelease: [] });  // leading v tolerated
+    assert.deepEqual(parse("2.1.0-dev"), { major: 2, minor: 1, patch: 0, prerelease: ["dev"] });
+    assert.deepEqual(parse("1.0.0-rc.2"), { major: 1, minor: 0, patch: 0, prerelease: ["rc", "2"] });
+    assert.deepEqual(parse("1.2.3+build.7"), { major: 1, minor: 2, patch: 3, prerelease: [] });  // build dropped
+    assert.equal(parse("not-a-version"), null);
+    assert.equal(parse("2.0"), null);          // incomplete core
+    assert.equal(parse(undefined), null);
+});
+
+test("compare: numeric core ordering", () => {
+    assert.equal(compare("2.0.0", "1.0.0"), 1);
+    assert.equal(compare("1.0.0", "2.0.0"), -1);
+    assert.equal(compare("2.1.0", "2.0.5"), 1);   // minor beats patch
+    assert.equal(compare("2.0.1", "2.0.0"), 1);
+    assert.equal(compare("2.0.0", "2.0.0"), 0);
+    assert.equal(compare("v2.0.0", "2.0.0"), 0);  // leading v doesn't change value
+});
+
+test("compare: a release out-ranks a prerelease of the same core (§11)", () => {
+    assert.equal(compare("2.1.0", "2.1.0-dev"), 1);    // stable > dev — the badge's core case
+    assert.equal(compare("2.1.0-dev", "2.1.0"), -1);
+    assert.equal(compare("1.0.0-rc.1", "1.0.0"), -1);
+});
+
+test("compare: prerelease identifier precedence (§11)", () => {
+    assert.equal(compare("1.0.0-alpha", "1.0.0-beta"), -1);          // ASCII: alpha < beta
+    assert.equal(compare("1.0.0-rc.2", "1.0.0-rc.1"), 1);           // numeric identifiers as numbers
+    assert.equal(compare("1.0.0-rc.10", "1.0.0-rc.2"), 1);         // 10 > 2 numerically (not string)
+    assert.equal(compare("1.0.0-1", "1.0.0-alpha"), -1);          // numeric id < alphanumeric id
+    assert.equal(compare("1.0.0-rc.1.1", "1.0.0-rc.1"), 1);       // longer set wins when prefix equal
+});
+
+test("compare: monotonic -dev.<N> ordering (the latest-channel case)", () => {
+    assert.equal(compare("2.1.0-dev.7", "2.1.0-dev.6"), 1);   // newer latest build
+    assert.equal(compare("2.1.0-dev.10", "2.1.0-dev.9"), 1);  // numeric, not string (10 > 9)
+    assert.equal(compare("2.1.0-dev.1", "2.1.0-dev"), 1);     // a numbered dev outranks the bare -dev (local)
+    assert.equal(isNewer("2.1.0-dev.7", "2.1.0-dev.7"), false); // same latest build → no update
+});
+
+test("compare: unparseable side sorts lowest (never falsely claims newer)", () => {
+    assert.equal(compare("garbage", "1.0.0"), -1);
+    assert.equal(compare("1.0.0", "garbage"), 1);
+    assert.equal(compare("garbage", "junk"), 0);
+});
+
+test("isNewer: the update-available predicate", () => {
+    assert.equal(isNewer("2.1.0", "2.0.0"), true);      // newer stable available
+    assert.equal(isNewer("2.0.0", "2.0.0"), false);     // up to date
+    assert.equal(isNewer("2.0.0", "2.1.0-dev"), false); // dev build is AHEAD of latest stable → no update
+    assert.equal(isNewer("1.0.0", "2.0.0"), false);     // device newer than candidate
+});
diff --git a/test/python/test_compute_version.py b/test/python/test_compute_version.py
new file mode 100644
index 0000000..515b632
--- /dev/null
+++ b/test/python/test_compute_version.py
@@ -0,0 +1,87 @@
+# /// script
+# dependencies = ["pytest"]
+# ///
+"""compute_version tests — pins the per-channel version string.
+
+A stable build carries the core semver; a `latest` build carries a monotonic
+`<core>-dev.<N>` so successive latest builds are orderable; a local build is
+library.json verbatim. N counts since the last `v*` tag, with a tag-less fallback.
+
+Run: `uv run pytest test/python`.
+"""
+
+import json
+import sys
+from pathlib import Path
+
+sys.path.insert(0, str(Path(__file__).resolve().parents[2] / "scripts" / "build"))
+import compute_version as cv  # noqa: E402
+
+
+def _lib(tmp_path, version):
+    """Create `library.json` under `tmp_path` with the given `version`; return the file's path."""
+    target, payload = tmp_path / "library.json", {"name": "projectMM", "version": version}
+    target.write_text(json.dumps(payload))
+    return target
+
+
+def test_core_strips_prerelease_and_build():
+    assert cv.core_version("2.1.0-dev") == "2.1.0"
+    assert cv.core_version("2.1.0-dev.6") == "2.1.0"
+    assert cv.core_version("2.1.0+build.7") == "2.1.0"
+    assert cv.core_version("2.0.0") == "2.0.0"
+
+
+def test_stable_is_core(monkeypatch, tmp_path):
+    monkeypatch.setattr(cv, "LIBRARY_JSON", _lib(tmp_path, "2.1.0-dev"))
+    assert cv.compute("stable") == "2.1.0"
+
+
+def test_latest_is_core_dev_n(monkeypatch, tmp_path):
+    monkeypatch.setattr(cv, "LIBRARY_JSON", _lib(tmp_path, "2.1.0-dev"))
+    monkeypatch.setattr(cv, "commits_since_last_stable", lambda: 6)
+    assert cv.compute("latest") == "2.1.0-dev.6"
+
+
+def test_local_is_verbatim(monkeypatch, tmp_path):
+    monkeypatch.setattr(cv, "LIBRARY_JSON", _lib(tmp_path, "2.1.0-dev"))
+    assert cv.compute("local") == "2.1.0-dev"
+
+
+def test_channel_for_tag_centralizes_the_mapping():
+    # The release workflow passes only --tag; the channel derives from it here, so
+    # the build job and release job can't disagree.
+    assert cv.channel_for_tag("latest") == "latest"
+    assert cv.channel_for_tag("v2.1.0") == "stable"
+    assert cv.channel_for_tag("v2.1.0-rc1") == "stable"   # -rc handled inside compute(), still stable channel
+    assert cv.channel_for_tag("") == "stable"
+
+
+def test_stable_rc_tag_keeps_prerelease(monkeypatch, tmp_path):
+    # An -rc tag is itself a precise prerelease semver — carried through verbatim
+    # (minus the leading v), not collapsed to the core, so the RC binary doesn't
+    # masquerade as the stable release.
+    monkeypatch.setattr(cv, "LIBRARY_JSON", _lib(tmp_path, "2.1.0-dev"))
+    assert cv.compute("stable", "v2.1.0-rc1") == "2.1.0-rc1"
+    assert cv.compute("stable", "v2.1.0") == "2.1.0"      # plain stable tag → core
+    assert cv.compute("stable", "") == "2.1.0"            # no tag → core
+
+
+def test_no_tag_fallback_counts_from_root(monkeypatch, tmp_path):
+    """With no `v*` tag, `git describe` fails and the count falls back to `rev-list ... HEAD`."""
+    import subprocess
+
+    seen = []
+
+    def fake_run(cmd, **kw):
+        """Record the command; fail `describe` (no v* tag), answer anything else with 42."""
+        seen.append(cmd)
+        if "describe" not in cmd:
+            return subprocess.CompletedProcess(cmd, 0, stdout="42\n", stderr="")
+        raise subprocess.CalledProcessError(128, cmd)
+
+    monkeypatch.setattr(cv.subprocess, "run", fake_run)
+    assert cv.commits_since_last_stable() == 42
+    # The fallback must end at plain HEAD, not at a <tag>..HEAD range.
+    rev_list_cmds = [cmd for cmd in seen if "rev-list" in cmd]
+    assert rev_list_cmds[0][-1] == "HEAD"
diff --git a/test/python/test_verify_version.py b/test/python/test_verify_version.py
new file mode 100644
index 0000000..573f410
--- /dev/null
+++ b/test/python/test_verify_version.py
@@ -0,0 +1,57 @@
+# /// script
+# dependencies = ["pytest"]
+# ///
+"""verify_version release-ritual tests.
+
+Pins the develop-on-a-prerelease flow: between releases library.json carries the NEXT
+version with a `-dev` suffix (e.g. `2.1.0-dev`), and cutting the stable tag drops the
+suffix. So `verify_version.py` must accept `v2.1.0` against `library.json 2.1.0-dev`
+(same core) while still rejecting a wrong core. The `latest` moving tag skips the check.
+
+Run: `uv run pytest test/python`.
+"""
+
+import json
+import subprocess
+import sys
+from pathlib import Path
+
+ROOT = Path(__file__).resolve().parents[2]
+SCRIPT = ROOT / "scripts" / "build" / "verify_version.py"
+
+
+def run(tag, version, tmp_path):
+    """Run verify_version against a throwaway library.json holding `version`."""
+    lib = tmp_path / "library.json"
+    lib.write_text(json.dumps({"name": "projectMM", "version": version}))
+    # verify_version reads ROOT/library.json; point it at the temp copy via cwd is not enough
+    # (it resolves ROOT from __file__), so patch by running a tiny wrapper that swaps the path.
+    code = (
+        f"import runpy, sys; "
+        f"import scripts.build.verify_version as v; "
+        f"v.LIBRARY_JSON = __import__('pathlib').Path(r'{lib}'); "
+        f"sys.argv = ['verify_version', '--tag', r'{tag}']; "
+        f"sys.exit(v.main())"
+    )
+    return subprocess.run(
+        [sys.executable, "-c", code], cwd=ROOT, capture_output=True, text=True
+    ).returncode
+
+
+def test_stable_tag_matches_dev_library(tmp_path):
+    # The release ritual: tag v2.1.0 releases the in-development 2.1.0-dev.
+    assert run("v2.1.0", "2.1.0-dev", tmp_path) == 0
+
+
+def test_stable_tag_matches_clean_library(tmp_path):
+    assert run("v2.0.0", "2.0.0", tmp_path) == 0
+
+
+def test_wrong_core_fails(tmp_path):
+    # A tag whose CORE differs from library.json must still fail.
+    assert run("v2.2.0", "2.1.0-dev", tmp_path) == 1
+
+
+def test_latest_skips(tmp_path):
+    # The moving prerelease channel has no in-tree version to match.
+    assert run("latest", "2.1.0-dev", tmp_path) == 0
diff --git a/test/scenarios/core/scenario_MoonModule_control_change.json b/test/scenarios/core/scenario_MoonModule_control_change.json
index a154b19..ca9e57d 100644
--- a/test/scenarios/core/scenario_MoonModule_control_change.json
+++ b/test/scenarios/core/scenario_MoonModule_control_change.json
@@ -118,7 +118,7 @@
         "pc-macos": {
           "tick_us": [
             97,
-            222
+            316
           ],
           "free_heap": [
             0,
@@ -130,7 +130,7 @@
           ],
           "at": [
             "2026-06-02",
-            "2026-06-07"
+            "2026-06-25"
           ]
         },
         "esp32-eth-wifi": {
diff --git a/test/scenarios/light/scenario_Audio_mutation.json b/test/scenarios/light/scenario_Audio_mutation.json
index 0ae0a61..755fe70 100644
--- a/test/scenarios/light/scenario_Audio_mutation.json
+++ b/test/scenarios/light/scenario_Audio_mutation.json
@@ -88,7 +88,7 @@
         "pc-macos": {
           "tick_us": [
             8,
-            21
+            31
           ],
           "free_heap": [
             0,
@@ -100,7 +100,7 @@
           ],
           "at": [
             "2026-06-12",
-            "2026-06-24"
+            "2026-06-25"
           ]
         }
       }
@@ -127,7 +127,7 @@
         "pc-macos": {
           "tick_us": [
             8,
-            20
+            29
           ],
           "free_heap": [
             0,
@@ -139,7 +139,7 @@
           ],
           "at": [
             "2026-06-12",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -182,7 +182,7 @@
         "pc-macos": {
           "tick_us": [
             8,
-            20
+            31
           ],
           "free_heap": [
             0,
@@ -194,7 +194,7 @@
           ],
           "at": [
             "2026-06-13",
-            "2026-06-24"
+            "2026-06-25"
           ]
         }
       }
@@ -221,7 +221,7 @@
         "pc-macos": {
           "tick_us": [
             8,
-            32
+            33
           ],
           "free_heap": [
             0,
@@ -233,7 +233,7 @@
           ],
           "at": [
             "2026-06-12",
-            "2026-06-24"
+            "2026-06-25"
           ]
         }
       }
@@ -258,7 +258,7 @@
         "pc-macos": {
           "tick_us": [
             8,
-            23
+            32
           ],
           "free_heap": [
             0,
@@ -270,7 +270,7 @@
           ],
           "at": [
             "2026-06-12",
-            "2026-06-24"
+            "2026-06-25"
           ]
         }
       }
@@ -295,7 +295,7 @@
         "pc-macos": {
           "tick_us": [
             8,
-            20
+            25
           ],
           "free_heap": [
             0,
@@ -307,7 +307,7 @@
           ],
           "at": [
             "2026-06-12",
-            "2026-06-24"
+            "2026-06-25"
           ]
         }
       }
diff --git a/test/scenarios/light/scenario_Driver_mutation.json b/test/scenarios/light/scenario_Driver_mutation.json
index c3e9df6..ae3af8e 100644
--- a/test/scenarios/light/scenario_Driver_mutation.json
+++ b/test/scenarios/light/scenario_Driver_mutation.json
@@ -155,7 +155,7 @@
         "pc-macos": {
           "tick_us": [
             8,
-            21
+            26
           ],
           "free_heap": [
             0,
@@ -167,7 +167,7 @@
           ],
           "at": [
             "2026-06-13",
-            "2026-06-24"
+            "2026-06-25"
           ]
         }
       }
diff --git a/test/scenarios/light/scenario_Layers_composition.json b/test/scenarios/light/scenario_Layers_composition.json
new file mode 100644
index 0000000..c8810bb
--- /dev/null
+++ b/test/scenarios/light/scenario_Layers_composition.json
@@ -0,0 +1,128 @@
+{
+  "name": "scenario_Layers_composition",
+  "module": "Layers",
+  "mode": "construct",
+  "also": [
+    "Layer",
+    "GridLayout",
+    "RainbowEffect",
+    "CheckerboardEffect",
+    "Drivers",
+    "NetworkSendDriver"
+  ],
+  "description": "Multi-layer composition end-to-end: Layouts→Grid, TWO Layers under one Layers container (bottom Checkerboard, top Rainbow), Drivers→NetworkSendDriver. Proves the Drivers composite loop builds, allocates its output buffer, blends both enabled layers and feeds the result to the driver without crashing, and gates the bounded FPS so the N-pass composite cost is tracked. The exact alpha/additive blend math and the disable-drops-to-single-layer path are pinned by the unit tests (unit_BlendMap, unit_Layers_container); construct-mode set_control can't apply controls (built post-scheduler), so this scenario uses each Layer's default blend (alpha, full opacity) and asserts wired liveness + tick, not per-byte blend output.",
+  "steps": [
+    {
+      "name": "add-layout-group",
+      "description": "Top-level Layouts container.",
+      "op": "add_module",
+      "id": "Layouts",
+      "type": "Layouts"
+    },
+    {
+      "name": "add-grid",
+      "description": "128x128 GridLayout under Layouts (above host clock resolution so the composite tick is measurable).",
+      "op": "add_module",
+      "id": "Grid",
+      "type": "GridLayout",
+      "parent_id": "Layouts",
+      "props": {
+        "width": 128,
+        "height": 128
+      }
+    },
+    {
+      "name": "add-layers-group",
+      "description": "Top-level Layers container — the multi-layer composition host.",
+      "op": "add_module",
+      "id": "Layers",
+      "type": "Layers",
+      "props": {
+        "layouts": "Layouts"
+      }
+    },
+    {
+      "name": "add-bottom-layer",
+      "description": "Bottom Layer (composited first — clears + overwrites the output buffer). RGB.",
+      "op": "add_module",
+      "id": "LayerBottom",
+      "type": "Layer",
+      "parent_id": "Layers",
+      "props": {
+        "channelsPerLight": 3
+      }
+    },
+    {
+      "name": "add-bottom-effect",
+      "description": "A Checkerboard base as the bottom layer's effect.",
+      "op": "add_module",
+      "id": "Checker",
+      "type": "CheckerboardEffect",
+      "parent_id": "LayerBottom"
+    },
+    {
+      "name": "add-top-layer",
+      "description": "Top Layer (composited second — blends onto the bottom with its default blend). RGB.",
+      "op": "add_module",
+      "id": "LayerTop",
+      "type": "Layer",
+      "parent_id": "Layers",
+      "props": {
+        "channelsPerLight": 3
+      }
+    },
+    {
+      "name": "add-top-effect",
+      "description": "Rainbow as the top layer's effect — composited over the Checkerboard base.",
+      "op": "add_module",
+      "id": "Rainbow",
+      "type": "RainbowEffect",
+      "parent_id": "LayerTop"
+    },
+    {
+      "name": "add-driver-group",
+      "description": "Top-level Drivers container wired to the Layers container (composites all enabled layers into its output buffer).",
+      "op": "add_module",
+      "id": "Drivers",
+      "type": "Drivers",
+      "props": {
+        "layers": "Layers"
+      }
+    },
+    {
+      "name": "add-artnet",
+      "description": "Add NetworkSendDriver and run the bounded FPS measurement over the two-layer composite (min_pct gates on hardware; skipped with a WARN in the desktop runner).",
+      "op": "add_module",
+      "id": "ArtNet",
+      "type": "NetworkSendDriver",
+      "parent_id": "Drivers",
+      "measure": true,
+      "bounds": {
+        "fps": {
+          "min_pct": 80,
+          "min_fps_led_product": 294912
+        }
+      },
+      "observed": {
+        "pc-macos": {
+          "tick_us": [
+            54,
+            163
+          ],
+          "free_heap": [
+            0,
+            0
+          ],
+          "max_alloc_block": [
+            0,
+            0
+          ],
+          "at": [
+            "2026-06-25",
+            "2026-06-25"
+          ]
+        }
+      }
+    }
+  ]
+}
diff --git a/test/scenarios/light/scenario_Layouts_mutation.json b/test/scenarios/light/scenario_Layouts_mutation.json
index 4ef3a78..66baeaf 100644
--- a/test/scenarios/light/scenario_Layouts_mutation.json
+++ b/test/scenarios/light/scenario_Layouts_mutation.json
@@ -79,7 +79,7 @@
         "pc-macos": {
           "tick_us": [
             8,
-            35
+            40
           ],
           "free_heap": [
             0,
@@ -91,7 +91,7 @@
           ],
           "at": [
             "2026-06-05",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "pc-windows": {
@@ -158,7 +158,7 @@
         "pc-macos": {
           "tick_us": [
             9,
-            82
+            84
           ],
           "free_heap": [
             0,
@@ -170,7 +170,7 @@
           ],
           "at": [
             "2026-06-05",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "pc-windows": {
@@ -232,7 +232,7 @@
         "pc-macos": {
           "tick_us": [
             10,
-            225
+            271
           ],
           "free_heap": [
             0,
@@ -244,7 +244,7 @@
           ],
           "at": [
             "2026-06-05",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "pc-windows": {
diff --git a/test/scenarios/light/scenario_MultiplyModifier_pipeline.json b/test/scenarios/light/scenario_MultiplyModifier_pipeline.json
index 5c7a5e2..93f031d 100644
--- a/test/scenarios/light/scenario_MultiplyModifier_pipeline.json
+++ b/test/scenarios/light/scenario_MultiplyModifier_pipeline.json
@@ -90,7 +90,7 @@
         "pc-macos": {
           "tick_us": [
             1,
-            249
+            272
           ],
           "free_heap": [
             0,
@@ -102,7 +102,7 @@
           ],
           "at": [
             "2026-06-02",
-            "2026-06-24"
+            "2026-06-25"
           ]
         },
         "pc-windows": {
diff --git a/test/scenarios/light/scenario_modifier_swap.json b/test/scenarios/light/scenario_modifier_swap.json
index f2d1ba1..927dc9a 100644
--- a/test/scenarios/light/scenario_modifier_swap.json
+++ b/test/scenarios/light/scenario_modifier_swap.json
@@ -184,6 +184,60 @@
             "2026-06-07",
             "2026-06-08"
           ]
+        },
+        "esp32p4-eth": {
+          "tick_us": [
+            165,
+            179
+          ],
+          "free_heap": [
+            34041219,
+            34041231
+          ],
+          "max_alloc_block": [
+            385024,
+            385024
+          ],
+          "at": [
+            "2026-06-25",
+            "2026-06-25"
+          ]
+        },
+        "esp32s3-n16r8": {
+          "tick_us": [
+            389,
+            564
+          ],
+          "free_heap": [
+            8550715,
+            8550879
+          ],
+          "max_alloc_block": [
+            94208,
+            94208
+          ],
+          "at": [
+            "2026-06-25",
+            "2026-06-25"
+          ]
+        },
+        "esp32": {
+          "tick_us": [
+            459,
+            561
+          ],
+          "free_heap": [
+            148616,
+            148900
+          ],
+          "max_alloc_block": [
+            110592,
+            110592
+          ],
+          "at": [
+            "2026-06-25",
+            "2026-06-25"
+          ]
         }
       }
     },
@@ -202,7 +256,7 @@
         "pc-macos": {
           "tick_us": [
             17,
-            57
+            63
           ],
           "free_heap": [
             0,
@@ -214,7 +268,7 @@
           ],
           "at": [
             "2026-06-07",
-            "2026-06-11"
+            "2026-06-25"
           ]
         },
         "esp32-eth": {
@@ -234,6 +288,60 @@
             "2026-06-07",
             "2026-06-08"
           ]
+        },
+        "esp32p4-eth": {
+          "tick_us": [
+            362,
+            364
+          ],
+          "free_heap": [
+            34039983,
+            34039995
+          ],
+          "max_alloc_block": [
+            385024,
+            385024
+          ],
+          "at": [
+            "2026-06-25",
+            "2026-06-25"
+          ]
+        },
+        "esp32s3-n16r8": {
+          "tick_us": [
+            1060,
+            1082
+          ],
+          "free_heap": [
+            8549471,
+            8549607
+          ],
+          "max_alloc_block": [
+            94208,
+            94208
+          ],
+          "at": [
+            "2026-06-25",
+            "2026-06-25"
+          ]
+        },
+        "esp32": {
+          "tick_us": [
+            1085,
+            1121
+          ],
+          "free_heap": [
+            148044,
+            148064
+          ],
+          "max_alloc_block": [
+            110592,
+            110592
+          ],
+          "at": [
+            "2026-06-25",
+            "2026-06-25"
+          ]
         }
       }
     },
@@ -252,7 +360,7 @@
         "pc-macos": {
           "tick_us": [
             6,
-            15
+            22
           ],
           "free_heap": [
             0,
@@ -264,7 +372,7 @@
           ],
           "at": [
             "2026-06-07",
-            "2026-06-11"
+            "2026-06-25"
           ]
         },
         "esp32-eth": {
@@ -284,6 +392,60 @@
             "2026-06-07",
             "2026-06-08"
           ]
+        },
+        "esp32p4-eth": {
+          "tick_us": [
+            156,
+            158
+          ],
+          "free_heap": [
+            34041219,
+            34041231
+          ],
+          "max_alloc_block": [
+            385024,
+            385024
+          ],
+          "at": [
+            "2026-06-25",
+            "2026-06-25"
+          ]
+        },
+        "esp32s3-n16r8": {
+          "tick_us": [
+            384,
+            466
+          ],
+          "free_heap": [
+            8549087,
+            8550715
+          ],
+          "max_alloc_block": [
+            94208,
+            94208
+          ],
+          "at": [
+            "2026-06-25",
+            "2026-06-25"
+          ]
+        },
+        "esp32": {
+          "tick_us": [
+            453,
+            481
+          ],
+          "free_heap": [
+            148608,
+            148916
+          ],
+          "max_alloc_block": [
+            110592,
+            110592
+          ],
+          "at": [
+            "2026-06-25",
+            "2026-06-25"
+          ]
         }
       }
     }
diff --git a/test/scenarios/light/scenario_perf_full.json b/test/scenarios/light/scenario_perf_full.json
index 05413dc..d444512 100644
--- a/test/scenarios/light/scenario_perf_full.json
+++ b/test/scenarios/light/scenario_perf_full.json
@@ -87,7 +87,7 @@
         "pc-macos": {
           "tick_us": [
             0,
-            0
+            1
           ],
           "free_heap": [
             0,
@@ -99,7 +99,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
@@ -109,25 +109,25 @@
           ],
           "free_heap": [
             8540003,
-            8546675
+            8552543
           ],
           "max_alloc_block": [
-            106496,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            129,
-            129
+            112,
+            130
           ],
           "free_heap": [
             137376,
-            137376
+            150116
           ],
           "max_alloc_block": [
             110592,
@@ -135,17 +135,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
-            58,
+            57,
             67
           ],
           "free_heap": [
             34023535,
-            34042067
+            34043067
           ],
           "max_alloc_block": [
             385024,
@@ -153,7 +153,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -176,7 +176,7 @@
         "pc-macos": {
           "tick_us": [
             0,
-            0
+            1
           ],
           "free_heap": [
             0,
@@ -188,7 +188,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
@@ -198,25 +198,25 @@
           ],
           "free_heap": [
             8538439,
-            8546019
+            8552531
           ],
           "max_alloc_block": [
-            106496,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            116,
+            101,
             116
           ],
           "free_heap": [
             137676,
-            137676
+            150108
           ],
           "max_alloc_block": [
             110592,
@@ -224,7 +224,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -234,7 +234,7 @@
           ],
           "free_heap": [
             34025103,
-            34041643
+            34043067
           ],
           "max_alloc_block": [
             385024,
@@ -242,7 +242,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -265,7 +265,7 @@
         "pc-macos": {
           "tick_us": [
             0,
-            0
+            1
           ],
           "free_heap": [
             0,
@@ -277,35 +277,35 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
           "tick_us": [
             101,
-            115
+            129
           ],
           "free_heap": [
             8536747,
-            8545823
+            8552527
           ],
           "max_alloc_block": [
-            102400,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            116,
+            101,
             116
           ],
           "free_heap": [
             134032,
-            134032
+            149816
           ],
           "max_alloc_block": [
             110592,
@@ -313,7 +313,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -323,7 +323,7 @@
           ],
           "free_heap": [
             34023519,
-            34041019
+            34043067
           ],
           "max_alloc_block": [
             385024,
@@ -331,7 +331,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -352,7 +352,7 @@
         "pc-macos": {
           "tick_us": [
             0,
-            0
+            1
           ],
           "free_heap": [
             0,
@@ -364,7 +364,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
@@ -374,25 +374,25 @@
           ],
           "free_heap": [
             8536423,
-            8544003
+            8550727
           ],
           "max_alloc_block": [
-            106496,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            315,
-            315
+            293,
+            359
           ],
           "free_heap": [
             132632,
-            132632
+            148920
           ],
           "max_alloc_block": [
             110592,
@@ -400,17 +400,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
             94,
-            106
+            114
           ],
           "free_heap": [
             34021595,
-            34039211
+            34041231
           ],
           "max_alloc_block": [
             385024,
@@ -418,7 +418,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -446,7 +446,7 @@
         "pc-macos": {
           "tick_us": [
             0,
-            0
+            5
           ],
           "free_heap": [
             0,
@@ -458,7 +458,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
@@ -468,7 +468,7 @@
           ],
           "free_heap": [
             8535099,
-            8545827
+            8552527
           ],
           "max_alloc_block": [
             94208,
@@ -476,17 +476,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            115,
+            105,
             115
           ],
           "free_heap": [
             126208,
-            126208
+            150108
           ],
           "max_alloc_block": [
             110592,
@@ -494,17 +494,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
-            56,
+            55,
             63
           ],
           "free_heap": [
             34024991,
-            34041015
+            34043067
           ],
           "max_alloc_block": [
             385024,
@@ -512,7 +512,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -533,7 +533,7 @@
         "pc-macos": {
           "tick_us": [
             0,
-            0
+            1
           ],
           "free_heap": [
             0,
@@ -545,7 +545,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
@@ -555,7 +555,7 @@
           ],
           "free_heap": [
             8533659,
-            8544519
+            8551087
           ],
           "max_alloc_block": [
             86016,
@@ -563,17 +563,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
             139,
-            139
+            164
           ],
           "free_heap": [
             134168,
-            134168
+            148380
           ],
           "max_alloc_block": [
             110592,
@@ -581,7 +581,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -591,7 +591,7 @@
           ],
           "free_heap": [
             34023679,
-            34038003
+            34041623
           ],
           "max_alloc_block": [
             385024,
@@ -599,7 +599,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -631,7 +631,7 @@
         "pc-macos": {
           "tick_us": [
             0,
-            0
+            1
           ],
           "free_heap": [
             0,
@@ -643,17 +643,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
           "tick_us": [
             108,
-            120
+            139
           ],
           "free_heap": [
             8506847,
-            8520667
+            8527371
           ],
           "max_alloc_block": [
             86016,
@@ -661,25 +661,25 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            152,
+            109,
             152
           ],
           "free_heap": [
             108912,
-            108912
+            124952
           ],
           "max_alloc_block": [
             86016,
-            86016
+            110592
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -689,7 +689,7 @@
           ],
           "free_heap": [
             33996811,
-            34015891
+            34017903
           ],
           "max_alloc_block": [
             385024,
@@ -697,7 +697,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -751,26 +751,26 @@
             142
           ],
           "free_heap": [
-            8536135,
-            8545247
+            8533127,
+            8551951
           ],
           "max_alloc_block": [
-            94208,
+            90112,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            119,
+            101,
             119
           ],
           "free_heap": [
             128832,
-            128832
+            150112
           ],
           "max_alloc_block": [
             110592,
@@ -778,17 +778,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
             56,
-            62
+            63
           ],
           "free_heap": [
             34022847,
-            34040463
+            34042483
           ],
           "max_alloc_block": [
             385024,
@@ -796,7 +796,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -851,25 +851,25 @@
           ],
           "free_heap": [
             8537691,
-            8545823
+            8552603
           ],
           "max_alloc_block": [
-            106496,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            118,
+            101,
             118
           ],
           "free_heap": [
             138424,
-            138424
+            150316
           ],
           "max_alloc_block": [
             110592,
@@ -877,7 +877,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -887,7 +887,7 @@
           ],
           "free_heap": [
             34022855,
-            34040471
+            34042491
           ],
           "max_alloc_block": [
             385024,
@@ -895,7 +895,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -960,25 +960,25 @@
           ],
           "free_heap": [
             8535703,
-            8545827
+            8552535
           ],
           "max_alloc_block": [
-            102400,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            149,
+            102,
             149
           ],
           "free_heap": [
             137384,
-            137384
+            150100
           ],
           "max_alloc_block": [
             110592,
@@ -986,7 +986,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -996,7 +996,7 @@
           ],
           "free_heap": [
             34023427,
-            34041007
+            34043067
           ],
           "max_alloc_block": [
             385024,
@@ -1004,7 +1004,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -1053,25 +1053,25 @@
           ],
           "free_heap": [
             8531251,
-            8543527
+            8550235
           ],
           "max_alloc_block": [
-            102400,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            357,
+            297,
             357
           ],
           "free_heap": [
             136808,
-            136808
+            147516
           ],
           "max_alloc_block": [
             110592,
@@ -1079,17 +1079,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
-            133,
+            132,
             138
           ],
           "free_heap": [
             34022787,
-            34038703
+            34040763
           ],
           "max_alloc_block": [
             385024,
@@ -1097,7 +1097,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -1142,11 +1142,11 @@
         "esp32s3-n16r8": {
           "tick_us": [
             989,
-            1090
+            1118
           ],
           "free_heap": [
             8510995,
-            8534311
+            8541019
           ],
           "max_alloc_block": [
             90112,
@@ -1154,17 +1154,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            1147,
-            1147
+            1123,
+            1150
           ],
           "free_heap": [
             127592,
-            127592
+            138300
           ],
           "max_alloc_block": [
             110592,
@@ -1172,17 +1172,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
-            452,
+            448,
             498
           ],
           "free_heap": [
             34015299,
-            34029487
+            34031547
           ],
           "max_alloc_block": [
             385024,
@@ -1190,7 +1190,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -1235,29 +1235,29 @@
         "esp32s3-n16r8": {
           "tick_us": [
             7488,
-            7949
+            8799
           ],
           "free_heap": [
             8490295,
-            8497459
+            8504331
           ],
           "max_alloc_block": [
-            102400,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            4360,
-            4360
+            4208,
+            4458
           ],
           "free_heap": [
             90728,
-            90728
+            101728
           ],
           "max_alloc_block": [
             63488,
@@ -1265,7 +1265,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -1275,7 +1275,7 @@
           ],
           "free_heap": [
             33978435,
-            33992623
+            33994683
           ],
           "max_alloc_block": [
             385024,
@@ -1283,7 +1283,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -1318,7 +1318,7 @@
         "pc-macos": {
           "tick_us": [
             3,
-            9
+            16
           ],
           "free_heap": [
             0,
@@ -1330,7 +1330,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-24"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
@@ -1340,25 +1340,25 @@
           ],
           "free_heap": [
             8541939,
-            8545831
+            8552519
           ],
           "max_alloc_block": [
-            110592,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            1010,
+            817,
             1010
           ],
           "free_heap": [
             138948,
-            138948
+            150120
           ],
           "max_alloc_block": [
             110592,
@@ -1366,17 +1366,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
-            302,
-            345
+            297,
+            349
           ],
           "free_heap": [
             34026819,
-            34041027
+            34043067
           ],
           "max_alloc_block": [
             385024,
@@ -1384,7 +1384,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -1411,7 +1411,7 @@
         "pc-macos": {
           "tick_us": [
             14,
-            59
+            66
           ],
           "free_heap": [
             0,
@@ -1423,7 +1423,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-21"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
@@ -1433,25 +1433,25 @@
           ],
           "free_heap": [
             8539631,
-            8543527
+            8550215
           ],
           "max_alloc_block": [
-            110592,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
             3203,
-            3203
+            3263
           ],
           "free_heap": [
             136808,
-            136808
+            147524
           ],
           "max_alloc_block": [
             110592,
@@ -1459,17 +1459,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
-            1120,
+            1113,
             1252
           ],
           "free_heap": [
             34024515,
-            34038723
+            34040763
           ],
           "max_alloc_block": [
             385024,
@@ -1477,7 +1477,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -1522,29 +1522,29 @@
         "esp32s3-n16r8": {
           "tick_us": [
             11073,
-            11371
+            11740
           ],
           "free_heap": [
             8530415,
-            8534311
+            8541023
           ],
           "max_alloc_block": [
-            110592,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            13547,
+            12745,
             13547
           ],
           "free_heap": [
             127596,
-            127596
+            138600
           ],
           "max_alloc_block": [
             110592,
@@ -1552,7 +1552,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -1562,7 +1562,7 @@
           ],
           "free_heap": [
             34015299,
-            34029507
+            34031547
           ],
           "max_alloc_block": [
             385024,
@@ -1570,7 +1570,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -1597,7 +1597,7 @@
         "pc-macos": {
           "tick_us": [
             308,
-            639
+            914
           ],
           "free_heap": [
             0,
@@ -1609,35 +1609,35 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-24"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
           "tick_us": [
             48051,
-            51127
+            51959
           ],
           "free_heap": [
             8491607,
-            8497447
+            8504171
           ],
           "max_alloc_block": [
-            106496,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            62316,
+            52644,
             62316
           ],
           "free_heap": [
             90732,
-            90732
+            101444
           ],
           "max_alloc_block": [
             63488,
@@ -1645,17 +1645,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
             17433,
-            18024
+            18626
           ],
           "free_heap": [
             33978435,
-            33992643
+            33994683
           ],
           "max_alloc_block": [
             385024,
@@ -1663,7 +1663,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -1702,21 +1702,21 @@
           ],
           "free_heap": [
             8540231,
-            8543995
+            8550719
           ],
           "max_alloc_block": [
-            110592,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "pc-macos": {
           "tick_us": [
             1,
-            2
+            4
           ],
           "free_heap": [
             0,
@@ -1728,17 +1728,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-24"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            456,
-            456
+            450,
+            495
           ],
           "free_heap": [
             137940,
-            137940
+            148920
           ],
           "max_alloc_block": [
             110592,
@@ -1746,17 +1746,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
             154,
-            164
+            190
           ],
           "free_heap": [
             34021691,
-            34039223
+            34041231
           ],
           "max_alloc_block": [
             385024,
@@ -1764,7 +1764,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -1795,21 +1795,21 @@
           ],
           "free_heap": [
             8528551,
-            8537251
+            8543959
           ],
           "max_alloc_block": [
-            102400,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "pc-macos": {
           "tick_us": [
             3,
-            7
+            170
           ],
           "free_heap": [
             0,
@@ -1821,17 +1821,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-24"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            1808,
-            1808
+            1707,
+            1827
           ],
           "free_heap": [
             133408,
-            133408
+            143808
           ],
           "max_alloc_block": [
             110592,
@@ -1839,7 +1839,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -1849,7 +1849,7 @@
           ],
           "free_heap": [
             34014947,
-            34032479
+            34034487
           ],
           "max_alloc_block": [
             385024,
@@ -1857,7 +1857,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -1884,25 +1884,25 @@
         "esp32s3-n16r8": {
           "tick_us": [
             6165,
-            6552
+            8424
           ],
           "free_heap": [
             8506427,
-            8510275
+            8516999
           ],
           "max_alloc_block": [
-            110592,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "pc-macos": {
           "tick_us": [
             14,
-            30
+            43
           ],
           "free_heap": [
             0,
@@ -1914,17 +1914,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-24"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            6958,
+            6739,
             6958
           ],
           "free_heap": [
             113820,
-            113820
+            124804
           ],
           "max_alloc_block": [
             98304,
@@ -1932,7 +1932,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -1942,7 +1942,7 @@
           ],
           "free_heap": [
             33991055,
-            34005503
+            34007511
           ],
           "max_alloc_block": [
             385024,
@@ -1950,7 +1950,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -1977,25 +1977,25 @@
         "esp32s3-n16r8": {
           "tick_us": [
             28061,
-            33932
+            59546
           ],
           "free_heap": [
             8398527,
-            8402371
+            8409091
           ],
           "max_alloc_block": [
-            110592,
+            94208,
             114688
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "pc-macos": {
           "tick_us": [
             62,
-            134
+            195
           ],
           "free_heap": [
             0,
@@ -2007,35 +2007,35 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-24"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
             28466,
-            28466
+            33544
           ],
           "free_heap": [
             36648,
-            36648
+            47620
           ],
           "max_alloc_block": [
-            26624,
+            24576,
             26624
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
             9846,
-            10184
+            11588
           ],
           "free_heap": [
             33883359,
-            33897599
+            33899607
           ],
           "max_alloc_block": [
             385024,
@@ -2043,7 +2043,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
diff --git a/test/scenarios/light/scenario_perf_light.json b/test/scenarios/light/scenario_perf_light.json
index 195668a..ada97dd 100644
--- a/test/scenarios/light/scenario_perf_light.json
+++ b/test/scenarios/light/scenario_perf_light.json
@@ -120,11 +120,11 @@
         "esp32s3-n16r8": {
           "tick_us": [
             113,
-            149
+            172
           ],
           "free_heap": [
             8515895,
-            8538843
+            8547091
           ],
           "max_alloc_block": [
             81920,
@@ -132,17 +132,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            114,
+            113,
             162
           ],
           "free_heap": [
             127980,
-            134020
+            150456
           ],
           "max_alloc_block": [
             110592,
@@ -150,7 +150,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -160,7 +160,7 @@
           ],
           "free_heap": [
             34024987,
-            34041859
+            34043695
           ],
           "max_alloc_block": [
             385024,
@@ -168,7 +168,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -208,29 +208,29 @@
         "esp32s3-n16r8": {
           "tick_us": [
             248,
-            255
+            313
           ],
           "free_heap": [
             8530367,
-            8535475
+            8545279
           ],
           "max_alloc_block": [
-            98304,
+            94208,
             102400
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            304,
+            103,
             325
           ],
           "free_heap": [
             134620,
-            138024
+            150316
           ],
           "max_alloc_block": [
             110592,
@@ -238,17 +238,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
-            98,
-            104
+            97,
+            116
           ],
           "free_heap": [
             34023155,
-            34039419
+            34041223
           ],
           "max_alloc_block": [
             385024,
@@ -256,7 +256,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -287,30 +287,30 @@
         },
         "esp32s3-n16r8": {
           "tick_us": [
-            238,
-            243
+            234,
+            263
           ],
           "free_heap": [
             8529571,
-            8533923
+            8545271
           ],
           "max_alloc_block": [
-            98304,
+            86016,
             102400
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
-            304,
-            308
+            102,
+            326
           ],
           "free_heap": [
             135620,
-            136192
+            149812
           ],
           "max_alloc_block": [
             110592,
@@ -318,17 +318,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
             93,
-            95
+            96
           ],
           "free_heap": [
             34023147,
-            34039207
+            34041223
           ],
           "max_alloc_block": [
             385024,
@@ -336,7 +336,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -357,7 +357,7 @@
         "pc-macos": {
           "tick_us": [
             1,
-            2
+            3
           ],
           "free_heap": [
             0,
@@ -369,17 +369,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-24"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
           "tick_us": [
             399,
-            406
+            435
           ],
           "free_heap": [
             8532403,
-            8532939
+            8542143
           ],
           "max_alloc_block": [
             90112,
@@ -387,17 +387,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
             306,
-            525
+            876
           ],
           "free_heap": [
             134596,
-            134612
+            149804
           ],
           "max_alloc_block": [
             110592,
@@ -405,7 +405,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
@@ -415,7 +415,7 @@
           ],
           "free_heap": [
             34021587,
-            34039219
+            34041223
           ],
           "max_alloc_block": [
             385024,
@@ -423,7 +423,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -450,7 +450,7 @@
         "pc-macos": {
           "tick_us": [
             3,
-            8
+            11
           ],
           "free_heap": [
             0,
@@ -462,7 +462,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-24"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
@@ -471,26 +471,26 @@
             1778
           ],
           "free_heap": [
-            8530103,
+            8528343,
             8533407
           ],
           "max_alloc_block": [
-            102400,
+            86016,
             106496
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
             1211,
-            1856
+            3774
           ],
           "free_heap": [
             133364,
-            133396
+            147500
           ],
           "max_alloc_block": [
             110592,
@@ -498,17 +498,17 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
             532,
-            550
+            624
           ],
           "free_heap": [
             34018071,
-            34032475
+            34034479
           ],
           "max_alloc_block": [
             385024,
@@ -516,7 +516,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
@@ -543,7 +543,7 @@
         "pc-macos": {
           "tick_us": [
             14,
-            35
+            44
           ],
           "free_heap": [
             0,
@@ -555,53 +555,53 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-24"
+            "2026-06-25"
           ]
         },
         "esp32s3-n16r8": {
           "tick_us": [
-            6386,
-            6830
+            6184,
+            7729
           ],
           "free_heap": [
-            8504719,
-            8506427
+            8501355,
+            8517015
           ],
           "max_alloc_block": [
-            98304,
+            94208,
             110592
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32": {
           "tick_us": [
             4412,
-            6633
+            12962
           ],
           "free_heap": [
             113668,
-            113788
+            138576
           ],
           "max_alloc_block": [
             90112,
-            98304
+            110592
           ],
           "at": [
             "2026-06-17",
-            "2026-06-17"
+            "2026-06-25"
           ]
         },
         "esp32p4-eth": {
           "tick_us": [
             2038,
-            2115
+            2432
           ],
           "free_heap": [
             33991263,
-            34005499
+            34007503
           ],
           "max_alloc_block": [
             385024,
@@ -609,7 +609,7 @@
           ],
           "at": [
             "2026-06-17",
-            "2026-06-22"
+            "2026-06-25"
           ]
         }
       }
diff --git a/test/unit/core/unit_FilesystemModule_persistence.cpp b/test/unit/core/unit_FilesystemModule_persistence.cpp
index df96a54..4cb1f3b 100644
--- a/test/unit/core/unit_FilesystemModule_persistence.cpp
+++ b/test/unit/core/unit_FilesystemModule_persistence.cpp
@@ -9,6 +9,7 @@
 #include "light/effects/NoiseEffect.h"
 #include "light/effects/RainbowEffect.h"
 #include "light/modifiers/MultiplyModifier.h"
+#include "light/modifiers/RegionModifier.h"
 #include "light/layers/Layer.h"
 #include "platform/platform.h"
 
@@ -364,7 +365,7 @@ TEST_CASE("FilesystemModule singleton survives probe construct+destruct") {
 // which default to 0,0 because ControlDescriptor.min/max are uint8_t and can't
 // represent an int16 range. Every Int16 control loaded as 0 — so a 128×128 grid
 // became 0×0×0 after restart and the whole pipeline allocated no buffers.
-// Int16 controls (GridLayout width/height, Layer start/end) preserve their saved value across load — no zero-clamping from uint8 min/max bounds.
+// Int16 controls (GridLayout width/height, RegionModifier start/end) preserve their saved value across load — no zero-clamping from uint8 min/max bounds.
 TEST_CASE("FilesystemModule Int16 controls round-trip preserves the saved value") {
     char tmpRoot[256];
     std::snprintf(tmpRoot, sizeof(tmpRoot), "/tmp/mm_int16_test_%u",
@@ -373,9 +374,10 @@ TEST_CASE("FilesystemModule Int16 controls round-trip preserves the saved value"
     std::filesystem::create_directories(std::string(tmpRoot) + "/.config");
     mm::platform::fsSetRoot(tmpRoot);
 
-    // Hand-write a Layer.json with non-zero Int16 values so the load path is
-    // exercised without needing a save-side step.
-    std::ofstream out(std::string(tmpRoot) + "/.config/Layer.json");
+    // Hand-write a RegionModifier.json with non-zero Int16 values (including
+    // negatives, which are legal on the wire) so the load path is exercised
+    // without needing a save-side step.
+    std::ofstream out(std::string(tmpRoot) + "/.config/RegionModifier.json");
     out << "{\"enabled\":true,\"startX\":42,\"startY\":-17,\"startZ\":0,"
         << "\"endX\":100,\"endY\":-100,\"endZ\":0}";
     out.close();
@@ -384,16 +386,16 @@ TEST_CASE("FilesystemModule Int16 controls round-trip preserves the saved value"
     auto* fs = new mm::FilesystemModule();
     fs->setTypeName("FilesystemModule");
     fs->setScheduler(&scheduler);
-    auto* layer = new mm::Layer();
-    layer->setTypeName("Layer");
+    auto* region = new mm::RegionModifier();
+    region->setTypeName("RegionModifier");
     scheduler.addModule(fs);
-    scheduler.addModule(layer);
+    scheduler.addModule(region);
     scheduler.setup();
 
-    CHECK(layer->startX == 42);
-    CHECK(layer->startY == -17);
-    CHECK(layer->endX == 100);
-    CHECK(layer->endY == -100);
+    CHECK(region->startX == 42);
+    CHECK(region->startY == -17);
+    CHECK(region->endX == 100);
+    CHECK(region->endY == -100);
 
     scheduler.teardown();
     std::filesystem::remove_all(tmpRoot);
diff --git a/test/unit/core/unit_FirmwareUpdateModule.cpp b/test/unit/core/unit_FirmwareUpdateModule.cpp
index 20e4ca6..a17b6b8 100644
--- a/test/unit/core/unit_FirmwareUpdateModule.cpp
+++ b/test/unit/core/unit_FirmwareUpdateModule.cpp
@@ -5,8 +5,8 @@
 #include <cstring>
 
 // The `firmware` control is always present and non-empty (either a real firmware key from
-// build_info.h or the fallback "unknown"). Moved here from SystemModule — the firmware card now
-// owns firmware identity (version/build/firmware) + the partition usage.
+// build_info.h or the fallback "unknown"). The firmware card owns firmware identity
+// (version/build/firmware) + the partition usage.
 TEST_CASE("FirmwareUpdateModule firmware control populated") {
     // The firmware control is wired in setup() from kFirmwareName (build_info.h).
     // Local desktop builds fall through to "unknown" because CMake doesn't
@@ -45,3 +45,34 @@ TEST_CASE("FirmwareUpdateModule firmware control populated") {
     CHECK(hasVersion);
     CHECK(hasBuild);
 }
+
+// OTA phase is surfaced through the shared status slot (MoonModule::setStatus()),
+// not a control. publishStatus() runs in setup()/loop1s() and maps the platform
+// OTA status string to a severity: "idle" clears the banner, an "error: " prefix
+// is Severity::Error, anything else is neutral Severity::Status.
+TEST_CASE("FirmwareUpdateModule OTA status routes through the status slot") {
+    mm::FirmwareUpdateModule fw;
+
+    // Boot state: write "idle" into g_otaStatus explicitly (no reliance on its prior contents) → no banner.
+    std::strncpy(mm::g_otaStatus, "idle", sizeof(mm::g_otaStatus));
+    fw.setup();
+    CHECK(fw.status() == nullptr);
+
+    // An in-flight phase shows as a neutral status banner carrying the phase text verbatim.
+    std::strncpy(mm::g_otaStatus, "downloading", sizeof(mm::g_otaStatus));
+    fw.loop1s();
+    REQUIRE(fw.status() != nullptr);  // REQUIRE, not CHECK: the strcmp below would dereference a null status
+    CHECK(std::strcmp(fw.status(), "downloading") == 0);
+    CHECK(fw.severity() == mm::MoonModule::Severity::Status);
+
+    // A failure (platform prefixes every failure with "error: ") is an error banner.
+    std::strncpy(mm::g_otaStatus, "error: ota perform ESP_FAIL", sizeof(mm::g_otaStatus));  // NOTE(review): strncpy leaves no NUL if the buffer is <= 27 bytes — confirm g_otaStatus is larger
+    fw.loop1s();
+    REQUIRE(fw.status() != nullptr);
+    CHECK(fw.severity() == mm::MoonModule::Severity::Error);  // only the severity is pinned here, not the banner text
+
+    // Returning to idle clears the banner again (and leaves g_otaStatus as "idle" when the test ends).
+    std::strncpy(mm::g_otaStatus, "idle", sizeof(mm::g_otaStatus));
+    fw.loop1s();
+    CHECK(fw.status() == nullptr);
+}
diff --git a/test/unit/light/unit_BlendMap.cpp b/test/unit/light/unit_BlendMap.cpp
index d6911f4..9fdd39d 100644
--- a/test/unit/light/unit_BlendMap.cpp
+++ b/test/unit/light/unit_BlendMap.cpp
@@ -118,8 +118,9 @@ TEST_CASE("blendMap is identical for single-alloc and paged LUTs") {
 
 // An additive (overwrites=false) LUT folding two sources onto one physical light
 // adds and clamps at 255 (no overflow). overwrites=false is the opt-in for the
-// rare overlap case (future multi-layer compositing); the default copy path
-// would instead overwrite, so this pins the additive contract explicitly.
+// within-layer overlap case; the default copy path would instead overwrite, and a
+// full-opacity Overwrite op still routes through this additive accumulate, so this
+// pins the contract explicitly (the regression after the multi-layer rewrite).
 TEST_CASE("blendMap additive clamping (overwrites=false)") {
     mm::Buffer src, dst;
     src.allocate(1, 3);
@@ -198,3 +199,151 @@ TEST_CASE("blendMap overwrite path clears untouched cells (sparse mapping)") {
     CHECK(dst.data()[3] == 0); CHECK(dst.data()[4] == 0); CHECK(dst.data()[5] == 0);
     CHECK(dst.data()[9] == 0); CHECK(dst.data()[10] == 0); CHECK(dst.data()[11] == 0);
 }
+
+// --- Multi-layer composition: BlendOp + opacity + clearFirst (the new params). ---
+
+// Build an identity LUT (1 logical → 1 physical) in place — MappingLUT owns a
+// heap buffer and is non-copyable, so it can't be returned by value.
+static void buildIdentityLut1(mm::MappingLUT& lut) {
+    mm::nrOfLightsType onlyDest[] = {0};   // logical 0 → physical 0
+    lut.build(1, 1);
+    lut.setMapping(0, onlyDest, 1);
+    lut.finalize();
+}
+
+// Alpha-over at half opacity: dst = div255(src*α + dst*(255-α)). With dst=200, src=100,
+// α=128 → 100*128 + 200*127 = 12800 + 25400 = 38200; div255 = 149 (149.8, not rounded up to 150).
+TEST_CASE("blendMap alpha-over blends src over dst by opacity") {
+    mm::Buffer top, frame;
+    top.allocate(1, 3); frame.allocate(1, 3);
+    for (int ch = 0; ch < 3; ch++) { top.data()[ch] = 100; frame.data()[ch] = 200; }
+    mm::MappingLUT identity; buildIdentityLut1(identity);
+    // clearFirst=false → blend ONTO what frame already holds (a layer above the bottom one).
+    mm::blendMap(top, frame, identity, 3, mm::BlendOp::Alpha, /*opacity=*/128, /*clearFirst=*/false);
+    // div255(100*128 + 200*127) = div255(38200) = 149 on every channel.
+    for (int ch = 0; ch < 3; ch++) {
+        CHECK(frame.data()[ch] == 149);
+    }
+}
+
+// Alpha at full opacity collapses to overwrite (src replaces dst exactly).
+TEST_CASE("blendMap alpha at opacity 255 == overwrite") {
+    const unsigned char rgb[3] = {10, 20, 30};   // source colour, reused as the expectation
+    mm::Buffer top, frame;
+    top.allocate(1, 3); frame.allocate(1, 3);
+    for (int ch = 0; ch < 3; ch++) { top.data()[ch] = rgb[ch]; frame.data()[ch] = 99; }
+    mm::MappingLUT identity; buildIdentityLut1(identity);
+    mm::blendMap(top, frame, identity, 3, mm::BlendOp::Alpha, 255, /*clearFirst=*/false);
+    for (int ch = 0; ch < 3; ch++) CHECK(frame.data()[ch] == rgb[ch]);  // the 99s are replaced exactly
+}
+
+// Alpha at opacity 0 is a no-op (dst unchanged) — the invisible-layer case.
+TEST_CASE("blendMap alpha at opacity 0 leaves dst unchanged") {
+    mm::Buffer top, frame;
+    top.allocate(1, 3); frame.allocate(1, 3);
+    for (int ch = 0; ch < 3; ch++) { top.data()[ch] = 200; frame.data()[ch] = 77; }
+    mm::MappingLUT identity; buildIdentityLut1(identity);
+    // Opacity 0: none of the source's 200s may show up in frame.
+    mm::blendMap(top, frame, identity, 3, mm::BlendOp::Alpha, 0, /*clearFirst=*/false);
+    for (int ch = 0; ch < 3; ch++) CHECK(frame.data()[ch] == 77);
+}
+
+// Additive with opacity scales the source before adding, then clamps. dst=100,
+// src=200, opacity=128 → add 200*128/255 ≈ 100 → 200.
+TEST_CASE("blendMap additive scales source by opacity then clamps") {
+    mm::Buffer top, frame;
+    top.allocate(1, 3); frame.allocate(1, 3);
+    for (int ch = 0; ch < 3; ch++) { top.data()[ch] = 200; frame.data()[ch] = 100; }
+    mm::MappingLUT identity; buildIdentityLut1(identity);
+    mm::blendMap(top, frame, identity, 3, mm::BlendOp::Additive, /*opacity=*/128, /*clearFirst=*/false);
+    // Scaled source 200*128/255 = 100, added to the existing 100 → 200 per channel.
+    for (int ch = 0; ch < 3; ch++) {
+        CHECK(frame.data()[ch] == 200);
+    }
+}
+
+// clearFirst=false preserves dst cells the source doesn't touch — the mechanic
+// that lets a top layer blend onto the bottom layer's already-composited frame.
+TEST_CASE("blendMap clearFirst=false accumulates onto existing frame") {
+    mm::Buffer src, dst;
+    src.allocate(2, 3); dst.allocate(2, 3);
+    // src lights only physical 0; physical 1 left to the previous (bottom) layer.
+    src.data()[0] = src.data()[1] = src.data()[2] = 50;
+    src.data()[3] = src.data()[4] = src.data()[5] = 0;
+    // dst holds a prior frame: physical 1 is green from the layer below.
+    dst.data()[0] = dst.data()[1] = dst.data()[2] = 0;
+    dst.data()[3] = 0; dst.data()[4] = 255; dst.data()[5] = 0;
+
+    mm::MappingLUT lut;
+    lut.build(2, 1);
+    mm::nrOfLightsType m0[] = {0}, m1[] = {1};
+    lut.setMapping(0, m0, 1); lut.setMapping(1, m1, 1);
+    lut.finalize();
+
+    mm::blendMap(src, dst, lut, 3, mm::BlendOp::Additive, 255, /*clearFirst=*/false);
+    // All six bytes are pinned: physical 0 = 0 + 50 per channel; physical 1 = prior (0,255,0) + 0.
+    CHECK(dst.data()[0] == 50); CHECK(dst.data()[1] == 50); CHECK(dst.data()[2] == 50);
+    CHECK(dst.data()[3] == 0); CHECK(dst.data()[4] == 255); CHECK(dst.data()[5] == 0);
+}
+
+// --- No-LUT (dense grid, identity 1:1) blend paths. blendMap has a SEPARATE
+// implementation for a layer with no LUT (logical index == physical index, no
+// lookup) — the common dense-grid case that composites directly. These mirror
+// the LUT blend tests above but on the no-LUT branch (an empty MappingLUT, so
+// hasLUT()==false). This is the path that runs on a real grid layer; it was the
+// one that initially failed to composite, so each op is pinned here explicitly.
+
+// No-LUT alpha-over at half opacity: dst = div255(src*α + dst*(255-α)).
+// dst=200, src=100, α=128 → div255(100*128 + 200*127) = div255(38200) = 149.
+TEST_CASE("blendMap no-LUT alpha-over blends 1:1 by opacity") {
+    mm::Buffer top, frame;
+    top.allocate(2, 3); frame.allocate(2, 3);
+    mm::MappingLUT noLut;   // never built → hasLUT()==false (identity 1:1)
+    for (size_t b = 0; b < top.bytes(); b++) { top.data()[b] = 100; frame.data()[b] = 200; }
+    mm::blendMap(top, frame, noLut, 3, mm::BlendOp::Alpha, /*opacity=*/128, /*clearFirst=*/false);
+    for (size_t b = 0; b < frame.bytes(); b++) CHECK(frame.data()[b] == 149);  // div255(38200)
+}
+
+// No-LUT alpha at full opacity collapses to a plain copy (overwrite).
+TEST_CASE("blendMap no-LUT alpha at opacity 255 == overwrite") {
+    const unsigned char rgb[3] = {10, 20, 30};   // source colour, reused as the expectation
+    mm::Buffer top, frame;
+    top.allocate(1, 3); frame.allocate(1, 3);
+    for (int ch = 0; ch < 3; ch++) { top.data()[ch] = rgb[ch]; frame.data()[ch] = 99; }
+    mm::MappingLUT noLut;   // left unbuilt
+    mm::blendMap(top, frame, noLut, 3, mm::BlendOp::Alpha, 255, /*clearFirst=*/false);
+    for (int ch = 0; ch < 3; ch++) CHECK(frame.data()[ch] == rgb[ch]);
+}
+
+// No-LUT alpha at opacity 0 is a no-op (the invisible top layer).
+TEST_CASE("blendMap no-LUT alpha at opacity 0 leaves dst unchanged") {
+    mm::Buffer top, frame;
+    top.allocate(1, 3); frame.allocate(1, 3);
+    for (int ch = 0; ch < 3; ch++) { top.data()[ch] = 200; frame.data()[ch] = 77; }
+    mm::MappingLUT noLut;   // left unbuilt
+    // Opacity 0: the 77s already in frame must survive untouched.
+    mm::blendMap(top, frame, noLut, 3, mm::BlendOp::Alpha, 0, /*clearFirst=*/false);
+    for (int ch = 0; ch < 3; ch++) CHECK(frame.data()[ch] == 77);
+}
+
+// No-LUT additive with opacity scales the source then clamps at 255.
+// dst=100, src=200, opacity=128 → 100 + div255(200*128)=100 → 200.
+TEST_CASE("blendMap no-LUT additive scales by opacity then clamps") {
+    mm::Buffer top, frame;
+    top.allocate(2, 3); frame.allocate(2, 3);
+    mm::MappingLUT noLut;   // left unbuilt
+    for (size_t b = 0; b < top.bytes(); b++) { top.data()[b] = 200; frame.data()[b] = 100; }
+    mm::blendMap(top, frame, noLut, 3, mm::BlendOp::Additive, /*opacity=*/128, /*clearFirst=*/false);
+    for (size_t b = 0; b < frame.bytes(); b++) CHECK(frame.data()[b] == 200);  // 100 + div255(200*128)
+}
+
+// No-LUT additive at full opacity saturates: 200 + 100 = 300 → clamp 255.
+TEST_CASE("blendMap no-LUT additive clamps at 255") {
+    mm::Buffer top, frame;
+    top.allocate(1, 3); frame.allocate(1, 3);
+    for (int ch = 0; ch < 3; ch++) { top.data()[ch] = 200; frame.data()[ch] = 100; }
+    mm::MappingLUT noLut;   // left unbuilt
+    // 100 + 200 = 300 exceeds a byte, so every channel must saturate at 255.
+    mm::blendMap(top, frame, noLut, 3, mm::BlendOp::Additive, 255, /*clearFirst=*/false);
+    for (int ch = 0; ch < 3; ch++) CHECK(frame.data()[ch] == 255);
+}
diff --git a/test/unit/light/unit_Layer_sparse_mapping.cpp b/test/unit/light/unit_Layer_sparse_mapping.cpp
index f2249fb..a02bf91 100644
--- a/test/unit/light/unit_Layer_sparse_mapping.cpp
+++ b/test/unit/light/unit_Layer_sparse_mapping.cpp
@@ -6,6 +6,7 @@
 #include "light/layouts/GridLayout.h"
 #include "light/layouts/SphereLayout.h"
 #include "light/modifiers/MultiplyModifier.h"
+#include "light/modifiers/RegionModifier.h"
 
 // The driver/output buffer must hold ONLY the real lights, never the dense
 // bounding box. A sphere defines a 9x9x9 (=729) render grid but only 210 shell
@@ -179,3 +180,55 @@ TEST_CASE("Layer: high fan-out Multiply builds a full, in-range LUT (no overflow
     CHECK(total == 16384);   // full physical coverage, not a collapsed/empty LUT
     CHECK(inRange);
 }
+
+// Region carving: a RegionModifier shrinks the Layer's LOGICAL box to the region
+// (so the effect renders only there), and the LUT maps each region cell to its
+// box cell at the start offset — every destination in range, none outside the
+// region. The driver buffer still holds all physical lights; cells outside the
+// region simply get no logical source (dark). Default 0/100 = full box (the
+// no-carve fast path) is covered by unit_RegionModifier; here we carve a quarter.
+TEST_CASE("Layer: RegionModifier carves the logical box to a sub-region") {
+    mm::GridLayout grid;
+    grid.width = 8; grid.height = 8; grid.depth = 1;   // dense 8×8×1 → 64 lights
+    mm::Layouts layouts;
+    layouts.addChild(&grid);
+    mm::Layer carved;
+    carved.setLayouts(&layouts);
+    carved.setChannelsPerLight(3);
+    mm::RegionModifier quarter;
+    quarter.startX = 0; quarter.endX = 50;    // x: left half → pixels 0..3
+    quarter.startY = 0; quarter.endY = 50;    // y: top half  → pixels 0..3
+    carved.addChild(&quarter);
+    carved.onBuildControls();
+    carved.onBuildState();
+
+    // The logical box shrinks to the 4×4 quarter instead of the 8×8 physical box.
+    CHECK(carved.width() == 4);
+    CHECK(carved.height() == 4);
+    CHECK(carved.lut().hasLUT());
+    CHECK(carved.lut().logicalCount() == 4 * 4);
+
+    // Carving limits where the effect sources into; the physical side still
+    // reports every one of the 64 lights.
+    CHECK(carved.physicalLightCount() == 64);
+
+    // Walk every logical cell's destinations and tally three properties: how many
+    // there are in total (16 = one per cell, no fan-out), whether each lies inside
+    // the quarter (x<4, y<4 on the 8-wide box), and whether any physical light is
+    // hit twice (a 1:1 carve must reach 16 DISTINCT lights).
+    bool hit[64] = {false};      // one flag per light of the 8×8 box
+    bool repeated = false;
+    bool allInside = true;
+    std::size_t destinations = 0;
+    for (mm::nrOfLightsType cell = 0; cell < carved.lut().logicalCount(); cell++) {
+        carved.lut().forEachDestination(cell, [&](mm::nrOfLightsType phys) {
+            destinations++;
+            const mm::nrOfLightsType col = phys % 8, row = phys / 8;  // 8-wide box
+            if (col >= 4 || row >= 4) allInside = false;
+            if (phys < 64) { if (hit[phys]) repeated = true; hit[phys] = true; }
+        });
+    }
+    CHECK(destinations == 16);   // 4×4 region, 1:1, nothing outside
+    CHECK(allInside);
+    CHECK_FALSE(repeated);       // no two logical cells share a destination
+}
diff --git a/test/unit/light/unit_Layers_container.cpp b/test/unit/light/unit_Layers_container.cpp
index 92bd360..c7339ca 100644
--- a/test/unit/light/unit_Layers_container.cpp
+++ b/test/unit/light/unit_Layers_container.cpp
@@ -6,6 +6,8 @@
 #include "light/layouts/GridLayout.h"
 #include "light/effects/RainbowEffect.h"
 #include "light/effects/CheckerboardEffect.h"
+#include "light/modifiers/MultiplyModifier.h"
+#include "light/drivers/Drivers.h"
 #include "platform/platform.h"
 
 #include <cstring>
@@ -110,9 +112,10 @@ TEST_CASE("Layers with two Layers: each child Layer's loop runs and writes its b
     layersContainer.onBuildState();
     layersContainer.loop();
 
-    // Both child Layer buffers must be populated — composition isn't wired
-    // yet so we just verify each Layer's loop ran. (Checkerboard with default
-    // controls writes a checker pattern; Rainbow writes a hue gradient.)
+    // Both child Layer buffers must be populated — each Layer renders its own
+    // buffer here; the Drivers composite of those buffers is pinned by the
+    // "Drivers composites two enabled Layers" case below. (Checkerboard with
+    // default controls writes a checker pattern; Rainbow writes a hue gradient.)
     auto& bufA = layerA.buffer();
     auto& bufB = layerB.buffer();
     REQUIRE(bufA.bytes() == static_cast<size_t>(8 * 8 * 3));
@@ -125,6 +128,213 @@ TEST_CASE("Layers with two Layers: each child Layer's loop runs and writes its b
     CHECK_MESSAGE(bHasNonZero, "Layer B (Checkerboard) wrote no pixels");
 }
 
+// A minimal driver that just records the source buffer it's handed each tick,
+// so a test can inspect the composited output without a real network/LED sink.
+class CaptureDriver : public mm::DriverBase {
+public:
+    mm::Buffer* src_ = nullptr;   // most recent buffer handed in; nullptr until the first call
+    void setSourceBuffer(mm::Buffer* buf) override { this->src_ = buf; }  // records the pointer only
+};
+
+// Multi-layer composition: Drivers blends ≥2 enabled Layers into its own output
+// buffer and hands THAT to drivers (not a single Layer's buffer). Bottom layer
+// overwrites; top layer blends per its blendMode/opacity. This is the end-to-end
+// pin for the composite loop in Drivers::loop.
+TEST_CASE("Drivers composites two enabled Layers into one output buffer") {
+    mm::Layouts layouts;
+    mm::GridLayout strip;
+    strip.width = 4; strip.height = 1; strip.depth = 1;   // dense 4×1×1 strip → no LUT
+    layouts.addChild(&strip);
+
+    mm::Layers stack;
+    // Lower layer renders the checkerboard base.
+    mm::Layer bottom; bottom.setChannelsPerLight(3);
+    mm::CheckerboardEffect checker; bottom.addChild(&checker);
+    // Upper layer renders a rainbow and is blended additively at full opacity.
+    mm::Layer top; top.setChannelsPerLight(3);
+    mm::RainbowEffect rainbow; top.addChild(&rainbow);
+    top.blendMode = 1;   // 1 = additive
+    top.opacity = 255;
+
+    stack.addChild(&bottom);
+    stack.addChild(&top);
+    stack.setLayouts(&layouts);
+
+    mm::Drivers drivers;
+    CaptureDriver sink;
+    drivers.addChild(&sink);
+    drivers.setLayers(&stack);
+
+    stack.onBuildState();
+    drivers.onBuildState();      // composite output buffer gets sized + allocated here
+    stack.loop();                // each layer fills its own buffer
+    drivers.loop();              // layers are blended and the result handed to sink
+
+    REQUIRE(stack.enabledLayerCount() == 2);
+    // What the sink received must be a 4-light × 3-channel buffer.
+    REQUIRE(sink.src_ != nullptr);
+    REQUIRE(sink.src_->bytes() == static_cast<size_t>(4 * 3));
+
+    // Byte by byte the composite has to equal min(255, bottom + top), i.e. the
+    // clamped additive blend of the two layer buffers.
+    auto& composite = *sink.src_;
+    auto& lower = bottom.buffer();
+    auto& upper = top.buffer();
+    REQUIRE(lower.bytes() == composite.bytes());
+    REQUIRE(upper.bytes() == composite.bytes());
+    bool bothLit = false;
+    for (size_t i = 0; i < composite.bytes(); i++) {
+        const unsigned sum = static_cast<unsigned>(lower.data()[i]) + upper.data()[i];
+        const uint8_t want = static_cast<uint8_t>(sum > 255u ? 255u : sum);
+        CHECK(composite.data()[i] == want);
+        if (lower.data()[i] && upper.data()[i]) bothLit = true;
+    }
+    CHECK_MESSAGE(bothLit, "expected at least one light where both layers contribute (proves real compositing)");
+}
+
+// Disabling the top layer drops cleanly to the single (bottom) layer — no crash,
+// the driver now sees the bottom layer's content. Pins the robustness path.
+TEST_CASE("Drivers composition drops to single layer when one is disabled") {
+    mm::Layouts layouts;
+    mm::GridLayout strip;
+    strip.width = 4; strip.height = 1; strip.depth = 1;   // 4 lights
+    layouts.addChild(&strip);
+
+    mm::Layers stack;
+    mm::Layer bottom; bottom.setChannelsPerLight(3);
+    mm::CheckerboardEffect checker; bottom.addChild(&checker);
+    mm::Layer top; top.setChannelsPerLight(3);
+    mm::RainbowEffect rainbow; top.addChild(&rainbow);
+    stack.addChild(&bottom);
+    stack.addChild(&top);
+    stack.setLayouts(&layouts);
+
+    mm::Drivers drivers;
+    CaptureDriver sink;
+    drivers.addChild(&sink);
+    drivers.setLayers(&stack);
+
+    top.setEnabled(false);             // disabled BEFORE the build, leaving bottom as the sole enabled layer
+    stack.onBuildState();
+    drivers.onBuildState();
+    stack.loop();
+    drivers.loop();
+
+    CHECK(stack.enabledLayerCount() == 1);
+    REQUIRE(sink.src_ != nullptr);     // the sink was still given a buffer
+    REQUIRE(sink.src_->bytes() == static_cast<size_t>(4 * 3));   // sized for 4 lights × 3 channels
+}
+
+// Drivers' composition/output-buffer allocation contract (architecture.md §
+// Adaptive allocation). The driver output buffer exists ONLY when the pipeline
+// must blend into physical space; otherwise the lone layer's buffer is handed to
+// drivers directly (zero-copy). dynamicBytes() reflects outputBuffer_.bytes(), so
+// it's 0 ⇔ no buffer. Pins the three allocation cases, plus the disabled→idle case 4:
+//   1. one identity (no-LUT) layer  → NO output buffer (zero-copy)
+//   2. two enabled layers           → output buffer (must composite)
+//   3. one layer WITH a LUT         → output buffer (must map logical→physical)
+TEST_CASE("Drivers allocates the output buffer only when compositing or mapping is needed") {
+    // --- Case 1: a single identity (dense-grid, no-LUT) layer → no output buffer ---
+    {
+        mm::Layouts layouts; mm::GridLayout grid;
+        grid.width = 8; grid.height = 8; grid.depth = 1;
+        layouts.addChild(&grid);
+        mm::Layers layers;
+        mm::Layer only; only.setChannelsPerLight(3);
+        mm::CheckerboardEffect eff; only.addChild(&eff);
+        layers.addChild(&only);
+        layers.setLayouts(&layouts);
+        mm::Drivers drivers; CaptureDriver cap; drivers.addChild(&cap);
+        drivers.setLayers(&layers);
+        layers.onBuildState(); drivers.onBuildState();   // build only, no loop(): the checks below expect cap.src_ to be wired already
+
+        CHECK_FALSE(only.lut().hasLUT());            // dense grid → identity, no LUT
+        CHECK(layers.enabledLayerCount() == 1);
+        CHECK(drivers.dynamicBytes() == 0);          // NO output buffer allocated
+        REQUIRE(cap.src_ != nullptr);                // driver reads the layer buffer directly
+        CHECK(cap.src_ == &only.buffer());           // zero-copy: it's the layer's own buffer
+    }
+
+    // --- Case 2: two enabled layers → output buffer (must composite) ---
+    {
+        mm::Layouts layouts; mm::GridLayout grid;
+        grid.width = 8; grid.height = 8; grid.depth = 1;
+        layouts.addChild(&grid);
+        mm::Layers layers;
+        mm::Layer a; a.setChannelsPerLight(3); mm::CheckerboardEffect ea; a.addChild(&ea);
+        mm::Layer b; b.setChannelsPerLight(3); mm::RainbowEffect eb; b.addChild(&eb);
+        layers.addChild(&a); layers.addChild(&b);
+        layers.setLayouts(&layouts);
+        mm::Drivers drivers; CaptureDriver cap; drivers.addChild(&cap);
+        drivers.setLayers(&layers);
+        layers.onBuildState(); drivers.onBuildState();
+
+        CHECK(layers.enabledLayerCount() == 2);
+        CHECK(drivers.dynamicBytes() == static_cast<size_t>(8 * 8 * 3));  // output buffer allocated: 64 lights × 3 channels
+        REQUIRE(cap.src_ != nullptr);
+        CHECK(cap.src_ != &a.buffer());              // driver reads the composite, not a raw layer
+    }
+
+    // --- Case 3: a single layer WITH a LUT (a mirror modifier) → output buffer ---
+    {
+        mm::Layouts layouts; mm::GridLayout grid;
+        grid.width = 8; grid.height = 8; grid.depth = 1;
+        layouts.addChild(&grid);
+        mm::Layers layers;
+        mm::Layer only; only.setChannelsPerLight(3);
+        mm::CheckerboardEffect eff; only.addChild(&eff);
+        mm::MultiplyModifier mirror; mirror.mirrorX = true; only.addChild(&mirror);
+        layers.addChild(&only);
+        layers.setLayouts(&layouts);
+        mm::Drivers drivers; CaptureDriver cap; drivers.addChild(&cap);
+        drivers.setLayers(&layers);
+        layers.onBuildState(); drivers.onBuildState();
+
+        CHECK(only.lut().hasLUT());                  // mirror modifier → a real LUT
+        CHECK(layers.enabledLayerCount() == 1);
+        CHECK(drivers.dynamicBytes() > 0);           // output buffer allocated (map target)
+        REQUIRE(cap.src_ != nullptr);
+        CHECK(cap.src_ != &only.buffer());           // driver reads the mapped output, not the logical buffer
+    }
+
+    // --- Case 4: a live layer is DISABLED → drivers transition to idle, no stale buffer ---
+    // The real-world sequence: a frame is published with the layer enabled, then the
+    // user disables it and the pipeline rebuilds. activeLayer() still surfaces the
+    // (now disabled) layer so geometry stays queryable, but output selection must use
+    // the *enabled* source — with none, the driver's source buffer goes null so it
+    // emits nothing instead of re-sending the last frame off the disabled layer.
+    {
+        mm::Layouts layouts; mm::GridLayout grid;
+        grid.width = 8; grid.height = 8; grid.depth = 1;
+        layouts.addChild(&grid);
+        mm::Layers layers;
+        mm::Layer only; only.setChannelsPerLight(3);
+        mm::CheckerboardEffect eff; only.addChild(&eff);
+        // A LUT modifier so the pre-fix bug would route through the output path —
+        // proves the disabled gate, not just the no-LUT zero-copy branch.
+        mm::MultiplyModifier mirror; mirror.mirrorX = true; only.addChild(&mirror);
+        layers.addChild(&only);
+        layers.setLayouts(&layouts);
+        mm::Drivers drivers; CaptureDriver cap; drivers.addChild(&cap);
+        drivers.setLayers(&layers);
+
+        // Enabled first: the driver has a valid source buffer (a real frame).
+        layers.onBuildState(); drivers.onBuildState();
+        CHECK(layers.firstEnabledLayer() == &only);
+        CHECK(layers.enabledLayerCount() == 1);
+        REQUIRE(cap.src_ != nullptr);                // a frame is being published
+
+        // Now disable the only layer and rebuild — the driver must drop to idle.
+        only.setEnabled(false);
+        layers.onBuildState(); drivers.onBuildState();   // same objects rebuilt after the toggle
+        CHECK(layers.activeLayer() == &only);        // fallback for geometry
+        CHECK(layers.firstEnabledLayer() == nullptr);// no enabled source
+        CHECK(layers.enabledLayerCount() == 0);
+        CHECK(drivers.dynamicBytes() == 0);          // no output buffer allocated
+        CHECK(cap.src_ == nullptr);                  // driver idle — the prior frame is NOT re-sent
+    }
+}
+
 // activeLayer() returns the first enabled child, or the only child if all are disabled (so dimensions stay queryable during boot/toggle-off).
 TEST_CASE("Layers::activeLayer returns first enabled child, or nullptr when empty") {
     mm::Layers empty;
@@ -150,6 +360,27 @@ TEST_CASE("Layers::activeLayer returns first enabled child, or nullptr when empt
     CHECK(twoChildren.activeLayer() == &second);
 }
 
+// firstEnabledLayer() is the output-selection counterpart to activeLayer(): it never
+// falls back to a disabled layer, so it returns nullptr exactly when nothing renders.
+TEST_CASE("Layers::firstEnabledLayer returns first enabled child, nullptr when all disabled") {
+    mm::Layers childless;
+    CHECK(childless.firstEnabledLayer() == nullptr);
+
+    mm::Layers duo;
+    mm::Layer front, back;
+    duo.addChild(&front);
+    duo.addChild(&back);
+    CHECK(duo.firstEnabledLayer() == &front);       // both on → the earlier child wins
+
+    front.setEnabled(false);
+    CHECK(duo.firstEnabledLayer() == &back);        // disabled front is skipped
+    CHECK(duo.activeLayer() == &back);              // same answer from activeLayer() here
+
+    back.setEnabled(false);
+    CHECK(duo.firstEnabledLayer() == nullptr);      // nothing enabled → nullptr
+    CHECK(duo.activeLayer() == &front);             // activeLayer() still falls back to a child
+}
+
 // If the container holds only non-Layer children, activeLayer() returns nullptr (the role-guard skips, never miscasts).
 TEST_CASE("Layers::activeLayer returns nullptr when no child has role Layer") {
     // The role-guard in activeLayer (and setLayouts) skips non-Layer children
diff --git a/test/unit/light/unit_RegionModifier.cpp b/test/unit/light/unit_RegionModifier.cpp
new file mode 100644
index 0000000..97bd5df
--- /dev/null
+++ b/test/unit/light/unit_RegionModifier.cpp
@@ -0,0 +1,132 @@
+// @module RegionModifier
+
+#include "doctest.h"
+#include "light/modifiers/RegionModifier.h"
+
+// RegionModifier carves the layer to a sub-rectangle of the physical box, given
+// as percentages. logicalDimensions reports the region size; mapToPhysical
+// translates a region-local cell to its box cell at the region's start offset.
+// Half-open [start, end): abutting regions tile exactly. Defaults 0/100 = full box.
+
+// First destination of one region-local cell; `count` receives how many were produced.
+static mm::nrOfLightsType mapOne(mm::RegionModifier& r, mm::lengthType x, mm::lengthType y,
+                                 mm::lengthType z, mm::lengthType w, mm::lengthType h,
+                                 mm::lengthType d, mm::nrOfLightsType& count) {
+    mm::nrOfLightsType phys[8] = {};   // zero-initialised; capacity 8 is passed to mapToPhysical below
+    count = 0;
+    r.mapToPhysical(x, y, z, w, h, d, phys, count, 8);
+    return count ? phys[0] : static_cast<mm::nrOfLightsType>(-1);  // nothing mapped → sentinel, so an `== 0` check can't pass vacuously
+}
+
+// Default region (0/100 on every axis) is the full box: identity dimensions.
+TEST_CASE("RegionModifier default region is the full box") {
+    mm::RegionModifier r;
+    mm::lengthType logW, logH, logD;
+    r.logicalDimensions(128, 64, 4, logW, logH, logD);
+    CHECK(logW == 128);
+    CHECK(logH == 64);
+    CHECK(logD == 4);
+    // (0,0,0) → box index 0; the last cell → the last box index (W*H*D - 1 under any axis order).
+    mm::nrOfLightsType count = 0;
+    CHECK(mapOne(r, 0, 0, 0, 128, 64, 4, count) == 0);
+    CHECK(count == 1);
+    CHECK(mapOne(r, 127, 63, 3, 128, 64, 4, count) == 128 * 64 * 4 - 1); CHECK(count == 1);
+}
+
+// Half of an axis, half-open: end=50 on 128 → pixels 0..63 (width 64), not 65.
+TEST_CASE("RegionModifier half region is exact (half-open end)") {
+    mm::RegionModifier leftHalf;
+    leftHalf.endX = 50;  // X spans 0..50% of the 128-wide axis; other fields untouched
+    mm::lengthType outW, outH, outD;
+    leftHalf.logicalDimensions(128, 64, 1, outW, outH, outD);
+    CHECK(outW == 64);   // exclusive end: exactly 64, never 65
+    CHECK(outH == 64);   // Y was not carved → full 64
+    CHECK(outD == 1);
+}
+
+// Two abutting regions tile a 128-wide axis with no overlap and no gap:
+// 0..50 → [0,64), 50..100 → [64,128). The seam pixel 64 belongs to exactly one.
+TEST_CASE("RegionModifier abutting regions tile exactly") {
+    mm::RegionModifier first;  first.startX = 0;  first.endX = 50;
+    mm::RegionModifier second; second.startX = 50; second.endX = 100;
+    mm::lengthType firstW, secondW, unusedH, unusedD;
+    first.logicalDimensions(128, 1, 1, firstW, unusedH, unusedD);
+    second.logicalDimensions(128, 1, 1, secondW, unusedH, unusedD);
+    CHECK(firstW == 64);
+    CHECK(secondW == 64);
+    CHECK(firstW + secondW == 128);   // widths sum to the axis: neither overlap nor gap
+
+    // Local x=0 of the second region lands on box pixel 64 — right where the first stops.
+    mm::nrOfLightsType produced;
+    CHECK(mapOne(second, 0, 0, 0, 128, 1, 1, produced) == 64);
+    CHECK(produced == 1);
+}
+
+// Region-local coordinates are translated by the start-pixel offset on each axis.
+TEST_CASE("RegionModifier maps region-local cells to the offset box cell") {
+    mm::RegionModifier corner;
+    corner.startX = 50; corner.endX = 100;   // X: box pixels 64..127 of 128
+    corner.startY = 0;  corner.endY = 50;    // Y: box pixels 0..63 of 128
+    mm::nrOfLightsType produced;
+
+    // Region origin (0,0) is box (64,0); index 0*128 + 64 = 64.
+    CHECK(mapOne(corner, 0, 0, 0, 128, 128, 1, produced) == 64);
+    CHECK(produced == 1);
+
+    // Region (1,2) is box (65,2); index 2*128 + 65 = 321.
+    CHECK(mapOne(corner, 1, 2, 0, 128, 128, 1, produced) == 321);
+    CHECK(produced == 1);
+}
+
+// Rounding rule on a small panel: start floors, end ceils to an exclusive pixel.
+// start 33 / end 66 on a 4-wide axis → floor(1.32)=1 .. ceil(2.64)=3 → pixels 1,2.
+TEST_CASE("RegionModifier rounding on a small panel (floor start, ceil end)") {
+    mm::RegionModifier middle;
+    middle.startX = 33; middle.endX = 66;
+    mm::lengthType outW, outH, outD;
+    middle.logicalDimensions(4, 1, 1, outW, outH, outD);
+    CHECK(outW == 2);   // box pixels 1 and 2
+
+    mm::nrOfLightsType produced;
+    CHECK(mapOne(middle, 0, 0, 0, 4, 1, 1, produced) == 1);   // region x=0 is box pixel 1
+    CHECK(mapOne(middle, 1, 0, 0, 4, 1, 1, produced) == 2);   // region x=1 is box pixel 2
+}
+
+// A region narrower than one pixel still gets a 1-pixel floor (never empties the
+// layer). start 40 / end 41 on a 2-wide axis spans only 0.80..0.82 px; width stays ≥ 1.
+TEST_CASE("RegionModifier never produces a zero-width region") {
+    mm::RegionModifier sliver;
+    sliver.startX = 40; sliver.endX = 41;   // a 1% slice of a 2-pixel axis
+    mm::lengthType outW, outH, outD;
+    sliver.logicalDimensions(2, 1, 1, outW, outH, outD);
+    CHECK(outW >= 1);                       // the reported width must not be 0
+}
+
+// Negative / >100 percentages are legal on the wire; the carve math clamps them
+// into the box rather than reading off the ends.
+TEST_CASE("RegionModifier clamps out-of-range percentages to the box") {
+    mm::RegionModifier r;
+    r.startX = -50; r.endX = 200;   // both out of [0,100]
+    mm::lengthType logW, logH, logD;
+    r.logicalDimensions(64, 1, 1, logW, logH, logD);
+    CHECK(logW == 64);   // clamps to the full axis, not past it
+    mm::nrOfLightsType count = 0;
+    CHECK(mapOne(r, 0, 0, 0, 64, 1, 1, count) == 0);   // start clamps to pixel 0
+    CHECK(count == 1);   // a real destination was produced, so the 0 above is a genuine index
+}
+
+// Degenerate axes don't crash: a 1-wide axis stays 1, a 0-extent axis yields 0.
+TEST_CASE("RegionModifier handles degenerate axes") {
+    mm::RegionModifier fullBox;             // default percentages
+    mm::lengthType outW, outH, outD;
+    fullBox.logicalDimensions(1, 0, 4, outW, outH, outD);
+    CHECK(outW == 1);                       // 1-wide axis stays 1
+    CHECK(outH == 0);                       // 0-extent axis reports 0
+    CHECK(outD == 4);
+}
+
+// Never fans out — at most one destination, same family as CheckerboardModifier.
+TEST_CASE("RegionModifier maxMultiplier is 1") {
+    mm::RegionModifier region;
+    CHECK(region.maxMultiplier() == 1);   // one logical cell never yields more than one destination
+}