diff --git a/.github/workflows/ci.yaml b/.github/workflows/ci.yaml
index 19a4010..25f2411 100644
--- a/.github/workflows/ci.yaml
+++ b/.github/workflows/ci.yaml
@@ -1,7 +1,7 @@
 name: ci
 # Same shape as Yolean/envoyimage's echo.yaml: separate verify and
 # publish phases, image push gated on the full e2e suite passing
-# first. (No upstream-image cron job — there's nothing for this repo
+# first. (No upstream-image cron job; there's nothing for this repo
 # to mirror in the registry sense.)
 #
 # Third-party actions are pinned to a 40-char commit SHA with the
@@ -102,7 +102,15 @@ jobs:
       uses: docker/build-push-action@bcafcacb16a39f128d818304e6c9c0c18556b85f  # v7.1.0
       with:
         context: .
-        platforms: linux/amd64,linux/arm64
+        # PR/QA runs build linux/amd64 only; the arm64 leg runs under
+        # QEMU on amd64 runners and dominates wall time (Rust +
+        # librdkafka cross-compile). Push events build both arches
+        # because releases ship multi-arch. See issue #2.
+        # GHA's per-branch cache scope means PR caches don't warm main
+        # anyway, so dropping arm64 from PR runs is the simplest
+        # effective fix; switching to a registry-backed cache would
+        # share across branches but needs PR write access to ghcr.
+        platforms: ${{ github.event_name == 'pull_request' && 'linux/amd64' || 'linux/amd64,linux/arm64' }}
         push: ${{ github.event_name != 'pull_request' }}
         tags: ${{ steps.meta.outputs.tags }}
         labels: ${{ steps.meta.outputs.labels }}
diff --git a/Cargo.lock b/Cargo.lock
index 52e7104..f284056 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1741,6 +1741,7 @@ name = "mirror-bin"
 version = "0.1.0"
 dependencies = [
  "anyhow",
+ "async-trait",
  "clap",
  "metrics",
  "metrics-exporter-prometheus",
@@ -1750,6 +1751,7 @@ dependencies = [
  "mirror-envelope",
  "mirror-fs",
  "mirror-kafka",
+ "mirror-notify-kkv",
  "mirror-s3",
  "object_store",
  "serde",
@@ -1789,6 +1791,7 @@ dependencies = [
  "serde_json",
  "serde_yaml",
  "thiserror",
+ "url",
 ]
 
 [[package]]
@@ -1812,13 +1815,16 @@ version = "0.1.0"
 dependencies = [
  "anyhow",
  "async-trait",
+ "axum",
  "bytes",
  "futures",
  "mirror-cache",
+ "mirror-config",
  "mirror-core",
  "mirror-envelope",
  "mirror-fs",
  "mirror-kafka",
+ "mirror-notify-kkv",
  "mirror-s3",
  "object_store",
  "portpicker",
@@ -1830,6 +1836,7 @@ dependencies = [
  "tokio",
  "tracing",
  "tracing-subscriber",
+ "uuid",
 ]
 
 [[package]]
@@ -1875,6 +1882,27 @@ dependencies = [
  "tracing",
 ]
 
+[[package]]
+name = "mirror-notify-kkv"
+version = "0.1.0"
+dependencies = [
+ "async-trait",
+ "axum",
+ "futures",
+ "indexmap 2.14.0",
+ "metrics",
+ "mirror-config",
+ "mirror-core",
+ "reqwest",
+ "serde",
+ "serde_json",
+ "thiserror",
+ "tokio",
+ "tower",
+ "tracing",
+ "url",
+]
+
 [[package]]
 name = "mirror-s3"
 version = "0.1.0"
diff --git a/Cargo.toml b/Cargo.toml
index 2181166..5eb443b 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -8,6 +8,7 @@ members = [
     "crates/mirror-kafka",
     "crates/mirror-fs",
     "crates/mirror-s3",
+    "crates/mirror-notify-kkv",
     "crates/mirror-bin",
     "crates/xtask",
     "e2e",
@@ -28,6 +29,7 @@ mirror-envelope = { path = "crates/mirror-envelope" }
 mirror-kafka = { path = "crates/mirror-kafka" }
 mirror-fs = { path = "crates/mirror-fs" }
 mirror-s3 = { path = "crates/mirror-s3" }
+mirror-notify-kkv = { path = "crates/mirror-notify-kkv" }
 
 serde = { version = "1", features = ["derive"] }
 serde_json = "1"
@@ -60,6 +62,7 @@ utoipa = { version = "5", features = ["axum_extras"] }
 utoipa-axum = "0.2"
 utoipa-scalar = { version = "0.3", features = ["axum"] }
 reqwest = { version = "0.12", default-features = false, features = ["rustls-tls"] }
+url = "2"
 indexmap = "2"
 
 [profile.release]
diff --git a/KAFKA_KEYVALUE_DROPIN_REPLACEMENT.md b/KAFKA_KEYVALUE_DROPIN_REPLACEMENT.md
index f3d7a01..c4c76b7 100644
--- a/KAFKA_KEYVALUE_DROPIN_REPLACEMENT.md
+++ b/KAFKA_KEYVALUE_DROPIN_REPLACEMENT.md
@@ -188,9 +188,9 @@ parity with KKV.
 | ------------------------------------------- | ------------------------------------- |
 | onupdate webhook dispatcher                 | mirror-v3 does not implement (deferred to a future PR). If a current dependent uses Yolean's KKV in sidecar mode and relies on onupdate, mirror-v3 is **not** a drop-in for them yet. |
 | `POST /_admin/v1/shutdown[/{exitcode}]`     | mirror-v3 has it; not compared        |
-| `/q/health` / `/q/health/ready` (Quarkus)   | mirror-v3 does not implement; we expose `/metrics` (Prometheus) on the metrics port instead |
+| `/q/health/ready` (Quarkus)                 | mirror-v3 implements as a drop-in: same path, same `200`/`503` codes, plus a structured `ReadinessReport` JSON body that names any unhealthy mirror by status enum. Existing `@yolean/kafka-keyvalue` Node clients work unchanged. `/q/health` (the wider SmallRye umbrella) is not implemented; we expose `/metrics` (Prometheus) on the metrics port instead |
 | Multi-partition `/cache/v1/offset/{t}/{p}`  | the fixture topic uses 1 partition; the multi-partition case is unit-tested in `mirror-cache`'s handler tests |
-| Readiness 503 timing                        | both serve 503 before catch-up, sticky after; deeper compare would need a controlled-rate producer |
+| Readiness 503 timing                        | KKV: `caught_up` flips false→true once and sticks. mirror-v3: non-sticky — tracks per-mirror lag against the broker high-watermark, source-partition assignment, and per-destination flush progress; falls back to 503 if any of those degrades. Plus a per-destination YAML opt-out (`affects-readiness: false`) for best-effort secondary sinks. |
 
 ## Open
 
diff --git a/README.md b/README.md
index 7e841b5..5ce0a43 100644
--- a/README.md
+++ b/README.md
@@ -65,16 +65,18 @@ A minimal PodMonitor for the checkit chart points at port 9090; the standard pro
 
 ### `/cache/v1` (drop-in for `Yolean/kafka-keyvalue`)
 
-Per-mirror opt-in via `http-access: { api: cache-v1 }`. When at least one mirror has it set, `mirror-v3 run` starts a second HTTP server on `0.0.0.0:8080` (override with `MIRROR_V3_CACHE_PORT`) that exposes the KKV `/cache/v1` surface:
+Per-mirror opt-in via `http-access: { cache-v1: {} }`. When at least one mirror has it set, `mirror-v3 run` starts a second HTTP server on `0.0.0.0:8080` (override with `MIRROR_V3_CACHE_PORT`) that exposes the KKV-shaped surface under each opt-in mirror's name:
 
 ```
-GET /cache/v1/raw/{key}                  → value bytes (application/octet-stream), 404 if absent
-GET /cache/v1/offset/{topic}/{partition} → decimal text
-GET /cache/v1/keys                       → newline-separated keys
-GET /cache/v1/values                     → newline-separated raw values
+GET /cache/v1/{mirror}/raw/{key}                  → value bytes (application/octet-stream), 404 if absent
+GET /cache/v1/{mirror}/offset/{topic}/{partition} → decimal text
+GET /cache/v1/{mirror}/keys                       → newline-separated keys
+GET /cache/v1/{mirror}/values                     → newline-separated raw values
 ```
 
-Reads carry `x-kkv-last-seen-offsets: <JSON>` and return **503** until every opt-in mirror has caught up to the source's high-watermark captured at startup — same readiness contract as KKV, so dependents don't transiently see an older state across reloads. The cache view updates per-record from the consume loop, decoupled from disk flush cadence (set `flush.max-time-ms` high to save bucket ops without sacrificing freshness). Updates are monotonic; if a future feature ever rewinds source consumption, the cache stays at the highest offset seen.
+Each mirror owns its own `key → latest-value` view; a key only shows up under the mirror that consumed it. Reads carry `x-kkv-last-seen-offsets: <JSON>` and return **503** until that mirror has caught up to its source's high-watermark captured at startup — same readiness contract as KKV, so dependents don't transiently see an older state across reloads. The view updates per-record from the consume loop, decoupled from disk flush cadence (set `flush.max-time-ms` high to save bucket ops without sacrificing freshness). Updates are monotonic; if a future feature ever rewinds source consumption, the cache stays at the highest offset seen.
+
+To keep existing kkv consumers working unmodified during a migration, **one** mirror per process may additionally set `cache-v1-main: {}`. That mounts the unprefixed `/cache/v1/...` paths onto that mirror's view (alias-only — same handlers, no separate data path). The validator rejects more than one `cache-v1-main` in the config. Mirror names that collide with the literal path segments `raw | offset | keys | values` are rejected.
 
 Also exposed on the same port:
 
@@ -153,7 +155,56 @@ docker run --rm -v "$PWD/examples:/cfg" mirror-v3:dev validate --config /cfg/kaf
 
 ## Operational invariants
 
-- **One process owns at most one mirror per `(topic, partition)`.** Run with `replicas: 1` and `strategy.type: Recreate` in Kubernetes for every mirror-v3 deployment. This is non-negotiable — two writers will race on destination naming and trip the corrupt-chain detector on the next restart.
+- **One process owns at most one mirror per `(topic, partition)`.** Run with `replicas: 1` and either `strategy.type: Recreate` or `RollingUpdate` with `maxSurge: 0` and `maxUnavailable: 1` for every mirror-v3 deployment. This is non-negotiable on two counts:
+    1. **Destination races.** Two writers will race on destination naming and trip the corrupt-chain detector on the next restart.
+    2. **Source-side coordination.** mirror-v3 uses `assign()` instead of `subscribe()` for its Kafka consumer, so there is no consumer-group coordinator deciding which pod owns the partition. Two pods up at once would both consume the same partition and race the consumer-offset commit log.
 - **VersityGW specifically:** `If-None-Match: *` is silently ignored (v1.4.1, POSIX backend, verified in e2e), so the deployment guarantee is the *only* atomicity layer for the cross-process race. AWS S3 honors `If-None-Match: *` and gives API-level atomicity on top of the deployment guarantee.
 - **Any unrecoverable error in any mirror exits the entire process.** Restart correctness is the recovery mechanism; supervision belongs to the orchestrator.
 - **For blob destinations, a `(from, to)` filename/key is the durable "offset"** — atomic rename (FS) or single-shot `PutObject` (S3) makes it visible. The destination listing is the source of truth on startup.
+
+## Readiness
+
+`GET /q/health/ready` returns a structured JSON body in every state:
+
+```json
+{
+  "ready": "ready" | "warming" | "degraded",
+  "mirrors": [
+    {
+      "name": "userstate",
+      "status": "ready" | "warming" | "lag_behind_source"
+              | "source_unassigned" | "destination_lagging",
+      "source": {
+        "topic": "userstate", "partition": 0, "assigned": true,
+        "end_offset": 12345, "last_applied_offset": 12345, "lag": 0
+      },
+      "destination": { "name": "userstate-gcs", "lag": 5 }
+    }
+  ],
+  "unhealthy": ["userstate"]
+}
+```
+
+HTTP status is `200` iff every mirror is `ready`; `503` otherwise. The drop-in `@yolean/kafka-keyvalue` Node client only inspects the status code, so the body is transparent to legacy consumers but greppable for on-call.
+
+Per-mirror `/cache/v1/{mirror}/...` routes return the matching `mirrors[i]` element as the `503` body, so a polling consumer sees a meaningful retry signal instead of opaque `503`.
+
+Tuning:
+
+- `MIRROR_V3_READINESS_LAG` (default `0`) — offsets of lag tolerated before `LagBehindSource` fires.
+- `MIRROR_V3_READINESS_POLL_MS` (default `2000`) — how often each mirror's broker high-watermark + consumer assignment is re-checked. `0` disables the poller.
+- `MIRROR_V3_OFFSET_COMMIT_INTERVAL_MS` (default `5000`) — how often the supervisor commits the consumer's progress back to the broker. `0` disables (the mirror still works but loses the between-pods notify guarantee on the next restart).
+
+Per-destination opt-out:
+
+```yaml
+destinations:
+  - type: filesystem
+    root: /var/lib/mirror-v3
+    # affects-readiness: true   # default
+  - type: kafka
+    bootstrap-servers: ghost-cluster:9092
+    affects-readiness: false   # best-effort secondary
+```
+
+A destination with `affects-readiness: false` still records its `flushed_through` for observability but is skipped when computing `DestinationLagging`. Use it for observability replicas or archival sinks that must not flip consumer-pod readiness when they fall behind.
diff --git a/TESTING.md b/TESTING.md
new file mode 100644
index 0000000..3c6aa7e
--- /dev/null
+++ b/TESTING.md
@@ -0,0 +1,170 @@
+# Testing strategy for mirror-v3
+
+This is the entrypoint for "I need to test a spec change; where does
+my test go?" The answer is almost always one of the seven layers
+below. Pick the cheapest one that can actually exercise the
+invariant.
+
+The palette is sorted from cheapest (in-process, no I/O) to most
+expensive (Docker, multi-broker). Each layer lists what kind of
+spec change belongs there, what's already in it, and the
+testability primitives available.
+
+## TL;DR by spec-change shape
+
+| Spec change touches… | Layer | Cost |
+|---|---|---|
+| Pure data (envelopes, config parsing, validation rules) | **L1** unit | ms |
+| The `run_mirror` loop's invariants (offset gates, source events) | **L2** loop_invariants | ms |
+| A sink's internal invariants (buffer/durable split, filename, align) | **L3** sink matrix | ms |
+| The loop + sink combination (mock-vs-real divergence guard) | **L4** loop_invariants_with_real_sink | ~tens of ms |
+| HTTP handler / OpenAPI / cache view | **L5** in-process http (tower::oneshot) | ms |
+| Real Kafka semantics (broker contracts, librdkafka) | **L6** Docker e2e | seconds |
+| Things we know we owe but haven't built yet | **L7** known_coverage_gaps.rs | n/a (placeholder) |
+
+## L1; Per-crate unit tests (in-source `#[cfg(test)] mod tests`)
+
+**Where:** `crates/*/src/*.rs` inline `mod tests {…}` blocks.
+
+**Use when:** the spec is about a pure function: parsing YAML, validating a config rule, encoding/decoding an envelope, computing a file path, expanding env interpolation. No async, no I/O, no traits.
+
+**Existing examples:**
+- `mirror-config/src/envsubst.rs`; `${VAR}` / `${VAR:-default}` expansion algorithm.
+- `mirror-config/src/lib.rs` (daily_tests); `at_utc: "HH:MM:SS"` parsing.
+- `mirror-core/src/cache.rs`; monotonic CacheState, insertion-order keys, tombstone semantics.
+- `mirror-core/src/tee.rs` (tests module); TeeSink's per-sink head logic against in-process mock inner sinks.
+
+**Testability primitives available:** all of `std`, `serde_json::Value` for AST-style assertions, no special harness needed.
+
+## L2; Loop invariants against `MockSink` (`mirror-core/tests/loop_invariants.rs`)
+
+**Where:** `crates/mirror-core/tests/loop_invariants.rs`.
+
+**Use when:** the spec is about `run_mirror`'s decision-making; when it errors, what error variant, how it advances `expected`, what it does on idle. The invariant under test should hold *regardless* of which concrete sink is plugged in, so a mock sink is appropriate.
+
+**Existing examples:**
+- `errors_on_source_offset_gap_in_append_mode`; append mode rejects forward gaps.
+- `errors_on_source_going_backwards`; backwards is always fatal.
+- `compaction_log_accepts_repeated_gaps_mid_stream`; the production-bug repro.
+- `errors_on_destination_drift_during_idle`; idle re-check catches out-of-band writes.
+
+**Testability primitives available:**
+- `mirror_core::mock::MockSource`; script `Record`, `Idle`, `Error`, `Hang` events.
+- `MockSource::with_low_watermark(u64)`; broker low watermark for the bootstrap branch.
+- `MockSource::with_high_watermark(u64)`; broker high watermark, for spec changes that introduce a "sink can't exceed source HWM" gate.
+- `mirror_core::mock::MockSink`; scripted `next_expected_offset`, write-error injection, recorded writes.
+- `MockSink::with_allows_compacted_source(bool)`; gate for compaction-log behaviour.
+- `mirror_core::testing::BlanketMockSink`; closure-per-method Sink for TDD-style spec tests where the existing `MockSink` builder doesn't express what you need. Each method is an `FnMut`, so the closure can capture mutable test state (counters, scripted sequences). All trait-method invocations are recorded in `BlanketMockSink::calls()` for post-hoc assertions. See the `tests` module in `crates/mirror-core/src/testing.rs` for usage shapes.
+- Metric assertions: not yet; emit-side assertion is in [`L7` known_coverage_gaps](#l7--documented-coverage-gaps-e2etestsknown_coverage_gapsrs) until a spec change actually needs it. The typical workaround today is to assert on the visible side-effect (logged message, written record) instead of the metric itself.
+
+**When to escalate to L4:** if the spec touches the sink's *internal* state machine (buffer/durable split, view, filename). MockSink doesn't model those. Promote to L3 if the spec is *about* the sink, or L4 if it's about the loop+sink combination.
+
+## L3; Sink matrix (`mirror-{fs,s3}/tests/sink_matrix.rs`)
+
+**Where:** `crates/mirror-fs/tests/sink_matrix.rs` and `crates/mirror-s3/tests/sink_matrix.rs`.
+
+**Use when:** the spec is about a sink's per-record state machine; what `write` accepts under which mode and buffer state, what `next_expected_offset` returns, what `align_to_source_low_watermark` requires, what filename `flush` produces. The cells are `(compaction-mode × buffer-state × action)`.
+
+**Existing structure:** a `MATRIX: Vec<Case>` with named cells (e.g. `log/non_empty/write_above_expected/ok_midstream_gap`). Each cell:
+- `preload: &[u64]`; records to write before the action.
+- `buffer_state: Empty | NonEmpty`; flush after preload or not.
+- `action: Write | Flush | Align | NextExpected`.
+- `expected: Ok | NextExpectedIs(u64) | UnexpectedPosition{...} | TransportContains("...")`.
+
+**To add a spec test:** append one `Case` to `matrix_cases()`. Pick the cell coordinates (mode, state, action), name it `<mode>/<state>/<action>/<outcome>`. Mirror it row-for-row in the S3 file unless the contract genuinely diverges between backends.
+
+**Testability primitives available:**
+- `tempfile::TempDir` for FS isolation; `object_store::memory::InMemory` for S3 isolation.
+- The `Outcome` enum is exhaustive across the trait surface; extend it if a new spec introduces a new observable outcome.
+
+**When to escalate to L4:** the spec is about how the *run loop* reacts to the sink's state (e.g. "loop must crash if sink rejects in compaction mode"). The matrix is sink-only; the loop interaction belongs in L4.
+
+## L4; Loop + real sink (`mirror-fs/tests/loop_invariants_with_real_sink.rs`)
+
+**Where:** `crates/mirror-fs/tests/loop_invariants_with_real_sink.rs`.
+
+**Use when:** the spec change spans the loop ↔ sink boundary, and either:
+- a similar mock-only test in L2 wouldn't catch a real-sink invariant mismatch, or
+- the spec is "the loop's behaviour AND the sink's behaviour together produce X observable state on disk."
+
+**Existing examples:**
+- `compaction_log_real_sink_accepts_repeated_midstream_gaps`; the production repro (loop accepts forward gaps + sink buffers them + flush emits a `0-470.parquet` with 2 deduplicated keys).
+- `append_mode_real_sink_rejects_source_gap`; loop's `SourceGapAboveExpected` is observable from the test, no disk write.
+
+**Testability primitives available:**
+- `drive_real_fs(compaction, events, grace_duration)` helper drives `run_mirror` against a real FilesystemSink and a scripted MockSource. The shutdown future is a timer (`tokio::time::sleep(grace)`) so the loop has a window to process events before graceful shutdown.
+- All L2 primitives (MockSource, BlanketMock* via mirror_core::testing).
+
+**When to escalate to L6:** real librdkafka, real broker semantics (compaction policy, transactional offsets, metadata-fetch latency), or anything that requires a network address.
+
+## L5; In-process HTTP (`mirror-cache/tests/handlers.rs`)
+
+**Where:** `crates/mirror-cache/tests/handlers.rs`.
+
+**Use when:** the spec is about the `/cache/v1/*` HTTP surface (routing, status codes, headers, response bodies). Uses `tower::ServiceExt::oneshot` against the `axum::Router`; no socket, no port allocation, no flakes.
+
+**Pattern:**
+```rust
+let app = build_router(state, shutdown_tx);
+let resp = app.oneshot(Request::get("/cache/v1/raw/k0").body(Body::empty())?).await?;
+assert_eq!(resp.status(), StatusCode::OK);
+```
+
+**When to escalate to L6:** the spec involves real network behaviour (TLS, concurrent clients, real backpressure).
+
+## L6; Docker e2e (`e2e/tests/*.rs`)
+
+**Where:** `e2e/tests/*.rs`. Provisioned via `mirror_e2e::docker::DockerProvisioner` (Redpanda + VersityGW + Toxiproxy as needed).
+
+**Use when:** the spec is about a broker contract you can't honestly fake (cleanup policies, low/high watermark behaviour, librdkafka client lifecycle), or about a multi-component scenario (mirror + cache + HTTP server, crash + restart with real durable state on disk, fault injection via Toxiproxy).
+
+**Cost:** seconds per test, sequenced via `--test-threads=1` because tests share Docker resources.
+
+**Existing patterns:**
+- `kafka_helpers::create_topic`, `produce_records`, `drain_partition`; Kafka fixture utilities.
+- `mirror_runner::spawn_kafka_to_filesystem`, `spawn_kafka_to_s3`, `spawn_kafka_to_tee`; start a mirror in-process against the provisioned source/sink.
+- `stack.source_bootstrap()`, `stack.target_kafka_bootstrap()`, `stack.s3_endpoint()`, `stack.target_down()`; environment handles.
+
+**When to escalate to L7:** the spec needs a broker behaviour we don't yet have a harness for (real compaction, multi-broker metadata race, large-scale fixtures).
+
+## L7; Documented coverage gaps (`e2e/tests/known_coverage_gaps.rs`)
+
+**Where:** `e2e/tests/known_coverage_gaps.rs`.
+
+**Use when:** the test infrastructure for a spec doesn't exist yet, but the contract is real and should be visible. Each entry is an `#[ignore = "TODO: ..."]` test with `unimplemented!()` body and a doc-comment naming the contract and the layer it would belong in once implementable.
+
+**Discovery:** `cargo test --list -p mirror-e2e | grep ignored`.
+
+**Pattern:** add a stub with the ignore reason pointing at `REVIEW_TEST_STRATEGY.md §X`. When the harness arrives, drop `#[ignore]` and fill in the body.
+
+## Adding a new layer
+
+If a spec's natural test wouldn't fit anywhere above; for example, a property-based test against the gate semantics, or a CPU-bench fixture; add a new file at the appropriate crate level and document it here. Resist the temptation to overload an existing layer with a new responsibility; the catalogue is most useful when each layer has one clear charter.
+
+## Quick reference: writing a test for a brand-new invariant
+
+Example spec: *"The mirror must crash with a specific error variant if `sink.next_expected_offset()` ever exceeds `source.high_watermark()`. This catches destination chains that have somehow advanced past the broker (out-of-band writes, restored from a too-recent backup)."*
+
+1. **Pick the layer.** The check belongs in `run_mirror`'s startup or idle path, so the test belongs in **L2** (`loop_invariants.rs`).
+2. **Write the test first.** Using the existing palette:
+   ```rust
+   #[test]
+   fn errors_when_sink_is_ahead_of_source_high_watermark() {
+       let source = MockSource::new([MockSourceEvent::Hang])
+           .with_high_watermark(100);
+       let sink = MockSink::starting_at(150); // sink is ahead!
+       let result = drive(run_mirror(source, sink, never()));
+       match result {
+           Err(MirrorError::SinkAheadOfSource { sink_offset, source_hwm }) => {
+               assert_eq!(sink_offset, 150);
+               assert_eq!(source_hwm, 100);
+           }
+           other => panic!("expected SinkAheadOfSource, got {other:?}"),
+       }
+   }
+   ```
+3. **Run it.** It fails to compile (`SinkAheadOfSource` doesn't exist yet); that's the red part of red-green-refactor.
+4. **Add the variant** to `MirrorError`, **add the check** in `run_mirror_with_heartbeat` (`Source::high_watermark` already exists with a u64::MAX default that won't trip existing tests), run again; green.
+5. **No mock infrastructure changes needed.** `with_high_watermark` is already a builder method on `MockSource`. That's the point of the palette.
+
+If the same spec applied to the sink's internal state (e.g. "sink rejects align if its durable position exceeds the requested low_watermark") the test would land in **L3** (`sink_matrix.rs`) instead, by adding a row to `matrix_cases()`. Same flow: write the row, watch it fail, implement the check, watch it pass.
diff --git a/WEBHOOKS.md b/WEBHOOKS.md
new file mode 100644
index 0000000..ed74e29
--- /dev/null
+++ b/WEBHOOKS.md
@@ -0,0 +1,730 @@
+# Proposal: opt-in HTTP notify for mirror-v3
+
+A minimal, configurable outbound webhook surface so mirror-v3 can
+replace `Yolean/kafka-keyvalue` (kkv) end-to-end, not just on the
+read side. The existing `http-access: { cache-v1: {} }` block
+covers the GET surface; this proposal adds the symmetric
+*you-need-to-re-read* push that legacy consumers depend on.
+
+## Background
+
+Legacy kkv was push-based by design. When a source-topic record
+landed, kkv POST'd to each pod backing a `TARGET_SERVICE_NAME`
+headless Kubernetes Service (discovered via the K8s Endpoints API),
+telling the consumer "these keys have changed; re-read them via
+`/cache/v1/raw/<key>`". The downstream client library
+(`@yolean/kafka-keyvalue` for Node) invalidates its in-process cache
+on receipt and re-fetches lazily.
+
+mirror-v3's cache-v1 is pull-only. Consumers' in-process caches
+therefore never refresh after their initial replay. In production
+this manifests as records produced *after* a consumer service
+started up never reaching that service's local view: the source
+topic has the new record, mirror-v3's cache-v1 in-memory map sees
+it, but the consumer's own in-process cache is stuck on the value
+it snapshotted at startup; because nothing tells it to invalidate.
+
+This proposal adds the missing push side as a per-mirror opt-in,
+without resurrecting any of kkv's other behaviour.
+
+## Goals and non-goals
+
+Goals:
+
+- Cover every current kkv deployment shape with one mirror-v3
+  feature (see "Use cases" for the shape catalogue).
+- Match kkv's wire contract exactly so the existing
+  `@yolean/kafka-keyvalue` client (`getOnUpdateRoute()`,
+  `ON_UPDATE_DEFAULT_PATH = "/kafka-keyvalue/v1/updates"`) works
+  unmodified against mirror-v3.
+- Stay K8s-API-free in the binary itself: no `Endpoints` watch, no
+  Kubernetes SDK dependency, no in-cluster RBAC requirement on the
+  mirror's own ServiceAccount.
+- Keep the existing destinations / cache-v1 / compaction:log
+  contracts unchanged. This is additive.
+
+Non-goals (out of scope, deferable):
+
+- Auth on the outbound request (mTLS, bearer, signing). MVP assumes
+  in-cluster targets behind a trusted network boundary; the
+  legacy kkv had the same assumption.
+- Per-key or per-prefix subscription filters. Today all keys go to
+  all targets.
+- Per-target circuit breakers. MVP: any retry-exhausted target
+  failure crashes the mirror task (consistent with mirror-v3's
+  "unrecoverable error exits the process" model).
+- Push-only mode (no cache-v1, just notify). The kkv contract
+  assumes consumers re-fetch via cache-v1 on receipt; require
+  `http-access: { cache-v1: {} }` to coexist for now.
+
+## Use cases this needs to cover
+
+The deployment shape used by every observed kkv instance:
+
+| dimension                | shape                                                        |
+|--------------------------|--------------------------------------------------------------|
+| One mirror per…          | (source topic, partition); same as mirror-v3 already         |
+| Target discovery         | A Kubernetes *headless* Service named after the role          |
+| Target replica count     | 1–N consumer pods behind that Service                         |
+| Target route             | `POST /kafka-keyvalue/v1/updates` on each pod, port 8080      |
+| Consumer client library  | `@yolean/kafka-keyvalue` (Node); mounts the route as-is      |
+
+Consumer-side route mount, identical across every deployment seen:
+
+```js
+const { ON_UPDATE_DEFAULT_PATH, getOnUpdateRoute } = require('@yolean/kafka-keyvalue');
+app.post(ON_UPDATE_DEFAULT_PATH, getOnUpdateRoute());
+```
+
+A single wire format therefore suffices for the entire installed
+fleet. Multi-replica targets are the common case (1–N consumer
+pods behind a headless Service), so notify must fan out across
+the Service's full pod set, not just one pod.
+
+## Proposed config
+
+Per-mirror block, alongside `http-access`:
+
+```yaml
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events-stream
+    partition: 0
+    destinations:
+      - type: s3
+        region: us-east-1
+        bucket: my-bucket
+    format: parquet
+    compression: zstd-1
+    compaction: log
+    http-access:
+      cache-v1: {}
+    notify:
+      api: kkv-v1                              # only variant initially
+      targets:
+        - url: http://events-cache-target:8080
+          fan-out: dns-a                        # resolve to all A records, POST to each
+      trigger:
+        on: source-consume                      # or destination-flush; see "Trigger" below
+        debounce:                               # only meaningful for source-consume
+          max-records: 100
+          max-time-ms: 250
+      timeout-ms: 5000                          # per-request HTTP timeout; independent of retry/outcome
+      retry:                                    # shared by every outcome with `retry: true` below
+        max-attempts: 5
+        backoff-ms: 100                         # exponential, capped
+      outcomes:                                 # six independent cases, same shape, different defaults
+        timeout:       { retry: true,  final: fail   }
+        connrefused:  { retry: true,  final: fail   }
+        2xx:           { retry: false, final: accept }
+        3xx:           { retry: false, final: fail   }
+        4xx:           { retry: false, final: fail   }
+        5xx:           { retry: true,  final: fail   }
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
+```
+
+Field-level notes:
+
+- **`notify.api: kkv-v1`** is explicit so future variants
+  (e.g. `notify.api: nats-v1`, or a kkv-v2 with auth) can be added
+  without re-shaping the block. Same pattern as
+  `http-access.api`.
+- **`notify.targets[].url`** is a full URL. The path component
+  defaults to `/kafka-keyvalue/v1/updates` for `api: kkv-v1` if
+  unset; explicit override is allowed for non-kkv clients.
+- **`notify.targets[].fan-out`** decides how the URL's host is
+  resolved:
+  - `none` (default): standard DNS, single connection. Adequate for
+    a single-replica target.
+  - `dns-a`: resolve the host to all A/AAAA records and POST to
+    every address that comes back. Headless Kubernetes Services
+    naturally return one A record per pod, so this gives the same
+    fan-out kkv used to do via the Endpoints API; without mirror-v3
+    needing K8s API access. Resolutions are cached up to the DNS
+    record TTL.
+- **`notify.trigger`** decides what internal event causes a POST.
+  See the dedicated section below; default is `source-consume` with
+  small debounce, matching kkv's "as records arrive" behaviour.
+- **`notify.timeout-ms`** is the per-request HTTP timeout; strictly
+  about how long to wait for *this* request before declaring it a
+  `timeout` outcome. It does not influence retry decisions or
+  exhaustion behaviour; those live in `notify.outcomes` and
+  `notify.retry`.
+- **`notify.retry`** is one shared backoff/exhaust policy used by
+  any outcome marked `retry: true`. There is intentionally no
+  per-outcome backoff override; heterogeneous retry shapes per
+  status class are scope creep for the MVP and can be added later
+  if the four-outcome surface proves insufficient.
+- **`notify.outcomes`** decides what each of six distinct request
+  outcomes means for the mirror. See "Outcomes and retry policy"
+  below; defaults match what kkv operators tend to expect.
+
+The block is **forbidden** unless the mirror also has
+`http-access.cache-v1` set (validator rejects otherwise). The notify
+body tells consumers "go re-read"; that's only meaningful if there's
+somewhere to re-read from.
+
+## Wire contract (`api: kkv-v1`)
+
+Matches the legacy kkv exactly so the upstream Node client works
+unmodified.
+
+**Request.**
+
+- Method: `POST`
+- Path: `/kafka-keyvalue/v1/updates` (default; override via
+  `notify.targets[].path`)
+- Content-Type: `application/json`
+- Headers:
+  - `x-kkv-topic: <source-topic>`
+  - `x-kkv-offsets: <json-encoded {partition: offset}>`
+- Body:
+  ```json
+  {
+    "v": 1,
+    "topic": "<source-topic>",
+    "offsets": { "<partition>": <highest-offset-in-batch> },
+    "updates": { "<key>": null }
+  }
+  ```
+  - `v` is the protocol-version marker. **Load-bearing**:
+    `@yolean/kafka-keyvalue` v1.8.3's `updateListener` (both CJS
+    and ESM builds) does an early `if (requestBody.v !== 1) throw
+    new Error('Unknown kkv onupdate protocol …')` and a missing
+    field surfaces as `undefined`. The throw lands inside an
+    Express middleware as an unhandled rejection and crashloops
+    the consumer pod. The legacy Quarkus kkv server also sends
+    this field on every POST.
+  - `topic` matches the header for double-check robustness.
+  - `offsets` carries the highest source offset across the batch
+    per partition. Single-partition mirrors send `{"0": <max>}`.
+  - `updates` is keyed by Kafka record key. Values are `null` -
+    consumers re-read via `GET /cache/v1/raw/<key>`. (The legacy
+    kkv allowed a payload hint but the upstream client immediately
+    re-fetches via `requireOffset: highestOffset` anyway, so the
+    hint was never load-bearing.)
+
+**Response.**
+
+- 2xx → success, drop the batch.
+- Anything else → retry per `notify.retry`.
+- After retry exhaustion → mirror task errors out
+  (`MirrorError::NotifyTargetExhausted`); process exits; orchestrator
+  restarts the pod; the dropped batch is re-read at startup because
+  the underlying source offsets weren't committed yet.
+
+Batches are sent in source-offset order per target. The mirror does
+not wait for an ACK on batch *N* before issuing batch *N+1*; missed
+intermediate batches are caught up at the consumer level via the
+existing `x-kkv-last-seen-offsets` semantics on cache-v1 reads.
+
+## Trigger: source-consume vs. destination-flush
+
+Two natural points to emit a notify exist. Operators should be able
+to pick between them per mirror.
+
+### `trigger.on: source-consume` (default)
+
+A POST is queued as soon as the source consumer hands a record to
+the mirror loop. The record has already been applied to the
+cache-v1 in-memory view (`write()` does that per-record), so a
+consumer that re-fetches `/cache/v1/raw/<key>` immediately on
+notify sees the just-updated value. Destination flush cadence is
+irrelevant; flushes can lag minutes or hours and cache freshness
+on the consumer side is unaffected.
+
+This is what kkv did, and what every existing `@yolean/kafka-keyvalue`
+consumer expects: sub-second invalidation, decoupled from any
+blob-storage flush.
+
+Because per-record HTTP would be wasteful at high record rates,
+`source-consume` requires a `debounce` block:
+
+```yaml
+trigger:
+  on: source-consume
+  debounce:
+    max-records: 100     # batch up to N record-changes per POST
+    max-time-ms: 250      # flush partial batch at most this old
+```
+
+A batch is sent when `max-records` is reached OR `max-time-ms`
+has elapsed since the first record entered the batch, whichever
+comes first. Setting `max-records: 1` yields per-record POSTs;
+the higher the value, the better at coalescing bursts (e.g. a
+restart catchup) at the cost of a small invalidation delay.
+
+`debounce` interacts with `notify.timeout-ms` and `retry`: an
+in-flight batch blocks the next batch from being sent on the same
+target, which provides natural backpressure if the receiver is
+slow. (The source consume loop itself doesn't pause; new records
+land in the next batch's buffer.)
+
+### `trigger.on: destination-flush`
+
+A POST is queued only after the destination(s) durably commit a
+batch; i.e. the same moment the `flushed batch` log line fires
+in mirror-fs / mirror-s3. The notify body's offset range matches
+the flushed snapshot's `from`–`to` exactly. No `debounce` block
+applies (the destination's flush triggers ARE the debounce).
+
+Use case: downstream consumers that care about durability rather
+than freshness; e.g. an archival sync job that wants "tell me
+when a parquet file lands so I can copy it elsewhere". Not the
+right fit for cache invalidation, since destination flush cadence
+is typically minutes.
+
+For mirror-v3's TeeSink (multiple destinations per mirror), the
+notify fires when ALL destinations have committed past the batch's
+high-water offset. Single-destination mirrors fire on every flush.
+A mirror with no blob destinations (kafka-only) cannot use
+`destination-flush`; validator rejects.
+
+### Suppression threshold (fresh deploy vs. returning deploy)
+
+Both triggers suppress dispatch for any event below the mirror's
+**suppression threshold**, computed at supervisor startup as:
+
+```
+suppression_threshold = match broker_committed_offset {
+  Some(committed) => committed,   // returning deploy
+  None            => bootstrap_hwm, // fresh deploy
+}
+```
+
+- **Fresh deploy** (group has no committed offset on the broker):
+  threshold = source-partition high-watermark. Records during the
+  cold-start replay-to-current window don't fan webhooks out, the
+  same gate the legacy kkv Quarkus `KafkaCache.Stage` provided.
+- **Returning deploy** (group has a previously-committed offset
+  `C`): threshold = `C`. Records in `[C, bootstrap_hwm)` represent
+  the gap between the previous pod's last commit and this pod's
+  startup; they fire webhooks because the previous pod was supposed
+  to deliver them but exited first. Records below `C` are suppressed
+  because the previous pod already delivered them.
+
+The supervisor's periodic commit task writes the consumer's
+progress back to the broker every
+`MIRROR_V3_OFFSET_COMMIT_INTERVAL_MS` (default 5s) so this works
+across restarts. See `DELIVERY_SEMANTICS_REVISIT.md` for the
+original incident report from the first downstream maintainer.
+
+Suppression bumps
+`mirror_v3_notify_suppressed_records_total{topic,partition}` so
+operators see how much was skipped. The gate is per-mirror: one
+mirror can begin emitting webhooks while another is still warming
+up against its own threshold.
+
+A webhook consumer that re-fetches via `/cache/v1/raw/<key>` on the
+first notify is guaranteed a consistent view because the cache
+HTTP surface is gated on the same per-mirror `MirrorStatus::Ready`
+predicate (see `README.md#readiness`).
+
+### Compatibility / defaults
+
+- Default `trigger.on` is `source-consume` so the kkv replacement
+  path works out of the box.
+- Default `debounce` is `{ max-records: 100, max-time-ms: 250 }`.
+  Operators tune these for their own latency/cost trade-off.
+- `trigger` and `notify.on-response` are independent of each other:
+  the response policy applies to whichever batch is emitted.
+
+## Outcomes and retry policy
+
+Six distinct request outcomes are recognised. Three of them are
+non-HTTP-response cases (no status code came back); the other three
+are status-class buckets.
+
+| outcome        | what it means                                                                       |
+|----------------|-------------------------------------------------------------------------------------|
+| `timeout`      | Request didn't complete within `notify.timeout-ms`.                                  |
+| `connrefused` | TCP refused fast (target's port is closed or the host is missing).                  |
+| `2xx`          | HTTP 200–299.                                                                        |
+| `3xx`          | HTTP 300–399 (redirects; unusual for a webhook).                                    |
+| `4xx`          | HTTP 400–499 (target says "your request is wrong").                                  |
+| `5xx`          | HTTP 500–599 (target says "I'm broken").                                             |
+
+Each outcome carries the same two-field shape:
+
+```yaml
+outcomes:
+  <name>:
+    retry: <bool>             # if true, retry per notify.retry; if false, jump straight to `final`
+    final: accept | skip | fail
+```
+
+`final` is the action taken either immediately (if `retry: false`)
+or after retry exhaustion (if `retry: true`). Possible values:
+
+| action   | meaning                                                                |
+|----------|------------------------------------------------------------------------|
+| `accept` | Count the batch as successfully delivered, advance.                    |
+| `skip`   | Log a WARN, drop the batch silently, advance. No further action.       |
+| `fail`   | Mirror task errors out; orchestrator restarts; mirror replays the batch from durable state. |
+
+The matrix is intentionally orthogonal; every combination of
+`retry × final` is valid and meaningful:
+
+| `retry` | `final`  | behaviour                                                          | typical use                                |
+|---------|----------|--------------------------------------------------------------------|--------------------------------------------|
+| false   | accept   | one attempt, treat as success regardless                           | `2xx` (always)                              |
+| false   | skip     | one attempt, log + drop                                            | `4xx: skip` when targets briefly return 410 during rolling restart |
+| false   | fail     | one attempt, immediate fatal                                       | `3xx`/`4xx` defaults                        |
+| true    | accept   | retry per policy, treat as success on exhaustion                    | best-effort heartbeats (rare)               |
+| true    | skip     | retry per policy, log + drop on exhaustion                          | non-critical notify channel                 |
+| true    | fail     | retry per policy, fatal on exhaustion                               | `5xx` / `timeout` / `connrefused` defaults |
+
+### Defaults
+
+```yaml
+outcomes:
+  timeout:       { retry: true,  final: fail   }
+  connrefused:  { retry: true,  final: fail   }
+  2xx:           { retry: false, final: accept }
+  3xx:           { retry: false, final: fail   }
+  4xx:           { retry: false, final: fail   }
+  5xx:           { retry: true,  final: fail   }
+```
+
+Rationale:
+
+- **`timeout` and `connrefused`** are network-level; the target
+  may be transiently slow / restarting / being rolled. Retry per
+  policy; only exit when the operator's retry budget is exhausted.
+- **`2xx`** is the only success case. `accept`, no retry.
+- **`3xx`** is almost always a misconfiguration: webhook receivers
+  shouldn't be redirecting. Fail loud so the operator notices.
+- **`4xx`** indicates the mirror is sending something the target
+  doesn't accept; retrying the same payload won't change that.
+  Fail loud.
+- **`5xx`** is transient server-side trouble; retry per policy, then
+  fail if it doesn't clear.
+
+### Operator-facing knobs the matrix unlocks
+
+- **"Targets routinely 404 during rolling restart, don't crash on
+  that"** → `4xx: { retry: false, final: skip }`. Downstream cache
+  staleness is recovered next time the consumer reads cache-v1 with
+  the `x-kkv-last-seen-offsets` header.
+- **"Receiver is flaky, never fail the mirror on it"** →
+  `5xx: { retry: true, final: skip }`. Pure best-effort notify.
+- **"Fail fast on slow receivers instead of waiting through retry"**
+  → `timeout: { retry: false, final: fail }`.
+- **"Stop tolerating 5xx after this many attempts"** → tune
+  `notify.retry.max-attempts` (shared across all retryable
+  outcomes).
+
+### Notes
+
+- `timeout-ms`, `retry.max-attempts`, and `retry.backoff-ms` are
+  three independent dials. The first bounds a single attempt's
+  wall-clock; the other two bound the total attempt count and
+  spacing for any outcome with `retry: true`.
+- If the operator needs per-status-code overrides in future (e.g.
+  `429 → always retry regardless of class default`), a `status` map
+  layered ahead of the class buckets is the natural extension. Out
+  of scope for MVP; the six-outcome surface already covers every
+  current kkv use case.
+- `skip` advances the source-offset position (the batch is
+  considered delivered for ordering purposes) but logs at WARN so
+  operators can grep for dropped batches.
+
+## Notify-only mirrors (zero destinations)
+
+A mirror with `destinations: []` and `notify: { … }` set MUST be
+valid. The use case is "consume from source, emit webhooks, don't
+keep anything durable"; a pure invalidation feed, or a fan-out of
+record-change events into a non-mirror-v3 downstream system.
+
+### Why webhook is not a destination
+
+A destination, in mirror-v3's contract, is a thing that **owns its
+own next-expected source offset** and surfaces it via
+`next_expected_offset()` on startup. The whole "restart correctness
+derives from the destination, never from committed group offsets"
+invariant rests on that. Kafka/FS/S3 sinks all satisfy it: they
+inspect what's already durable on their side and report a number.
+
+A webhook receiver fundamentally cannot. There's no generic
+contract that lets mirror-v3 ask a webhook receiver "what's the
+highest source offset you've successfully processed?". Even a
+sophisticated receiver that tracked it internally would have no
+shared protocol for reporting it back to a generic webhook caller.
+The legacy kkv didn't even try; it relied on Kafka consumer-group
+offsets, which mirror-v3 explicitly does not use.
+
+So `notify` is a *side-effect* of consuming records, not a place
+records are stored. Classifying it as a destination would force
+either a fake `next_expected_offset()` (always 0, or always
+"current") or a separate "destinations don't have to report
+offsets" exception; both of which leak into every sink
+implementation. Keeping it on the mirror as a peer to `destinations`
+keeps the destination trait clean and lets webhook-only mirrors
+exist without distorting the model.
+
+### Restart correctness when there are no destinations
+
+With no durable state, there is no `next_expected_offset` to seek
+to. On every startup the source seeks to the broker's *low
+watermark*, i.e. the earliest record the source still has. Under
+`cleanup.policy=compact` that's effectively offset 0 (or whatever
+survived compaction); under `cleanup.policy=delete` it's whatever
+retention has kept. The mirror then re-fires webhooks for every
+record from that point forward.
+
+For kkv-style cache invalidation this is the *correct* behaviour:
+when the mirror restarts, downstream consumers' caches that depend
+on it are themselves either restarting or holding stale data, and a
+full replay re-syncs them. The legacy kkv had the same shape; it
+held nothing durable and replayed on every restart.
+
+Operators should be aware that "notify-only on a busy topic"
+produces a burst of webhook traffic per mirror restart. Tuning
+`notify.trigger.debounce` upward (larger `max-records`, longer
+`max-time-ms`) coalesces the burst. Adding a cheap blob destination
+(`type: filesystem` to a small PVC, or `type: s3` to a low-cost
+bucket) gives durable resume-from-offset and silences the burst at
+the cost of one more sink.
+
+### Validation rules for notify-only
+
+When `destinations` is empty:
+
+- `notify` MUST be set with at least one target.
+- `notify.trigger.on` MUST be `source-consume` (no destinations to
+  ack, so `destination-flush` is meaningless and the validator
+  rejects it).
+- `format`, `compression`, `keys`, `values`, `compaction`, `flush`
+  are forbidden; they all parameterise destinations that don't
+  exist. (`keys`/`values` may stay as a future opt-in for key/value
+  validation on the source; out of scope for MVP.)
+- `http-access` is forbidden. The cache-v1 contract today requires
+  bootstrapping from durable destination state; a notify-only
+  mirror has none. (A future "bootstrap cache by replaying from
+  broker" mode is conceivable but adds complexity; defer.)
+
+When `destinations` is non-empty AND `notify` is set: no change
+from the rules already specified; both `trigger.on` values are
+allowed, and `http-access` works as before.
+
+### Side note: combining notify with cache-v1 + destinations
+
+The kkv replacement use case needs all three on the same mirror:
+a durable blob destination (parquet to S3 or filesystem), cache-v1
+for `GET /cache/v1/raw/<key>`, and notify so consumers know when
+to re-read. This proposal keeps that combination as the "full"
+shape and notify-only as the minimal one; the schema validator
+doesn't need to choose between them.
+
+## Discovery: why DNS-A is enough
+
+Legacy kkv hit the Kubernetes Endpoints API directly (with a
+matching Role / RoleBinding for `endpoints` `get,watch,list`) to
+enumerate target pods. That ties the mirror to the K8s control
+plane and requires per-namespace RBAC.
+
+For the typical kkv deployment topology (every kkv-target is a
+*headless* Service), the DNS A record set already contains exactly
+the pod IPs kkv was enumerating. A standard resolver returns the
+full set on each query; an HTTP fan-out across all returned
+addresses is equivalent to kkv's Endpoints walk without any K8s
+coupling.
+
+mirror-v3's `fan-out: dns-a` should:
+
+1. Resolve the URL's host on first send. Cache the A/AAAA record set
+   up to the DNS TTL (default 30 s if no TTL is published).
+2. Open one HTTP/1.1 keep-alive connection per address (kept inside
+   a pool, capped at the resolved set size).
+3. POST the batch to all addresses concurrently. Aggregate the
+   results; if any address returns non-2xx after retry, the whole
+   batch is failed.
+4. Re-resolve when the cache TTL expires OR when an address fails
+   repeatedly (forces an immediate re-resolve to pick up scale-up /
+   scale-down).
+
+This handles the rolling-update case: during a Deployment rollout,
+the headless Service's A-record set has both old and new pod IPs
+for a few seconds; mirror-v3 POSTs to both, the old terminating
+pods drain on whatever they got, and the next re-resolve drops
+them. Same behaviour kkv had via Endpoints API.
+
+For non-K8s use (a standalone service behind a single hostname),
+`fan-out: none` skips all of that and uses a single keep-alive
+connection. The choice is per-target so a mirror can mix.
+
+## Interaction with cache-v1
+
+The notify path pushes only after the corresponding records have
+already entered the in-memory cache-v1 view. This guarantees that
+when a consumer re-fetches `/cache/v1/raw/<key>` in response to a
+notify, the value reflects at least the just-notified record. The
+legacy kkv had the same ordering by construction (cache write
+before HTTP push, both in the same consume thread).
+
+Under the default `trigger.on: source-consume`, the per-record
+path is:
+
+1. Apply to the cache-v1 view (`mirror-fs` / `mirror-s3` already
+   does this in `write()`).
+2. Push to destinations as today.
+3. Append to the notify batch buffer (NEW).
+4. If `debounce` trips (record count or wall-clock), drain the
+   buffer asynchronously.
+
+The notify buffer is independent of the destination flush buffer.
+It does NOT depend on `flush.max-time-ms` etc.; consumers want
+fresh invalidation; the destinations can buffer for hours if they
+want. Cache freshness on the consumer side is bounded by
+`notify.trigger.debounce.max-time-ms` (default 250 ms).
+
+Under `trigger.on: destination-flush`, step 4 is replaced by "on
+every successful sink flush, post the just-flushed offset range".
+Cache freshness is then bounded by `flush.max-time-ms` (typically
+seconds-to-minutes), so this mode is wrong for kkv-style cache
+invalidation but right for "downstream wants a hint when a parquet
+lands".
+
+## Interaction with `compaction: log`
+
+No special handling needed. The notify body's `updates` map only
+references keys; under compaction:log the cache-v1 view already
+holds the latest-per-key value, so a re-fetch returns that value.
+If the same key changes twice within one batch, the batch carries
+the key once (set semantics on keys) but the body's `offsets`
+field reflects the highest offset, so the consumer's
+`requireOffset` constraint pins the read to the post-batch state.
+
+## Failure modes and supervision
+
+| Failure                                | mirror-v3 behaviour                                                         |
+|----------------------------------------|-----------------------------------------------------------------------------|
+| Target host fails DNS resolution       | per `outcomes.connrefused` (default `{retry: true, final: fail}`)          |
+| Target TCP refused                     | per `outcomes.connrefused`                                                  |
+| Target slow (no response within timeout-ms) | per `outcomes.timeout` (default `{retry: true, final: fail}`)           |
+| Target returns 2xx                     | per `outcomes.2xx` (default `{retry: false, final: accept}`)                |
+| Target returns 3xx                     | per `outcomes.3xx` (default `{retry: false, final: fail}`)                  |
+| Target returns 4xx                     | per `outcomes.4xx` (default `{retry: false, final: fail}`)                  |
+| Target returns 5xx                     | per `outcomes.5xx` (default `{retry: true, final: fail}`)                   |
+| `retry: true` exhausts `max-attempts`  | apply that outcome's `final` action                                          |
+| One address in a dns-a fan-out fails   | applies per-address; whole batch fails as soon as one address's outcome resolves to `fail` |
+| Buffer growth from slow targets        | backpressure: pause the source consume loop until current batch drains; surface as a metric |
+
+Restart correctness is unaffected: notify is best-effort *and*
+ordered. If the process crashes mid-batch, the records weren't
+committed to the source offset position either, so on restart the
+mirror re-consumes from the destination's `next_expected_offset`
+and re-issues the lost batch.
+
+## Metrics
+
+Adds, alongside the existing `mirror_v3_destination_*` counters:
+
+| Metric                                          | Type    | Labels                                  | Meaning                                       |
+|-------------------------------------------------|---------|------------------------------------------|-----------------------------------------------|
+| `mirror_v3_notify_records_total`                | counter | `topic`, `partition`                     | Records appended to a notify batch            |
+| `mirror_v3_notify_batches_total`                | counter | `topic`, `partition`, `result=ok\|fail`  | Batches sent                                  |
+| `mirror_v3_notify_post_duration_seconds`        | histogram | `topic`, `partition`, `target_host`    | Per-target HTTP latency                       |
+| `mirror_v3_notify_inflight_retry`               | gauge   | `topic`, `partition`, `target_host`      | Current retry attempt (1-based, 0 when idle)  |
+| `mirror_v3_notify_buffer_records`               | gauge   | `topic`, `partition`                     | Current buffer depth                          |
+
+`target_host` is the resolved host the request went to; for
+`fan-out: dns-a` this is the pod IP, so dashboards see per-pod
+latency.
+
+## Logging
+
+- One INFO line at startup per notify-enabled mirror:
+  `notify start mirror=<name> api=kkv-v1 targets=<host>[,host…] fan-out=<mode>`.
+- One INFO line per successful batch:
+  `notify sent mirror=<name> batch_records=<n> highest_offset=<o> targets=<n> elapsed_ms=<m>`.
+- One WARN per failed attempt with retry remaining:
+  `notify retry mirror=<name> target=<addr> attempt=<i>/<max> reason=<err>`.
+- One ERROR on retry exhaustion (mirror-task-fatal):
+  `notify exhausted mirror=<name> target=<addr> attempts=<n>`.
+
+Per-record DEBUG only; counters cover the operational signal.
+
+## Validation
+
+- `notify` requires `http-access.cache-v1` on the same mirror.
+- `notify.targets` non-empty.
+- `notify.trigger.debounce.max-records >= 1`, `max-time-ms >= 1`
+  (when `trigger.on: source-consume`).
+- `notify.timeout-ms >= 1`.
+- `notify.retry.max-attempts >= 1`, `notify.retry.backoff-ms >= 1`.
+- `notify.outcomes` may omit keys; omitted keys fall back to the
+  default table above. Listing all six is allowed and
+  recommended for production configs so the policy is explicit.
+- `final: accept` on `timeout`/`connrefused`/`5xx` with
+  `retry: false` is a valid but unusual combination; the validator
+  warns (operator probably meant `retry: true, final: accept`).
+- **Destinations relaxation** (new in this proposal):
+  `destinations` MAY be empty *if and only if* `notify` is set with
+  at least one target. See "Notify-only mirrors" above for the full
+  matrix of which other fields are then forbidden
+  (`format`/`compression`/`compaction`/`flush`/`http-access`) and
+  which trigger modes are required (`trigger.on: source-consume`).
+- `notify.targets[].url` parses as a valid URL with http:// or https://.
+- Each target's resolved host must produce ≥1 address at startup,
+  otherwise validation fails (catches typos / missing Services
+  before the mirror runs).
+
+## Out-of-scope (future)
+
+- **Authentication.** Bearer tokens / mTLS / HMAC-signed bodies.
+- **Selective subscription.** Subscribe to a key prefix or a header.
+- **Push-only mode for kkv-style consumers.** Notify *with* zero
+  destinations (covered in "Notify-only mirrors") is in scope.
+  Notify without cache-v1 *but with destinations*; i.e. the
+  consumer is expected to re-read from the durable destination
+  rather than from cache-v1; is deferred. Requires a slightly
+  different body shape (record-data inline rather than
+  null-valued `updates`) and is unrelated to the kkv replacement
+  use case driving this proposal.
+- **Multi-API targets.** Same mirror notifying both kkv-v1 and a
+  future variant.
+- **Per-target retry budgets.** Independent failure handling so one
+  bad target doesn't crash the mirror.
+
+Each is a small additive change on top of this minimal core.
+
+## Open questions
+
+1. Should `notify` live on the mirror or as a special entry in
+   `destinations[]`? Putting it on the mirror keeps the
+   destinations-are-durable-storage invariant clean (notify is a
+   side-effect, not a sink). Recommendation: on the mirror.
+2. Should the `updates` body be allowed to be empty (`{}`) when a
+   batch hits `max-records` and the buffered key-set would be large?
+   Consumers using `streamValues()` re-fetch everything anyway.
+   Saves bytes; matches the kkv behaviour on large bursts. Probably
+   worth allowing.
+3. Should a failed batch immediately re-resolve DNS, or only after
+   the TTL elapses? Re-resolving immediately recovers from
+   scale-down faster; staying with the cached set is faster on
+   transient single-pod errors. Recommendation: re-resolve on any
+   failure (cheap; same DNS query that's already cached after).
+4. Should `notify` honour `MIRROR_V3_NOTIFY_DISABLED=true` for ops
+   drills (rolling the mirror without invalidating downstream
+   caches)? Useful for some debugging workflows; harmless if
+   omitted.
+
+---
+
+References:
+
+- `@yolean/kafka-keyvalue` Node client (the receiving side):
+  exports `ON_UPDATE_DEFAULT_PATH = "/kafka-keyvalue/v1/updates"`
+  and `getOnUpdateRoute()` from `index.js`; the request body
+  `{ topic, offsets, updates }` is parsed in `KafkaKeyValue.js`
+  and each `key` in `updates` is re-fetched via cache-v1 with the
+  `requireOffset: highestOffset` constraint.
+- Legacy kkv (Yolean/kafka-keyvalue Quarkus): env vars
+  `TARGET_SERVICE_NAME`, `TARGET_SERVICE_PORT`,
+  `TARGET_SERVICE_NAMESPACE` resolve a headless Service via the
+  Kubernetes Endpoints API; one POST per pod IP per consumed batch.
diff --git a/crates/mirror-bin/Cargo.toml b/crates/mirror-bin/Cargo.toml
index 78bbee6..c173d88 100644
--- a/crates/mirror-bin/Cargo.toml
+++ b/crates/mirror-bin/Cargo.toml
@@ -19,10 +19,12 @@ mirror-envelope = { workspace = true }
 mirror-kafka = { workspace = true }
 mirror-fs = { workspace = true }
 mirror-s3 = { workspace = true }
+mirror-notify-kkv = { workspace = true }
 object_store = { workspace = true }
 clap = { workspace = true }
 anyhow = { workspace = true }
 tokio = { workspace = true }
+async-trait = { workspace = true }
 tracing = { workspace = true }
 tracing-subscriber = { workspace = true }
 serde = { workspace = true }
diff --git a/crates/mirror-bin/src/ack_tracker.rs b/crates/mirror-bin/src/ack_tracker.rs
new file mode 100644
index 0000000..58da341
--- /dev/null
+++ b/crates/mirror-bin/src/ack_tracker.rs
@@ -0,0 +1,325 @@
+//! Per-mirror ack tracking and the periodic source-commit task.
+//!
+//! The supervisor builds one [`AckTracker`] per spawned mirror at
+//! startup. The tracker aggregates two kinds of "we delivered through
+//! offset N" signals:
+//!
+//! * A notify-side signal from `KkvV1Notifier` / `FlushDispatcher`
+//!   (when the mirror has a `notify:` block). The notifier installs
+//!   the tracker as its [`mirror_core::AckSink`] via
+//!   `with_ack_sink`; every successful drain calls
+//!   `note_through(batch.high_offset + 1)`.
+//! * One per-destination signal, fed by [`FlushAckShim`] (blob
+//!   sinks) or [`WriteAckShim`] (Kafka sinks). Each shim sits on a
+//!   destination's existing observer hook and bumps the matching
+//!   [`DestAckSlot::flushed_through`] on every flush / write.
+//!
+//! The periodic commit task in [`spawn_periodic_commit_task`] reads
+//! [`AckTracker::commit_offset`] every
+//! `MIRROR_V3_OFFSET_COMMIT_INTERVAL_MS` (default 5 s), stages the
+//! result via [`mirror_kafka::KafkaCommitHandle::commit_through`],
+//! and flushes it with `commit_pending`. The commit handle is a
+//! cheap clone of an `Arc<StreamConsumer>` so the task can run
+//! independently of the source-owning run loop.
+
+use std::sync::atomic::{AtomicU64, Ordering};
+use std::sync::Arc;
+use std::time::Duration;
+
+use mirror_core::{AckSink, FlushObserver, WriteObserver};
+use mirror_kafka::KafkaCommitHandle;
+use tokio::sync::watch;
+
+const DEFAULT_COMMIT_INTERVAL: Duration = Duration::from_secs(5);
+
+/// Read the commit interval from `MIRROR_V3_OFFSET_COMMIT_INTERVAL_MS`,
+/// falling back to [`DEFAULT_COMMIT_INTERVAL`]. A value of `0`
+/// disables the periodic task (the supervisor then never advances
+/// the broker-side committed offset and the mirror behaves as it did
+/// before this work).
+pub fn commit_interval_from_env() -> Duration {
+    match std::env::var("MIRROR_V3_OFFSET_COMMIT_INTERVAL_MS")
+        .ok()
+        .as_deref()
+    {
+        Some(s) => match s.parse::<u64>() {
+            Ok(ms) => Duration::from_millis(ms),
+            Err(_) => DEFAULT_COMMIT_INTERVAL,
+        },
+        None => DEFAULT_COMMIT_INTERVAL,
+    }
+}
+
+/// One destination's ack slot. Held by both the supervisor (in the
+/// [`AckTracker`]) and by the shim observer installed on the
+/// inner sink, via `Arc::clone`.
+#[derive(Debug)]
+pub struct DestAckSlot {
+    /// Operator-chosen destination name; surfaces in logs and (in a
+    /// later commit) in the structured `/q/health/ready` body.
+    #[allow(dead_code)] // surfaced in commit 7 + commit 10
+    pub name: String,
+    /// Highest offset strictly *below which* this destination has
+    /// durably accepted everything. Monotonic via `fetch_max`.
+    pub flushed_through: AtomicU64,
+    /// Whether this destination's ack gates source-side readiness
+    /// (and, for non-notify mirrors, the source commit). Per-
+    /// destination YAML field lands in a later commit; for now the
+    /// supervisor passes `true` for every destination.
+    #[allow(dead_code)] // honoured in commit 7 + commit 9
+    pub affects_readiness: bool,
+}
+
+impl DestAckSlot {
+    pub fn new(name: String, affects_readiness: bool) -> Self {
+        Self {
+            name,
+            flushed_through: AtomicU64::new(0),
+            affects_readiness,
+        }
+    }
+
+    pub fn note_through(&self, through: u64) {
+        self.flushed_through.fetch_max(through, Ordering::AcqRel);
+    }
+}
+
+/// Per-mirror ack tracker. The `notify` slot is `Some` when the
+/// mirror has a `notify:` block (source-consume or destination-
+/// flush); the destinations list always has one entry per
+/// destination in the YAML.
+pub struct AckTracker {
+    notify: Option<AtomicU64>,
+    destinations: Vec<Arc<DestAckSlot>>,
+}
+
+impl AckTracker {
+    pub fn new(notify_present: bool, destinations: Vec<Arc<DestAckSlot>>) -> Self {
+        let notify = if notify_present {
+            Some(AtomicU64::new(0))
+        } else {
+            None
+        };
+        Self {
+            notify,
+            destinations,
+        }
+    }
+
+    /// The offset the supervisor's periodic commit task should
+    /// stage. Returns 0 when nothing has been delivered yet (the
+    /// commit task interprets 0 as "skip this tick").
+    ///
+    /// For notify mirrors the notify-side ack is authoritative;
+    /// destinations are observability-only. For non-notify mirrors
+    /// the highest destination ack wins — the supervisor commits the
+    /// fastest destination's progress, matching the
+    /// `DELIVERY_SEMANTICS_REVISIT.md § 2` rule that non-notify
+    /// commits are observability rather than restart-resume state.
+    pub fn commit_offset(&self) -> u64 {
+        if let Some(notify) = self.notify.as_ref() {
+            notify.load(Ordering::Acquire)
+        } else {
+            self.destinations
+                .iter()
+                .map(|d| d.flushed_through.load(Ordering::Acquire))
+                .max()
+                .unwrap_or(0)
+        }
+    }
+}
+
+impl AckSink for AckTracker {
+    fn note_through(&self, through: u64) {
+        // Only the notify slot is fed via the AckSink trait surface;
+        // destinations have their own shim observers writing
+        // directly to their `DestAckSlot`s.
+        if let Some(notify) = self.notify.as_ref() {
+            notify.fetch_max(through, Ordering::AcqRel);
+        }
+    }
+}
+
+/// Bridges a blob sink's `FlushObserver` callback into a per-
+/// destination ack slot. The slot's `flushed_through` advances to
+/// `to + 1` after each flush.
+pub struct FlushAckShim {
+    pub dest: Arc<DestAckSlot>,
+}
+
+impl FlushObserver for FlushAckShim {
+    fn on_flushed(&self, _from: u64, to: u64) {
+        self.dest.note_through(to + 1);
+    }
+}
+
+/// Bridges a Kafka sink's `WriteObserver` callback into a per-
+/// destination ack slot. The slot's `flushed_through` advances to
+/// `source_offset + 1` after each accepted produce.
+pub struct WriteAckShim {
+    pub dest: Arc<DestAckSlot>,
+}
+
+impl WriteObserver for WriteAckShim {
+    fn on_written(&self, source_offset: u64) {
+        self.dest.note_through(source_offset + 1);
+    }
+}
+
+/// Spawn the periodic commit task for one mirror. Returns the
+/// `JoinHandle`; callers can drop it (the task self-terminates when
+/// `shutdown_rx` flips `true` or the process exits).
+///
+/// The task is best-effort: it logs and continues on any commit
+/// error rather than crashing the supervisor. The next tick retries,
+/// and the destination chain's own restart-correctness logic is
+/// what protects against lost records — the broker-side committed
+/// offset is an *optimisation* (closes the between-pods notify gap
+/// on next restart) plus an observability handle, not the durable
+/// source of truth.
+pub fn spawn_periodic_commit_task(
+    handle: KafkaCommitHandle,
+    tracker: Arc<AckTracker>,
+    interval: Duration,
+    mirror_name: String,
+    mut shutdown_rx: watch::Receiver<bool>,
+) -> tokio::task::JoinHandle<()> {
+    tokio::spawn(async move {
+        if interval.is_zero() {
+            tracing::info!(
+                mirror = %mirror_name,
+                "MIRROR_V3_OFFSET_COMMIT_INTERVAL_MS=0; periodic commit task disabled"
+            );
+            return;
+        }
+        let mut iv = tokio::time::interval(interval);
+        iv.set_missed_tick_behavior(tokio::time::MissedTickBehavior::Skip);
+        // Consume the immediate tick `tokio::time::interval` fires.
+        iv.tick().await;
+        let mut last_committed: u64 = 0;
+        loop {
+            tokio::select! {
+                biased;
+                _ = shutdown_rx.changed() => {
+                    if *shutdown_rx.borrow() {
+                        tracing::debug!(
+                            mirror = %mirror_name,
+                            "shutdown requested; periodic commit task exiting"
+                        );
+                        return;
+                    }
+                }
+                _ = iv.tick() => {
+                    let off = tracker.commit_offset();
+                    if off == 0 || off == last_committed {
+                        continue;
+                    }
+                    if let Err(e) = handle.commit_through(off) {
+                        tracing::warn!(
+                            mirror = %mirror_name,
+                            offset = off,
+                            error = %e,
+                            "commit_through failed; will retry next tick"
+                        );
+                        continue;
+                    }
+                    if let Err(e) = handle.commit_pending() {
+                        tracing::warn!(
+                            mirror = %mirror_name,
+                            offset = off,
+                            error = %e,
+                            "commit_pending failed; offset is staged, retry next tick"
+                        );
+                        continue;
+                    }
+                    tracing::debug!(
+                        mirror = %mirror_name,
+                        offset = off,
+                        prev = last_committed,
+                        "committed source offset"
+                    );
+                    last_committed = off;
+                }
+            }
+        }
+    })
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn notify_tracker_commit_offset_reflects_note_through() {
+        let tracker = AckTracker::new(true, vec![]);
+        assert_eq!(tracker.commit_offset(), 0);
+        tracker.note_through(5);
+        assert_eq!(tracker.commit_offset(), 5);
+        tracker.note_through(7);
+        assert_eq!(tracker.commit_offset(), 7);
+    }
+
+    #[test]
+    fn notify_tracker_ignores_regressions() {
+        let tracker = AckTracker::new(true, vec![]);
+        tracker.note_through(7);
+        tracker.note_through(3);
+        assert_eq!(
+            tracker.commit_offset(),
+            7,
+            "fetch_max means a lower value cannot regress the slot"
+        );
+    }
+
+    #[test]
+    fn non_notify_tracker_uses_max_destination_ack() {
+        let a = Arc::new(DestAckSlot::new("a".into(), true));
+        let b = Arc::new(DestAckSlot::new("b".into(), true));
+        let tracker = AckTracker::new(false, vec![Arc::clone(&a), Arc::clone(&b)]);
+        assert_eq!(tracker.commit_offset(), 0);
+        a.note_through(10);
+        assert_eq!(tracker.commit_offset(), 10);
+        b.note_through(5);
+        assert_eq!(tracker.commit_offset(), 10, "max wins");
+        b.note_through(20);
+        assert_eq!(tracker.commit_offset(), 20);
+    }
+
+    #[test]
+    fn non_notify_tracker_ignores_ack_sink_note_through() {
+        let dest = Arc::new(DestAckSlot::new("d".into(), true));
+        let tracker = AckTracker::new(false, vec![Arc::clone(&dest)]);
+        // `AckSink::note_through` only feeds the notify slot. A
+        // mirror with no notify block has no notify slot, so this
+        // call is silently dropped — destinations are the only
+        // signal source.
+        tracker.note_through(42);
+        assert_eq!(tracker.commit_offset(), 0);
+        dest.note_through(7);
+        assert_eq!(tracker.commit_offset(), 7);
+    }
+
+    #[test]
+    fn flush_ack_shim_advances_dest_to_to_plus_one() {
+        let dest = Arc::new(DestAckSlot::new("fs".into(), true));
+        let shim = FlushAckShim {
+            dest: Arc::clone(&dest),
+        };
+        shim.on_flushed(0, 9);
+        assert_eq!(dest.flushed_through.load(Ordering::Acquire), 10);
+        shim.on_flushed(10, 19);
+        assert_eq!(dest.flushed_through.load(Ordering::Acquire), 20);
+    }
+
+    #[test]
+    fn write_ack_shim_advances_dest_to_offset_plus_one() {
+        let dest = Arc::new(DestAckSlot::new("kafka".into(), true));
+        let shim = WriteAckShim {
+            dest: Arc::clone(&dest),
+        };
+        for off in 0..5 {
+            shim.on_written(off);
+        }
+        assert_eq!(dest.flushed_through.load(Ordering::Acquire), 5);
+    }
+}
diff --git a/crates/mirror-bin/src/main.rs b/crates/mirror-bin/src/main.rs
index ed1224b..c0f31f2 100644
--- a/crates/mirror-bin/src/main.rs
+++ b/crates/mirror-bin/src/main.rs
@@ -4,11 +4,25 @@ use std::sync::Arc;
 
 use anyhow::{Context, Result};
 use clap::{Parser, Subcommand};
-use mirror_config::{Destination, Mirror};
-use mirror_core::{run_mirror, MetricLabels, MIRROR_LABELS};
+use mirror_config::{Destination, HttpAccess, Mirror};
+
+mod ack_tracker;
+mod readiness_poller;
+use ack_tracker::{
+    commit_interval_from_env, spawn_periodic_commit_task, AckTracker, DestAckSlot, FlushAckShim,
+    WriteAckShim,
+};
+use mirror_core::{
+    heartbeat_interval_from_env, run_mirror_with_notifier, MetricLabels, NoOpNotifier, Record,
+    Sink, SinkError, MIRROR_LABELS,
+};
 use mirror_fs::{FilesystemSink, FilesystemSinkConfig};
 use mirror_kafka::{KafkaSink, KafkaSinkConfig, KafkaSource, KafkaSourceConfig};
 use mirror_s3::{S3Sink, S3SinkConfig};
+use readiness_poller::{
+    readiness_lag_tolerance_from_env, readiness_poll_interval_from_env, spawn_readiness_poller,
+    PollSpec,
+};
 use tracing::Instrument;
 use tracing_subscriber::EnvFilter;
 
@@ -452,7 +466,7 @@ async fn run(path: PathBuf) -> Result<()> {
     }
     if enabled_mirrors.is_empty() {
         anyhow::bail!(
-            "all {} mirror(s) are disabled (enabled: false); nothing to do — \
+            "all {} mirror(s) are disabled (enabled: false); nothing to do - \
              enable at least one mirror or scale this deployment to zero replicas",
             total_mirrors
         );
@@ -471,7 +485,7 @@ async fn run(path: PathBuf) -> Result<()> {
     // One shutdown channel, cloned per mirror. Listening for Ctrl-C
     // here means SIGINT triggers graceful flush; in containers,
     // SIGTERM will arrive on the same path because tokio's
-    // ctrl_c handler is the platform's INT handler — for full SIGTERM
+    // ctrl_c handler is the platform's INT handler - for full SIGTERM
     // support a unix-signals branch can be added next.
     let (shutdown_tx, shutdown_rx) = tokio::sync::watch::channel(false);
     let signal_tx = shutdown_tx.clone();
@@ -495,37 +509,63 @@ async fn run(path: PathBuf) -> Result<()> {
         }
     }
 
-    // Build a shared CacheState if any *enabled* mirror opted into
-    // http-access. Capture each opt-in mirror's source-partition
-    // high-watermark *now* so the readiness gate flips only after
-    // we've consumed past whatever was already there at startup. (KKV
-    // semantics — dependents must not see a partially-rebuilt cache
-    // after a reload.) Disabled mirrors never register, otherwise
-    // their slot would never flip ready and the whole cache would
-    // sit at 503 forever.
-    let cache_state = if enabled_mirrors.iter().any(|m| m.http_access.is_some()) {
-        let state = std::sync::Arc::new(mirror_core::CacheState::new());
+    // Every *enabled* mirror gets a `CacheState` slot, regardless of
+    // whether it has `http_access` or `notify`. The slot is what the
+    // structured `/q/health/ready` body enumerates; downstream
+    // features (HTTP routes, notify suppression gate, source-commit
+    // task) only attach when the mirror opts into them. Disabled
+    // mirrors never register: otherwise their slot would never flip
+    // ready and the aggregate /q/health/ready would sit at 503
+    // forever. Capture each registered mirror's source-partition
+    // high-watermark *now* so the gate flips only after we've
+    // consumed past whatever was already there at startup (KKV
+    // semantics: dependents must not see a partially-rebuilt cache,
+    // and webhook subscribers must not see historical-replay
+    // invalidations).
+    let cache_state = if enabled_mirrors.is_empty() {
+        None
+    } else {
+        let tolerance = readiness_lag_tolerance_from_env();
+        let state = std::sync::Arc::new(
+            mirror_core::CacheState::new().with_readiness_lag_tolerance(tolerance),
+        );
         for m in &enabled_mirrors {
-            if m.http_access.is_some() {
-                let hwm = fetch_hwm_for_mirror(m).await?;
-                tracing::info!(
-                    mirror = %m.name,
-                    topic = %m.topic,
-                    partition = m.partition,
-                    bootstrap_hwm = hwm,
-                    "registering mirror with cache readiness gate"
-                );
-                state.register_mirror(&m.name, hwm);
-            }
+            let hwm = fetch_hwm_for_mirror(m).await?;
+            let last_committed = fetch_committed_offset_for_mirror(m).await?;
+            let is_main = m
+                .http_access
+                .as_ref()
+                .is_some_and(|h| h.cache_v1_main.is_some());
+            tracing::info!(
+                mirror = %m.name,
+                topic = %m.topic,
+                partition = m.partition,
+                bootstrap_hwm = hwm,
+                last_committed = ?last_committed,
+                is_main,
+                lag_tolerance = tolerance,
+                "registering mirror with cache readiness gate"
+            );
+            state.register_mirror_with_topic(
+                &m.name,
+                hwm,
+                last_committed,
+                is_main,
+                &m.topic,
+                m.partition,
+            );
         }
         Some(state)
-    } else {
-        None
     };
 
-    // Spawn the cache HTTP server if any mirror has opt-in. Server
-    // runs until shutdown_rx flips OR /_admin/v1/shutdown is hit.
-    if let Some(state) = cache_state.as_ref() {
+    // Spawn the cache HTTP server if any mirror opted into a route
+    // surface (`cache-v1` or `cache-v1-main`). Mirrors that only
+    // need the bootstrap-hwm gate (notify-only) don't pull in the
+    // server. Runs until shutdown_rx flips OR /_admin/v1/shutdown is hit.
+    let wants_http_routes = enabled_mirrors
+        .iter()
+        .any(|m| m.http_access.as_ref().is_some_and(HttpAccess::any_enabled));
+    if let (Some(state), true) = (cache_state.as_ref(), wants_http_routes) {
         let addr = cache_listen_addr();
         let state = std::sync::Arc::clone(state);
         let cache_shutdown_rx = shutdown_rx.clone();
@@ -575,19 +615,22 @@ fn cache_listen_addr() -> std::net::SocketAddr {
     std::net::SocketAddr::from(([0, 0, 0, 0], port))
 }
 
-/// Materialise a `CacheBinding` for the given mirror if it has
-/// `http-access` set and the supervisor built a shared CacheState.
+/// Materialise a `CacheBinding` for the given mirror. Every enabled
+/// mirror now registers a slot in the shared CacheState (the
+/// supervisor enumerates them in the structured `/q/health/ready`
+/// body), so the binding is materialised whenever a `CacheState`
+/// exists at all. The binding wires the consume loop's TeeSink to
+/// that slot so `apply_record` advances the slot's
+/// `last_applied_offset` and flips the readiness gate at the right
+/// point.
 fn mirror_cache_binding(
     mirror: &Mirror,
     cache: Option<&std::sync::Arc<mirror_core::CacheState>>,
 ) -> Option<mirror_core::CacheBinding> {
-    match (mirror.http_access.as_ref(), cache) {
-        (Some(_), Some(state)) => Some(mirror_core::CacheBinding {
-            state: std::sync::Arc::clone(state),
-            mirror_name: mirror.name.clone(),
-        }),
-        _ => None,
-    }
+    cache.map(|state| mirror_core::CacheBinding {
+        state: std::sync::Arc::clone(state),
+        mirror_name: mirror.name.clone(),
+    })
 }
 
 /// Per-mirror bootstrap watermark. Run in a `spawn_blocking` task
@@ -612,6 +655,36 @@ async fn fetch_hwm_for_mirror(mirror: &Mirror) -> Result<u64> {
     Ok(hwm.max(0) as u64)
 }
 
+/// Read the broker's `__consumer_offsets` for this mirror's group
+/// at startup. `Ok(None)` means the group has no committed value yet
+/// (fresh deploy); the `CacheState` then falls back to
+/// `bootstrap_hwm` for the suppression threshold. Like `fetch_hwm_for_mirror`,
+/// this hits `BaseConsumer` synchronously under `spawn_blocking`.
+async fn fetch_committed_offset_for_mirror(mirror: &Mirror) -> Result<Option<u64>> {
+    let bootstrap = mirror.source.bootstrap_servers.clone();
+    let group_id = mirror
+        .source
+        .group_id
+        .clone()
+        .unwrap_or_else(|| format!("mirror-v3-{}", mirror.name));
+    let topic = mirror.topic.clone();
+    let partition = mirror.partition as i32;
+    let mirror_name = mirror.name.clone();
+    let committed = tokio::task::spawn_blocking(move || {
+        mirror_kafka::fetch_committed_offset(
+            &bootstrap,
+            &group_id,
+            &topic,
+            partition,
+            std::time::Duration::from_secs(10),
+        )
+    })
+    .await
+    .with_context(|| format!("mirror {mirror_name}: committed task join"))?
+    .with_context(|| format!("mirror {mirror_name}: fetch committed offset"))?;
+    Ok(committed)
+}
+
 async fn shutdown_signal(mut rx: tokio::sync::watch::Receiver<bool>) {
     if *rx.borrow() {
         return;
@@ -621,7 +694,7 @@ async fn shutdown_signal(mut rx: tokio::sync::watch::Receiver<bool>) {
 
 /// Install the Prometheus exporter on `0.0.0.0:<port>`. Port defaults
 /// to 9090; override with `MIRROR_V3_METRICS_PORT` (set to `0` to
-/// disable). A failure to bind logs at warn level and is non-fatal —
+/// disable). A failure to bind logs at warn level and is non-fatal -
 /// the operator's observability story degrades, but the mirror keeps
 /// running.
 fn install_metrics_exporter() {
@@ -660,6 +733,12 @@ async fn spawn_mirror(
     );
     let source = KafkaSource::open(source_cfg)
         .with_context(|| format!("opening source for mirror {}", mirror.name))?;
+    // Snapshot two commit handles before the run loop takes
+    // ownership of the source. Each `KafkaCommitHandle` clones the
+    // underlying `Arc<StreamConsumer>` (cheap); the periodic commit
+    // task and the readiness poller each get their own.
+    let commit_handle = source.commit_handle();
+    let commit_handle_for_poller = source.commit_handle();
 
     let name = mirror.name.clone();
     let labels = MetricLabels {
@@ -669,27 +748,170 @@ async fn spawn_mirror(
     let compaction = compaction_label(mirror.compaction);
 
     // Build one inner Sink per destination, then wrap them in a tee.
-    // The single-destination case routes through a length-1 tee too —
+    // The single-destination case routes through a length-1 tee too -
     // this keeps the cache binding's per-record fanout on a single
-    // code path.
-    let mut inners: Vec<(String, Box<dyn mirror_core::Sink>)> =
-        Vec::with_capacity(mirror.destinations.len());
+    // code path. A *notify-only* mirror (no destinations + a notify
+    // block, validated upstream) wraps a single in-memory
+    // [`NotifyOnlySink`] in the tee so the rest of the run loop -
+    // bootstrap, low-watermark alignment, idle-drift checks - keeps
+    // its existing shape.
+    let mut inners: Vec<(String, Box<dyn Sink>)> = Vec::with_capacity(
+        // +1 reserved for the notify-only path; harmless when
+        // destinations is non-empty.
+        mirror.destinations.len().max(1),
+    );
     let mut dest_descriptions: Vec<String> = Vec::with_capacity(mirror.destinations.len());
+    // Per-destination ack slots, shared by Arc with the shims
+    // installed on each inner sink and with the AckTracker that the
+    // periodic commit task reads. `affects_readiness` is set from the
+    // YAML `affects-readiness:` field on each destination (default
+    // true): a destination with `affects-readiness: false` still
+    // records `flushed_through` for observability but is skipped when
+    // computing `MirrorStatus::DestinationLagging`.
+    let mut dest_ack_slots: Vec<Arc<DestAckSlot>> = Vec::with_capacity(mirror.destinations.len());
     for dest in &mirror.destinations {
         let inner_name = dest.effective_name(&mirror.name);
         let kind = destination_type(dest);
         dest_descriptions.push(format!("{inner_name}({kind})"));
-        let sink: Box<dyn mirror_core::Sink> =
+        let mut sink: Box<dyn Sink> =
             open_inner_sink(dest, &mirror, &inner_name, cache.as_ref()).await?;
+        let slot = Arc::new(DestAckSlot::new(
+            inner_name.clone(),
+            dest.affects_readiness(),
+        ));
+        // Pick the right observer hook per destination type. Blob
+        // sinks fire `FlushObserver` per buffered flush; Kafka sinks
+        // commit per-record and fire `WriteObserver`. The shim feeds
+        // the destination ack slot in either case.
+        //
+        // Note: when destination-flush trigger is enabled (only on
+        // mirrors with at least one blob destination), the tee-level
+        // `set_flush_observer` call further down replaces the per-
+        // sink FlushObserver installed here with a tee-coordinated
+        // version. That's intentional: in destination-flush mode the
+        // notify ack is authoritative for source-side commits, so
+        // losing the per-destination ack signal for blob sinks is
+        // acceptable.
+        match dest {
+            Destination::Kafka(_) => {
+                sink.set_write_observer(Arc::new(WriteAckShim {
+                    dest: Arc::clone(&slot),
+                }));
+            }
+            Destination::Filesystem(_) | Destination::S3(_) => {
+                sink.set_flush_observer(Arc::new(FlushAckShim {
+                    dest: Arc::clone(&slot),
+                }));
+            }
+        }
+        dest_ack_slots.push(slot);
         inners.push((inner_name, sink));
     }
-    let tee = mirror_core::TeeSink::open(inners, cache.clone())
+    if inners.is_empty() {
+        // Notify-only mirror: spec says "On every startup the source
+        // seeks to the broker's low watermark". `NotifyOnlySink`
+        // declares `allows_compacted_source = true` so the run loop's
+        // bootstrap branch aligns the (in-memory) head to
+        // `low_watermark`. The notifier sees every record from there
+        // forward.
+        inners.push((
+            "notify-only".to_string(),
+            Box::new(NotifyOnlySink::default()) as Box<dyn Sink>,
+        ));
+        dest_descriptions.push("notify-only".to_string());
+    }
+    let mut tee = mirror_core::TeeSink::open(inners, cache.clone())
         .await
         .map_err(|e| anyhow::anyhow!("opening tee for mirror {name}: {e}"))?;
 
+    // Build the per-mirror ack tracker. Notify-side slot exists iff
+    // the mirror has a `notify:` block; destinations always
+    // contribute (commit 9 wires `affects-readiness` to filter).
+    let notify_present = mirror.notify.is_some();
+    let ack_tracker = Arc::new(AckTracker::new(notify_present, dest_ack_slots));
+
+    // Branch on the notify trigger mode (validated upstream in
+    // mirror-config; see WEBHOOKS.md § Trigger):
+    //   * source-consume → build `KkvV1Notifier`, pass as the run
+    //     loop's `N: Notifier`.
+    //   * destination-flush → build `FlushDispatcher`, attach as the
+    //     TeeSink's `FlushObserver`; the run loop's notifier is
+    //     `NoOpNotifier` (records flow through unobserved).
+    //
+    // In both modes the notifier's `with_ack_sink` installs the
+    // per-mirror `AckTracker` so each successful drain/POST feeds
+    // the periodic commit task's view of "delivered through N".
+    let trigger_mode = mirror.notify.as_ref().map(|n| n.trigger.on);
+    let ack_sink_for_notifier: Arc<dyn mirror_core::AckSink> =
+        Arc::clone(&ack_tracker) as Arc<dyn mirror_core::AckSink>;
+    let notifier_opt = match trigger_mode {
+        Some(mirror_config::TriggerOn::SourceConsume) => {
+            build_source_consume_notifier(&mirror, cache.as_ref())?
+                .map(|n| n.with_ack_sink(Arc::clone(&ack_sink_for_notifier)))
+        }
+        _ => None,
+    };
+    if matches!(
+        trigger_mode,
+        Some(mirror_config::TriggerOn::DestinationFlush)
+    ) {
+        let dispatcher = build_flush_dispatcher(&mirror, cache.as_ref())?
+            .with_ack_sink(Arc::clone(&ack_sink_for_notifier));
+        tee.set_flush_observer(std::sync::Arc::new(dispatcher));
+    }
+
+    // Spawn the periodic source-commit task. It reads
+    // `AckTracker::commit_offset()` every
+    // `MIRROR_V3_OFFSET_COMMIT_INTERVAL_MS` (default 5 s), stages
+    // it via the Kafka commit handle, and flushes to the broker.
+    // The handle clones an `Arc<StreamConsumer>` internally so this
+    // task runs independently of the source-owning run loop.
+    let _commit_task = spawn_periodic_commit_task(
+        commit_handle,
+        Arc::clone(&ack_tracker),
+        commit_interval_from_env(),
+        name.clone(),
+        shutdown_rx.clone(),
+    );
+
+    // Spawn the per-mirror readiness poller when a cache slot
+    // exists (i.e. the mirror has `http_access` or `notify`). The
+    // poller refreshes the broker end offset for the lag-based
+    // readiness predicate and detects source-assignment loss.
+    if let Some(binding) = cache.as_ref() {
+        let _poller = spawn_readiness_poller(
+            PollSpec {
+                mirror_name: name.clone(),
+                bootstrap_servers: mirror.source.bootstrap_servers.clone(),
+                topic: mirror.topic.clone(),
+                partition: mirror.partition as i32,
+                commit_handle: commit_handle_for_poller,
+                cache: Arc::clone(&binding.state),
+            },
+            readiness_poll_interval_from_env(),
+            shutdown_rx.clone(),
+        );
+    } else {
+        // No cache slot => no readiness gate to drive. Drop the
+        // extra handle.
+        drop(commit_handle_for_poller);
+    }
+
     let destinations_log = dest_descriptions.join(",");
+    let notify_log = match &mirror.notify {
+        Some(n) => {
+            let targets: Vec<&str> = n.targets.iter().map(|t| t.url.as_str()).collect();
+            let trigger = match n.trigger.on {
+                mirror_config::TriggerOn::SourceConsume => "source-consume",
+                mirror_config::TriggerOn::DestinationFlush => "destination-flush",
+            };
+            format!(" notify=kkv-v1[{}] trigger={trigger}", targets.join(","))
+        }
+        None => String::new(),
+    };
+
     // Single span carries `mirror = <name>` onto every event emitted
-    // from the spawned task — including the mirror-core logs
+    // from the spawned task - including the mirror-core logs
     // (`starting mirror`, `heartbeat`, etc.) that don't otherwise have
     // access to the operator-chosen mirror name. MIRROR_LABELS still
     // carries topic+partition for metric labeling separately.
@@ -699,14 +921,38 @@ async fn spawn_mirror(
             tracing::info!(
                 destinations = %destinations_log,
                 compaction,
+                notify = %notify_log,
                 "loop start"
             );
-            let result = MIRROR_LABELS
-                .scope(
-                    labels,
-                    run_mirror(source, tee, shutdown_signal(shutdown_rx)),
-                )
-                .await;
+            let heartbeat = heartbeat_interval_from_env();
+            let shutdown = shutdown_signal(shutdown_rx);
+            // Match-on-notifier so the generic `N: Notifier`
+            // monomorphises with the right concrete type per branch
+            // without a `Box<dyn Notifier>` allocation.
+            let result = match notifier_opt {
+                Some(n) => {
+                    MIRROR_LABELS
+                        .scope(
+                            labels,
+                            run_mirror_with_notifier(source, tee, n, shutdown, heartbeat),
+                        )
+                        .await
+                }
+                None => {
+                    MIRROR_LABELS
+                        .scope(
+                            labels,
+                            run_mirror_with_notifier(
+                                source,
+                                tee,
+                                NoOpNotifier,
+                                shutdown,
+                                heartbeat,
+                            ),
+                        )
+                        .await
+                }
+            };
             match result {
                 Ok(()) => Ok(()),
                 Err(e) => Err(anyhow::anyhow!("mirror {name}: {e}")),
@@ -716,6 +962,121 @@ async fn spawn_mirror(
     ))
 }
 
+/// Construct the `KkvV1Notifier` for a mirror with
+/// `trigger.on: source-consume`. Returns `None` when the mirror has
+/// no notify block or uses a different trigger (the supervisor
+/// handles the destination-flush case via [`build_flush_dispatcher`]).
+/// Failures bubble up so the supervisor refuses to spawn a mirror
+/// whose webhook surface can't possibly work.
+///
+/// `cache` carries the shared `CacheState` and the per-mirror name
+/// used by the notifier's bootstrap_hwm suppression gate.
+/// `mirror-config` validation requires `http-access: cache-v1`
+/// whenever `notify` is set, so this binding is always present for
+/// any mirror that reaches this branch.
+fn build_source_consume_notifier(
+    mirror: &Mirror,
+    cache: Option<&mirror_core::CacheBinding>,
+) -> Result<Option<mirror_notify_kkv::KkvV1Notifier>> {
+    let Some(notify) = mirror.notify.as_ref() else {
+        return Ok(None);
+    };
+    let binding = cache.ok_or_else(|| {
+        anyhow::anyhow!(
+            "mirror {} has notify but no cache binding; validator should reject this",
+            mirror.name
+        )
+    })?;
+    // Only kkv-v1 exists today; validator rejects other api: values.
+    let notifier = mirror_notify_kkv::KkvV1Notifier::from_config(
+        notify,
+        mirror.topic.clone(),
+        mirror.partition as i32,
+        std::sync::Arc::clone(&binding.state),
+        binding.mirror_name.clone(),
+    )
+    .with_context(|| format!("building notify dispatcher for mirror {}", mirror.name))?;
+    Ok(Some(notifier))
+}
+
+/// Construct the `FlushDispatcher` for a mirror with
+/// `trigger.on: destination-flush`. Validator guarantees the mirror
+/// has notify set; this asserts on the trigger variant.
+fn build_flush_dispatcher(
+    mirror: &Mirror,
+    cache: Option<&mirror_core::CacheBinding>,
+) -> Result<mirror_notify_kkv::FlushDispatcher> {
+    let notify = mirror
+        .notify
+        .as_ref()
+        .expect("build_flush_dispatcher called with no notify block");
+    debug_assert!(matches!(
+        notify.trigger.on,
+        mirror_config::TriggerOn::DestinationFlush
+    ));
+    let binding = cache.ok_or_else(|| {
+        anyhow::anyhow!(
+            "mirror {} has notify but no cache binding; validator should reject this",
+            mirror.name
+        )
+    })?;
+    let dispatcher = mirror_notify_kkv::FlushDispatcher::from_config(
+        notify,
+        mirror.topic.clone(),
+        mirror.partition as i32,
+        std::sync::Arc::clone(&binding.state),
+        binding.mirror_name.clone(),
+    )
+    .with_context(|| {
+        format!(
+            "building notify flush dispatcher for mirror {}",
+            mirror.name
+        )
+    })?;
+    Ok(dispatcher)
+}
+
+/// In-memory sink for `destinations: []` notify-only mirrors. Holds
+/// only its own "next expected offset" and accepts any record at or
+/// above it. `allows_compacted_source = true` so the run loop's
+/// bootstrap branch can align the head to the broker's low
+/// watermark - matching the spec's "seeks to low watermark on every
+/// startup" behaviour for notify-only mirrors.
+#[derive(Debug, Default)]
+struct NotifyOnlySink {
+    position: u64,
+}
+
+#[async_trait::async_trait]
+impl Sink for NotifyOnlySink {
+    async fn next_expected_offset(&mut self) -> Result<u64, SinkError> {
+        Ok(self.position)
+    }
+
+    async fn write(&mut self, record: Record) -> Result<(), SinkError> {
+        if record.source_offset < self.position {
+            return Err(SinkError::UnexpectedPosition {
+                expected: self.position,
+                actual: record.source_offset,
+            });
+        }
+        // Accept forward gaps under compaction:log; bump position to
+        // `record.source_offset + 1`. Matches the loosened write
+        // contract in `mirror-fs` / `mirror-s3` for compacted sources.
+        self.position = record.source_offset + 1;
+        Ok(())
+    }
+
+    fn allows_compacted_source(&self) -> bool {
+        true
+    }
+
+    async fn align_to_source_low_watermark(&mut self, low_watermark: u64) -> Result<(), SinkError> {
+        self.position = low_watermark;
+        Ok(())
+    }
+}
+
 async fn open_inner_sink(
     dest: &Destination,
     mirror: &Mirror,
diff --git a/crates/mirror-bin/src/readiness_poller.rs b/crates/mirror-bin/src/readiness_poller.rs
new file mode 100644
index 0000000..dd6dc32
--- /dev/null
+++ b/crates/mirror-bin/src/readiness_poller.rs
@@ -0,0 +1,154 @@
+//! Per-mirror readiness poller.
+//!
+//! The supervisor spawns one of these per registered mirror at
+//! startup. Every `MIRROR_V3_READINESS_POLL_MS` (default 2 s) the
+//! task:
+//!
+//!   1. Fetches the source partition's high-watermark via
+//!      `mirror_kafka::fetch_high_watermark` (cheap; one
+//!      `BaseConsumer` per call) and pushes it into
+//!      `CacheState::set_broker_end_offset`. The cache's status
+//!      predicate then recomputes lag = end_offset - last_applied.
+//!   2. Reads the run loop's consumer assignment via the shared
+//!      `KafkaCommitHandle`. If `(topic, partition)` is no longer
+//!      assigned, calls `CacheState::mark_source_unassigned`; if it
+//!      reappears, calls `mark_source_assigned`.
+//!
+//! The task is best-effort: a transient fetch error logs and
+//! continues. It exits when the supervisor's shutdown signal flips.
+
+use std::sync::Arc;
+use std::time::Duration;
+
+use mirror_core::CacheState;
+use mirror_kafka::KafkaCommitHandle;
+use tokio::sync::watch;
+
+const DEFAULT_READINESS_POLL: Duration = Duration::from_secs(2);
+
+/// Read the poll interval from `MIRROR_V3_READINESS_POLL_MS`,
+/// falling back to [`DEFAULT_READINESS_POLL`]. A value of `0`
+/// disables the poller.
+pub fn readiness_poll_interval_from_env() -> Duration {
+    match std::env::var("MIRROR_V3_READINESS_POLL_MS").ok().as_deref() {
+        Some(s) => match s.parse::<u64>() {
+            Ok(ms) => Duration::from_millis(ms),
+            Err(_) => DEFAULT_READINESS_POLL,
+        },
+        None => DEFAULT_READINESS_POLL,
+    }
+}
+
+/// Read the lag tolerance from `MIRROR_V3_READINESS_LAG`, falling
+/// back to `0` (any positive lag fires `LagBehindSource`).
+pub fn readiness_lag_tolerance_from_env() -> u64 {
+    std::env::var("MIRROR_V3_READINESS_LAG")
+        .ok()
+        .as_deref()
+        .and_then(|s| s.parse().ok())
+        .unwrap_or(0)
+}
+
+pub struct PollSpec {
+    pub mirror_name: String,
+    pub bootstrap_servers: String,
+    pub topic: String,
+    pub partition: i32,
+    pub commit_handle: KafkaCommitHandle,
+    pub cache: Arc<CacheState>,
+}
+
+/// Spawn the readiness poller for one mirror. Returns the
+/// `JoinHandle`; callers can drop it (the task self-terminates when
+/// the shutdown signal flips).
+pub fn spawn_readiness_poller(
+    spec: PollSpec,
+    interval: Duration,
+    mut shutdown_rx: watch::Receiver<bool>,
+) -> tokio::task::JoinHandle<()> {
+    tokio::spawn(async move {
+        if interval.is_zero() {
+            tracing::info!(
+                mirror = %spec.mirror_name,
+                "MIRROR_V3_READINESS_POLL_MS=0; readiness poller disabled"
+            );
+            return;
+        }
+        let mut iv = tokio::time::interval(interval);
+        iv.set_missed_tick_behavior(tokio::time::MissedTickBehavior::Skip);
+        // Consume the immediate tick `tokio::time::interval` fires.
+        iv.tick().await;
+        loop {
+            tokio::select! {
+                biased;
+                _ = shutdown_rx.changed() => {
+                    if *shutdown_rx.borrow() {
+                        tracing::debug!(
+                            mirror = %spec.mirror_name,
+                            "shutdown; readiness poller exiting"
+                        );
+                        return;
+                    }
+                }
+                _ = iv.tick() => {
+                    // Step 1: source HWM
+                    let bootstrap = spec.bootstrap_servers.clone();
+                    let topic = spec.topic.clone();
+                    let partition = spec.partition;
+                    let hwm_result = tokio::task::spawn_blocking(move || {
+                        mirror_kafka::fetch_high_watermark(
+                            &bootstrap,
+                            &topic,
+                            partition,
+                            Duration::from_secs(5),
+                        )
+                    })
+                    .await;
+                    match hwm_result {
+                        Ok(Ok(hwm)) => {
+                            spec.cache
+                                .set_broker_end_offset(&spec.mirror_name, hwm.max(0) as u64);
+                        }
+                        Ok(Err(e)) => {
+                            tracing::warn!(
+                                mirror = %spec.mirror_name,
+                                error = %e,
+                                "readiness poller: fetch_high_watermark failed; will retry"
+                            );
+                        }
+                        Err(e) => {
+                            tracing::warn!(
+                                mirror = %spec.mirror_name,
+                                error = %e,
+                                "readiness poller: hwm join failed"
+                            );
+                        }
+                    }
+
+                    // Step 2: assignment check
+                    match spec.commit_handle.current_assignment_includes() {
+                        Ok(true) => {
+                            spec.cache.mark_source_assigned(&spec.mirror_name);
+                        }
+                        Ok(false) => {
+                            tracing::warn!(
+                                mirror = %spec.mirror_name,
+                                topic = %spec.topic,
+                                partition = spec.partition,
+                                "readiness poller: source partition is no longer assigned"
+                            );
+                            spec.cache.mark_source_unassigned(&spec.mirror_name);
+                        }
+                        Err(e) => {
+                            tracing::warn!(
+                                mirror = %spec.mirror_name,
+                                error = %e,
+                                "readiness poller: assignment check failed"
+                            );
+                        }
+                    }
+                }
+            }
+        }
+    })
+}
diff --git a/crates/mirror-cache/src/lib.rs b/crates/mirror-cache/src/lib.rs
index a5f5711..6464a9b 100644
--- a/crates/mirror-cache/src/lib.rs
+++ b/crates/mirror-cache/src/lib.rs
@@ -1,21 +1,39 @@
 //! HTTP surface for mirror-v3's KKV-compatibility mode.
 //!
-//! Hosts a drop-in replacement for the `GET /cache/v1/{raw,offset,keys,values}`
-//! endpoints from [Yolean/kafka-keyvalue](https://github.com/Yolean/kafka-keyvalue).
-//! Reads come from the shared [`CacheState`] owned by `mirror-core`;
-//! the sinks (mirror-fs / mirror-s3) populate it per-record from the
-//! consume loop, so freshness is independent of bucket-write cadence.
+//! Two route trees serve the kkv-shaped read surface:
+//!
+//! - `/cache/v1/{mirror}/...` is always mounted; one entry per
+//!   `http-access.cache-v1` opt-in mirror. Each path dispatches to
+//!   that mirror's own per-mirror view and gates on its per-mirror
+//!   [`MirrorStatus`]: 503 (with a [`MirrorReadiness`] JSON body
+//!   naming the unhealthy state) whenever the mirror is not
+//!   `Ready`.
+//! - `/cache/v1/...` (unprefixed) is mounted iff some mirror opted
+//!   into `http-access.cache-v1-main`; the validator enforces
+//!   at-most-one and `[`CacheState::main_mirror`] tracks which one.
+//!   It is a thin alias onto that singleton mirror's per-mirror
+//!   routes — a migration aid for consumers that haven't picked up
+//!   the per-mirror paths yet.
 //!
 //! The server also exposes:
 //!
-//! - `POST /_admin/v1/shutdown` and `POST /_admin/v1/shutdown/{exitcode}` — operator hooks.
-//! - `GET /openapi.json` and `GET /openapi.yaml` — auto-generated OpenAPI 3.1 spec.
-//! - `GET /docs` — Scalar UI rendering the spec.
+//! - `GET /q/health/ready`: drop-in compat alias for the legacy
+//!   Quarkus kkv health endpoint. Returns `200 OK` when every
+//!   registered mirror is `Ready`, `503 Service Unavailable`
+//!   otherwise. Body is a [`ReadinessReport`] in both cases — the
+//!   `@yolean/kafka-keyvalue` Node client inspects only the status
+//!   code, so the JSON body is transparent to it but greppable by
+//!   on-call.
+//! - `POST /_admin/v1/shutdown` and `POST /_admin/v1/shutdown/{exitcode}`: operator hooks.
+//! - `GET /openapi.json` and `GET /openapi.yaml`: auto-generated OpenAPI 3.1 spec.
+//! - `GET /docs`: Scalar UI rendering the spec.
 //!
-//! Readiness: every endpoint under `/cache/v1` returns `503 Service
-//! Unavailable` until `CacheState::is_ready()` flips to `true`
-//! (every registered mirror has caught up to its bootstrap
-//! high-watermark). The flag is sticky — once ready, always ready.
+//! Readiness: every `/cache/v1` route gates on its target mirror's
+//! [`MirrorStatus`]. The aggregate `is_ready()` (every registered
+//! mirror in `Ready`) backs `/q/health/ready`. Status is non-sticky:
+//! a mirror that drops out of `Ready` (lag, source assignment loss,
+//! gating destination falls behind) flips both the per-mirror cache
+//! routes and the aggregate health endpoint back to 503.
 
 use std::net::SocketAddr;
 use std::sync::Arc;
@@ -24,9 +42,10 @@ use axum::{
     extract::{Path, State},
     http::{HeaderMap, HeaderValue, StatusCode},
     response::{IntoResponse, Response},
+    Json,
 };
 use mirror_core::cache::TopicPartitionOffset;
-use mirror_core::CacheState;
+use mirror_core::{CacheState, MirrorStatus, MirrorStatusSnapshot};
 use serde::Serialize;
 use tokio::sync::oneshot;
 use utoipa::OpenApi;
@@ -59,6 +78,156 @@ impl From<&TopicPartitionOffset> for TopicPartitionOffsetJson {
     }
 }
 
+/// Aggregate readiness state for the process. The discriminator
+/// string lets a grep-friendly consumer distinguish "warming up but
+/// expected to clear shortly" (a cold start) from "something is
+/// wrong" (a mirror went degraded after first reaching Ready).
+#[derive(Debug, Clone, Serialize, PartialEq, Eq, utoipa::ToSchema)]
+#[serde(rename_all = "lowercase")]
+pub enum AggregateReadiness {
+    /// Every registered mirror is `Ready`. HTTP status 200.
+    Ready,
+    /// At least one mirror is `Warming` and no mirror is in any
+    /// non-warming non-ready state. HTTP status 503.
+    Warming,
+    /// At least one mirror is in a non-warming non-ready state
+    /// (lag, source unassigned, destination lagging). HTTP status 503.
+    Degraded,
+}
+
+/// One mirror's slice of the readiness response. Returned both as
+/// an element of [`ReadinessReport::mirrors`] and as the standalone
+/// body of the per-mirror `/cache/v1/{mirror}/...` 503 response so a
+/// client library can surface the reason without a second request.
+#[derive(Debug, Clone, Serialize, PartialEq, Eq, utoipa::ToSchema)]
+pub struct MirrorReadiness {
+    pub name: String,
+    /// String discriminator for the status, easy to grep:
+    /// `ready` | `warming` | `lag_behind_source` | `source_unassigned`
+    /// | `destination_lagging`.
+    pub status: &'static str,
+    /// Source-side detail: topic, partition, assignment, offsets.
+    pub source: MirrorReadinessSource,
+    /// Status-specific detail: the lagging destination's name + lag
+    /// (when `status == "destination_lagging"`), or the source lag
+    /// (when `status == "lag_behind_source"`). `None` otherwise.
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub destination: Option<MirrorReadinessDestination>,
+}
+
+#[derive(Debug, Clone, Serialize, PartialEq, Eq, utoipa::ToSchema)]
+pub struct MirrorReadinessSource {
+    pub topic: String,
+    pub partition: u32,
+    pub assigned: bool,
+    pub end_offset: u64,
+    pub last_applied_offset: u64,
+    /// `end_offset - last_applied_offset`, saturating at 0 so a
+    /// late-arriving high-watermark fetch can't underflow.
+    pub lag: u64,
+}
+
+#[derive(Debug, Clone, Serialize, PartialEq, Eq, utoipa::ToSchema)]
+pub struct MirrorReadinessDestination {
+    pub name: String,
+    pub lag: u64,
+}
+
+/// Full body of the readiness endpoint. Always serialised; the
+/// HTTP status code (200 vs 503) is determined by `ready`.
+#[derive(Debug, Clone, Serialize, PartialEq, Eq, utoipa::ToSchema)]
+pub struct ReadinessReport {
+    pub ready: AggregateReadiness,
+    pub mirrors: Vec<MirrorReadiness>,
+    /// Grep-friendly list of mirror names whose status is not
+    /// `ready`. Empty when `ready == "ready"`.
+    pub unhealthy: Vec<String>,
+}
+
+impl MirrorReadiness {
+    fn from_snapshot(snap: MirrorStatusSnapshot) -> Self {
+        let (status, destination) = match &snap.status {
+            MirrorStatus::Ready => ("ready", None),
+            MirrorStatus::Warming => ("warming", None),
+            MirrorStatus::LagBehindSource { .. } => ("lag_behind_source", None),
+            MirrorStatus::SourceUnassigned { .. } => ("source_unassigned", None),
+            MirrorStatus::DestinationLagging { name, lag } => (
+                "destination_lagging",
+                Some(MirrorReadinessDestination {
+                    name: name.clone(),
+                    lag: *lag,
+                }),
+            ),
+        };
+        let lag = snap
+            .broker_end_offset
+            .saturating_sub(snap.last_applied_offset);
+        Self {
+            name: snap.name,
+            status,
+            source: MirrorReadinessSource {
+                topic: snap.topic,
+                partition: snap.partition,
+                assigned: snap.source_assigned,
+                end_offset: snap.broker_end_offset,
+                last_applied_offset: snap.last_applied_offset,
+                lag,
+            },
+            destination,
+        }
+    }
+}
+
+/// Build the structured readiness report from a `CacheState`
+/// snapshot. The report and the HTTP status code (200 iff every
+/// mirror is `Ready`) are computed together so they cannot drift.
+pub fn build_readiness_report(cache: &CacheState) -> (StatusCode, ReadinessReport) {
+    let mut snaps = cache.status_snapshot();
+    snaps.sort_by(|a, b| a.name.cmp(&b.name));
+    let mut mirrors = Vec::with_capacity(snaps.len());
+    let mut unhealthy = Vec::new();
+    let mut all_ready = !snaps.is_empty();
+    let mut any_warming = false;
+    let mut any_degraded = false;
+    for snap in snaps {
+        let entry = MirrorReadiness::from_snapshot(snap);
+        if entry.status != "ready" {
+            all_ready = false;
+            unhealthy.push(entry.name.clone());
+            if entry.status == "warming" {
+                any_warming = true;
+            } else {
+                any_degraded = true;
+            }
+        }
+        mirrors.push(entry);
+    }
+    let ready = if all_ready {
+        AggregateReadiness::Ready
+    } else if any_degraded {
+        AggregateReadiness::Degraded
+    } else if any_warming {
+        AggregateReadiness::Warming
+    } else {
+        // No registered mirrors: treat as warming, since the
+        // process is up but has nothing to be ready for yet.
+        AggregateReadiness::Warming
+    };
+    let code = if matches!(ready, AggregateReadiness::Ready) {
+        StatusCode::OK
+    } else {
+        StatusCode::SERVICE_UNAVAILABLE
+    };
+    (
+        code,
+        ReadinessReport {
+            ready,
+            mirrors,
+            unhealthy,
+        },
+    )
+}
+
 /// Server-side state shared across handlers.
 #[derive(Clone)]
 struct AppState {
@@ -70,6 +239,10 @@ struct AppState {
 /// metadata attached. Shared between [`build_router`] (live serving)
 /// and [`openapi_doc`] (spec generation) so the wire surface and the
 /// committed spec can't drift.
+///
+/// Only the per-mirror routes are committed to the spec; the
+/// unprefixed `cache-v1-main` aliases are runtime-conditional and
+/// described in the per-mirror operation's description instead.
 fn open_api_router(state: AppState) -> OpenApiRouter {
     OpenApiRouter::with_openapi(ApiDoc::openapi())
         .routes(routes!(raw_by_key))
@@ -95,21 +268,29 @@ pub fn openapi_doc() -> utoipa::openapi::OpenApi {
 }
 
 /// Build the full router for the cache HTTP server, including
-/// `/cache/v1`, `/_admin/v1`, the OpenAPI spec endpoints, and the
-/// Scalar `/docs` UI. The returned router is ready to serve.
+/// per-mirror `/cache/v1/{mirror}/...` routes, the unprefixed
+/// `/cache/v1/...` `cache-v1-main` alias (when set),
+/// `/_admin/v1`, the OpenAPI spec endpoints, and the Scalar `/docs`
+/// UI. The returned router is ready to serve.
 ///
 /// `shutdown_tx` is consumed by `POST /_admin/v1/shutdown[/{exitcode}]`
 /// to signal the supervisor that a clean exit is requested.
 pub fn build_router(cache: Arc<CacheState>, shutdown_tx: oneshot::Sender<i32>) -> axum::Router {
+    // Hold extra clones for closures registered after the main
+    // `state.cache` is moved into the OpenAPI router via
+    // `open_api_router(state)`.
+    let cache_for_ready = Arc::clone(&cache);
+    let main_mirror = cache.main_mirror();
     let state = AppState {
         cache,
         shutdown_tx: Arc::new(tokio::sync::Mutex::new(Some(shutdown_tx))),
     };
+    let main_state = state.clone();
     let (api_router, api) = open_api_router(state).split_for_parts();
 
     let openapi_json = api.clone();
     let openapi_yaml = api.clone();
-    api_router
+    let mut router = api_router
         .route(
             "/openapi.json",
             axum::routing::get(move || async move { axum::Json(openapi_json).into_response() }),
@@ -126,7 +307,95 @@ pub fn build_router(cache: Arc<CacheState>, shutdown_tx: oneshot::Sender<i32>) -
                     .into_response()
             }),
         )
-        .merge(axum::Router::from(Scalar::with_url("/docs", api)))
+        // Drop-in for the Yolean/kafka-keyvalue Quarkus binary's
+        // `/q/health/ready` SmallRye-Health endpoint. The Node
+        // `@yolean/kafka-keyvalue` client's `onReady()` only inspects
+        // the HTTP status code, so a structured JSON body is
+        // transparent to it. The body names the unhealthy mirror(s)
+        // for on-call grep: see [`ReadinessReport`].
+        //
+        // Kept off the OpenAPI spec because the route is a compat
+        // shim; the JSON shape is described by the
+        // `ReadinessReport` `ToSchema` impl exposed in the spec via
+        // its component reference under `/openapi.json`.
+        .route(
+            "/q/health/ready",
+            axum::routing::get(move || {
+                let cache = Arc::clone(&cache_for_ready);
+                async move {
+                    let (code, body) = build_readiness_report(&cache);
+                    (code, Json(body)).into_response()
+                }
+            }),
+        );
+
+    // `cache-v1-main` mounts the unprefixed `/cache/v1/...` paths
+    // onto the named mirror's view; without it, the unprefixed
+    // paths are not served at all (consumers must use the
+    // per-mirror `/cache/v1/{mirror}/...` paths). The handlers reuse
+    // the per-mirror code paths with the resolved name; kept off
+    // the OpenAPI spec because the route set is config-conditional.
+    if let Some(name) = main_mirror {
+        router = router
+            .route(
+                "/cache/v1/raw/{key}",
+                axum::routing::get({
+                    let name = name.clone();
+                    let state = main_state.clone();
+                    move |Path(key): Path<String>| {
+                        let name = name.clone();
+                        let state = state.clone();
+                        async move { raw_by_key(State(state), Path((name, key))).await }
+                    }
+                }),
+            )
+            .route(
+                "/cache/v1/offset/{topic}/{partition}",
+                axum::routing::get({
+                    let name = name.clone();
+                    let state = main_state.clone();
+                    move |Path((topic, partition)): Path<(String, u32)>| {
+                        let name = name.clone();
+                        let state = state.clone();
+                        async move {
+                            offset_for_partition(State(state), Path((name, topic, partition))).await
+                        }
+                    }
+                }),
+            )
+            .route(
+                "/cache/v1/keys",
+                axum::routing::get({
+                    let name = name.clone();
+                    let state = main_state.clone();
+                    move || {
+                        let name = name.clone();
+                        let state = state.clone();
+                        async move { keys(State(state), Path(name)).await }
+                    }
+                }),
+            )
+            .route(
+                "/cache/v1/values",
+                axum::routing::get({
+                    let name = name.clone();
+                    let state = main_state.clone();
+                    move || {
+                        let name = name.clone();
+                        let state = state.clone();
+                        async move { values(State(state), Path(name)).await }
+                    }
+                }),
+            );
+    } else {
+        // No main mirror: the `main_state` clone exists only because
+        // the compiler captures both branches into the same scope.
+        // Drop it explicitly so clippy doesn't warn about an unused
+        // binding in the no-main path.
+        drop(main_state);
+    }
+
+    router.merge(axum::Router::from(Scalar::with_url("/docs", api)))
 }
 
 /// Spawn the HTTP server on `addr` and run until the supervisor
@@ -175,21 +444,33 @@ pub enum ServeError {
 
 /// Aggregate OpenAPI 3.1 document. Endpoints are registered through
 /// `OpenApiRouter::routes!(...)` so the spec stays in lock-step with
-/// the actual handler set — adding or removing a route here without
+/// the actual handler set; adding or removing a route here without
 /// updating the router (or vice versa) is impossible.
 #[derive(OpenApi)]
 #[openapi(
     info(
         title = "mirror-v3 cache",
         description = "Drop-in HTTP surface for Yolean/kafka-keyvalue's /cache/v1. \
-                       The state is a merged in-memory `key → latest-value` view \
-                       across every mirror with `http-access: { api: cache-v1 }`. \
-                       Updates are per-record from the consume loop; reads return \
-                       503 until every registered mirror has caught up to its \
+                       Each opt-in mirror (`http-access.cache-v1`) owns its own \
+                       in-memory `key → latest-value` view, exposed under \
+                       `/cache/v1/{mirror}/...`. A single mirror may additionally \
+                       opt into `cache-v1-main`, which mounts the unprefixed \
+                       `/cache/v1/...` paths onto its view as a migration alias \
+                       for legacy kkv consumers; these unprefixed routes are \
+                       config-conditional and intentionally omitted from this \
+                       spec. Updates are per-record from the consume loop; reads \
+                       return 503 until the target mirror has caught up to its \
                        startup high-watermark.",
         version = "1.0.0",
     ),
-    components(schemas(TopicPartitionOffsetJson)),
+    components(schemas(
+        TopicPartitionOffsetJson,
+        AggregateReadiness,
+        MirrorReadiness,
+        MirrorReadinessSource,
+        MirrorReadinessDestination,
+        ReadinessReport,
+    )),
     tags(
         (name = "cache", description = "Read-only cache API (KKV-compatible)"),
         (name = "admin", description = "Operator endpoints"),
@@ -197,21 +478,43 @@ pub enum ServeError {
 )]
 struct ApiDoc;
 
-// Allowed locally: the `Err` payload IS the response — boxing it
-// would force every readiness-gated handler to deref before
-// returning, with zero observable benefit.
+/// Decide which mirror a `/cache/v1/{mirror}/...` request hits and
+/// gate on its per-mirror readiness state. Returns `Ok(())` for the
+/// handler to proceed, or an already-built response for the failure
+/// cases:
+///
+/// - 404 if the named mirror is not registered;
+/// - 503 with the matching [`MirrorReadiness`] JSON body if the
+///   mirror is registered but is not currently [`MirrorStatus::Ready`].
+///   Same shape as the corresponding element in
+///   `/q/health/ready`'s `mirrors` array, so a client library can
+///   surface the reason without a second request.
+///
+/// Allowed locally: the `Err` payload IS the response; boxing it
+/// would force every readiness-gated handler to deref before
+/// returning, with zero observable benefit.
 #[allow(clippy::result_large_err)]
-fn ready_or_503(state: &AppState) -> Result<(), Response> {
-    if state.cache.is_ready() {
-        Ok(())
-    } else {
-        Err(StatusCode::SERVICE_UNAVAILABLE.into_response())
+fn resolve_mirror(state: &AppState, mirror: &str) -> Result<(), Response> {
+    let Some(snap) = state
+        .cache
+        .status_snapshot()
+        .into_iter()
+        .find(|s| s.name == mirror)
+    else {
+        return Err(StatusCode::NOT_FOUND.into_response());
+    };
+    if matches!(snap.status, MirrorStatus::Ready) {
+        return Ok(());
     }
+    let body = MirrorReadiness::from_snapshot(snap);
+    Err((StatusCode::SERVICE_UNAVAILABLE, Json(body)).into_response())
 }
 
-fn offsets_header(state: &AppState) -> HeaderMap {
+fn offsets_header_for(state: &AppState, mirror: &str) -> HeaderMap {
     let mut headers = HeaderMap::new();
-    let offsets = state.cache.snapshot_offsets();
+    let Some(offsets) = state.cache.snapshot_offsets_for(mirror) else {
+        return headers;
+    };
     let payload: Vec<TopicPartitionOffsetJson> =
         offsets.iter().map(TopicPartitionOffsetJson::from).collect();
     if let Ok(value) = serde_json::to_string(&payload) {
@@ -222,32 +525,40 @@ fn offsets_header(state: &AppState) -> HeaderMap {
     headers
 }
 
-/// GET /cache/v1/raw/{key} — fetch a value by key.
+/// GET /cache/v1/{mirror}/raw/{key}; fetch a value by key from the
+/// named mirror's view. The unprefixed `/cache/v1/raw/{key}` alias
+/// is mounted by `build_router` when one mirror opted into
+/// `http-access.cache-v1-main`, and dispatches here with that
+/// mirror's name.
 #[utoipa::path(
     get,
-    path = "/cache/v1/raw/{key}",
+    path = "/cache/v1/{mirror}/raw/{key}",
     tag = "cache",
     params(
+        ("mirror" = String, Path, description = "Name of the `http-access.cache-v1` mirror to read from"),
         ("key" = String, Path, description = "URL-encoded key (UTF-8 string)")
     ),
     responses(
         (status = 200, description = "Value bytes for the requested key", body = Vec<u8>, content_type = "application/octet-stream"),
         (status = 400, description = "Empty or invalid key"),
-        (status = 404, description = "Key not in cache"),
-        (status = 503, description = "Cache is not yet caught up to the source"),
+        (status = 404, description = "Mirror unknown, or key not in cache"),
+        (status = 503, description = "Mirror is not currently Ready; body is a MirrorReadiness object", body = MirrorReadiness),
     ),
 )]
-async fn raw_by_key(State(state): State<AppState>, Path(key): Path<String>) -> Response {
-    if let Err(r) = ready_or_503(&state) {
+async fn raw_by_key(
+    State(state): State<AppState>,
+    Path((mirror, key)): Path<(String, String)>,
+) -> Response {
+    if let Err(r) = resolve_mirror(&state, &mirror) {
         return r;
     }
     if key.is_empty() {
         return StatusCode::BAD_REQUEST.into_response();
     }
-    match state.cache.get_value(&key) {
+    match state.cache.get_value_for(&mirror, &key) {
         None => StatusCode::NOT_FOUND.into_response(),
         Some(bytes) => {
-            let mut headers = offsets_header(&state);
+            let mut headers = offsets_header_for(&state, &mirror);
             headers.insert(
                 axum::http::header::CONTENT_TYPE,
                 HeaderValue::from_static("application/octet-stream"),
@@ -257,30 +568,36 @@ async fn raw_by_key(State(state): State<AppState>, Path(key): Path<String>) -> R
     }
 }
 
-/// GET /cache/v1/offset/{topic}/{partition} — last-seen offset.
+/// GET /cache/v1/{mirror}/offset/{topic}/{partition}; last-seen
+/// offset for that (topic, partition) within the named mirror.
 #[utoipa::path(
     get,
-    path = "/cache/v1/offset/{topic}/{partition}",
+    path = "/cache/v1/{mirror}/offset/{topic}/{partition}",
     tag = "cache",
     params(
+        ("mirror" = String, Path, description = "Name of the `http-access.cache-v1` mirror to read from"),
         ("topic" = String, Path, description = "Source topic name"),
         ("partition" = u32, Path, description = "Source partition"),
     ),
     responses(
-        (status = 200, description = "Decimal offset of the last applied record, or empty if none yet", body = String, content_type = "text/plain"),
+        (status = 200, description = "Decimal offset of the last applied record on this mirror, or empty if none yet", body = String, content_type = "text/plain"),
         (status = 400, description = "Empty topic"),
+        (status = 404, description = "Mirror unknown"),
     ),
 )]
 async fn offset_for_partition(
     State(state): State<AppState>,
-    Path((topic, partition)): Path<(String, u32)>,
+    Path((mirror, topic, partition)): Path<(String, String, u32)>,
 ) -> Response {
+    if state.cache.snapshot_keys_for(&mirror).is_none() {
+        return StatusCode::NOT_FOUND.into_response();
+    }
     if topic.is_empty() {
         return StatusCode::BAD_REQUEST.into_response();
     }
     let body = state
         .cache
-        .get_offset(&topic, partition)
+        .get_offset_for(&mirror, &topic, partition)
         .map(|o| o.to_string())
         .unwrap_or_default();
     (
@@ -294,33 +611,39 @@ async fn offset_for_partition(
         .into_response()
 }
 
-/// GET /cache/v1/keys — newline-separated key list, every line
-/// (including the last) terminated by `\n`. Order is the order each
-/// key was first seen by the cache (insertion order).
+/// GET /cache/v1/{mirror}/keys; newline-separated key list for the
+/// named mirror's view. Every line (including the last) is
+/// terminated by `\n`. Order is insertion order (the position a key
+/// gets the *first* time the mirror sees it).
 ///
 /// `Content-Type` is `application/octet-stream` to match KKV's
-/// byte-for-byte response shape. A possible future enhancement (gated
-/// on operator demand) is to surface the topic schema in the content
-/// type — see the `values` handler for the same hook.
+/// byte-for-byte response shape.
 #[utoipa::path(
     get,
-    path = "/cache/v1/keys",
+    path = "/cache/v1/{mirror}/keys",
     tag = "cache",
+    params(
+        ("mirror" = String, Path, description = "Name of the `http-access.cache-v1` mirror to read from"),
+    ),
     responses(
         (status = 200, description = "Newline-separated keys (UTF-8, trailing newline included)", body = Vec<u8>, content_type = "application/octet-stream"),
-        (status = 503, description = "Cache is not yet caught up to the source"),
+        (status = 404, description = "Mirror unknown"),
+        (status = 503, description = "Mirror is not currently Ready; body is a MirrorReadiness object", body = MirrorReadiness),
     ),
 )]
-async fn keys(State(state): State<AppState>) -> Response {
-    if let Err(r) = ready_or_503(&state) {
+async fn keys(State(state): State<AppState>, Path(mirror): Path<String>) -> Response {
+    if let Err(r) = resolve_mirror(&state, &mirror) {
         return r;
     }
+    let Some(snapshot) = state.cache.snapshot_keys_for(&mirror) else {
+        return StatusCode::NOT_FOUND.into_response();
+    };
     let mut body = Vec::new();
-    for k in state.cache.snapshot_keys() {
+    for k in snapshot {
         body.extend_from_slice(k.as_bytes());
         body.push(b'\n');
     }
-    let mut headers = offsets_header(&state);
+    let mut headers = offsets_header_for(&state, &mirror);
     headers.insert(
         axum::http::header::CONTENT_TYPE,
         HeaderValue::from_static("application/octet-stream"),
@@ -328,45 +651,37 @@ async fn keys(State(state): State<AppState>) -> Response {
     (StatusCode::OK, headers, body).into_response()
 }
 
-/// GET /cache/v1/values — newline-separated values (raw bytes).
-/// Order matches `/cache/v1/keys`. Every line — including the last —
-/// is terminated by `\n`. Binary-safe **only** when none of the values
-/// contain a `0x0A` byte; binary topics should pin
-/// `values: { type: bytes-base64 }` so the cache returns the
+/// GET /cache/v1/{mirror}/values; newline-separated values for the
+/// named mirror's view, in `keys` order. Binary-safe **only** when
+/// none of the values contain a `0x0A` byte; binary topics should
+/// pin `values: { type: bytes-base64 }` so the cache returns the
 /// base64-encoded form here.
-///
-/// `Content-Type` is `text/plain; charset=utf-8` regardless of the
-/// configured value type. Future work — gated on operator demand —
-/// is to adapt the response content type to the topic schema:
-///
-/// | `values.type`        | proposed `Content-Type`            |
-/// | -------------------- | ---------------------------------- |
-/// | `bytes-base64`       | `application/octet-stream`         |
-/// | `utf8`               | `text/plain; charset=utf-8`        |
-/// | `json` / `json-parseable` | `application/x-ndjson`        |
-///
-/// Not implemented today to keep parity with KKV's
-/// `text/plain;charset=UTF-8` (mirror-v3 emits the RFC-normalised
-/// equivalent).
 #[utoipa::path(
     get,
-    path = "/cache/v1/values",
+    path = "/cache/v1/{mirror}/values",
     tag = "cache",
+    params(
+        ("mirror" = String, Path, description = "Name of the `http-access.cache-v1` mirror to read from"),
+    ),
     responses(
         (status = 200, description = "Newline-separated raw values with trailing newline; binary-safe iff no value contains 0x0A", body = Vec<u8>, content_type = "text/plain"),
-        (status = 503, description = "Cache is not yet caught up to the source"),
+        (status = 404, description = "Mirror unknown"),
+        (status = 503, description = "Mirror is not currently Ready; body is a MirrorReadiness object", body = MirrorReadiness),
     ),
 )]
-async fn values(State(state): State<AppState>) -> Response {
-    if let Err(r) = ready_or_503(&state) {
+async fn values(State(state): State<AppState>, Path(mirror): Path<String>) -> Response {
+    if let Err(r) = resolve_mirror(&state, &mirror) {
         return r;
     }
+    let Some(snapshot) = state.cache.snapshot_values_for(&mirror) else {
+        return StatusCode::NOT_FOUND.into_response();
+    };
     let mut body = Vec::new();
-    for v in state.cache.snapshot_values() {
+    for v in snapshot {
         body.extend_from_slice(&v);
         body.push(b'\n');
     }
-    let mut headers = offsets_header(&state);
+    let mut headers = offsets_header_for(&state, &mirror);
     headers.insert(
         axum::http::header::CONTENT_TYPE,
         HeaderValue::from_static("text/plain; charset=utf-8"),
@@ -374,7 +689,7 @@ async fn values(State(state): State<AppState>) -> Response {
     (StatusCode::OK, headers, body).into_response()
 }
 
-/// POST /_admin/v1/shutdown — request graceful exit.
+/// POST /_admin/v1/shutdown; request graceful exit.
 #[utoipa::path(
     post,
     path = "/_admin/v1/shutdown",
@@ -388,7 +703,7 @@ async fn admin_shutdown(State(state): State<AppState>) -> Response {
     StatusCode::ACCEPTED.into_response()
 }
 
-/// POST /_admin/v1/shutdown/{exitcode} — request graceful exit with a specific code.
+/// POST /_admin/v1/shutdown/{exitcode}; request graceful exit with a specific code.
 #[utoipa::path(
     post,
     path = "/_admin/v1/shutdown/{exitcode}",
diff --git a/crates/mirror-cache/tests/handlers.rs b/crates/mirror-cache/tests/handlers.rs
index a71afbb..62ae42b 100644
--- a/crates/mirror-cache/tests/handlers.rs
+++ b/crates/mirror-cache/tests/handlers.rs
@@ -40,7 +40,7 @@ async fn body_bytes(resp: axum::http::Response<Body>) -> Vec<u8> {
 #[tokio::test]
 async fn raw_returns_503_until_caught_up() {
     let cache = Arc::new(CacheState::new());
-    cache.register_mirror("ops", 2); // needs offsets 0..=1
+    cache.register_mirror("ops", 2, None, true); // needs offsets 0..=1; main mirror
     let app = router_with(Arc::clone(&cache));
     let resp = app
         .clone()
@@ -71,7 +71,7 @@ async fn raw_returns_503_until_caught_up() {
 #[tokio::test]
 async fn raw_404_for_missing_key() {
     let cache = Arc::new(CacheState::new());
-    cache.register_mirror("m", 0); // empty topic → immediately ready
+    cache.register_mirror("m", 0, None, true); // empty topic → immediately ready
     let app = router_with(Arc::clone(&cache));
     let resp = app
         .oneshot(
@@ -87,7 +87,7 @@ async fn raw_404_for_missing_key() {
 #[tokio::test]
 async fn tombstone_makes_key_404() {
     let cache = Arc::new(CacheState::new());
-    cache.register_mirror("m", 2);
+    cache.register_mirror("m", 2, None, true);
     cache.apply_record("m", &rec("t", 0, 0, "alice", Some(br#"{"v":1}"#)));
     cache.apply_record("m", &rec("t", 0, 1, "alice", None)); // tombstone
     let app = router_with(Arc::clone(&cache));
@@ -105,7 +105,7 @@ async fn tombstone_makes_key_404() {
 #[tokio::test]
 async fn keys_and_values_are_newline_terminated_in_insertion_order() {
     let cache = Arc::new(CacheState::new());
-    cache.register_mirror("m", 0);
+    cache.register_mirror("m", 0, None, true);
     cache.apply_record("m", &rec("t", 0, 0, "b", Some(b"vb")));
     cache.apply_record("m", &rec("t", 0, 1, "a", Some(b"va")));
     cache.apply_record("m", &rec("t", 0, 2, "c", Some(b"vc")));
@@ -147,7 +147,7 @@ async fn keys_and_values_are_newline_terminated_in_insertion_order() {
 #[tokio::test]
 async fn offset_endpoint_returns_decimal_or_empty() {
     let cache = Arc::new(CacheState::new());
-    cache.register_mirror("m", 0);
+    cache.register_mirror("m", 0, None, true);
     cache.apply_record("m", &rec("orders", 1, 7, "k", Some(b"v")));
     let app = router_with(Arc::clone(&cache));
 
@@ -181,7 +181,7 @@ async fn offset_endpoint_returns_decimal_or_empty() {
 #[tokio::test]
 async fn openapi_json_and_yaml_are_served() {
     let cache = Arc::new(CacheState::new());
-    cache.register_mirror("m", 0);
+    cache.register_mirror("m", 0, None, true);
     let app = router_with(Arc::clone(&cache));
 
     let resp = app
@@ -193,7 +193,11 @@ async fn openapi_json_and_yaml_are_served() {
     let body = String::from_utf8(body_bytes(resp).await).unwrap();
     let parsed: serde_json::Value = serde_json::from_str(&body).expect("OpenAPI JSON must parse");
     assert_eq!(parsed["openapi"], "3.1.0");
-    assert!(parsed["paths"]["/cache/v1/raw/{key}"].is_object());
+    assert!(parsed["paths"]["/cache/v1/{mirror}/raw/{key}"].is_object());
+    assert!(
+        parsed["paths"]["/cache/v1/raw/{key}"].is_null(),
+        "unprefixed cache-v1-main aliases must stay off the static spec"
+    );
 
     let resp = app
         .oneshot(Request::get("/openapi.yaml").body(Body::empty()).unwrap())
@@ -202,15 +206,15 @@ async fn openapi_json_and_yaml_are_served() {
     assert_eq!(resp.status(), StatusCode::OK);
     let body = String::from_utf8(body_bytes(resp).await).unwrap();
     assert!(
-        body.contains("/cache/v1/raw/{key}"),
-        "yaml must include the cache route: {body}"
+        body.contains("/cache/v1/{mirror}/raw/{key}"),
+        "yaml must include the per-mirror cache route: {body}"
     );
 }
 
 #[tokio::test]
 async fn offsets_header_contents_match_snapshot() {
     let cache = Arc::new(CacheState::new());
-    cache.register_mirror("m", 0);
+    cache.register_mirror("m", 0, None, true);
     cache.apply_record("m", &rec("orders", 0, 5, "k", Some(b"v")));
     cache.apply_record("m", &rec("orders", 1, 3, "k2", Some(b"v")));
     let app = router_with(Arc::clone(&cache));
@@ -233,3 +237,263 @@ async fn offsets_header_contents_match_snapshot() {
     assert_eq!(parsed[1]["partition"], 1);
     assert_eq!(parsed[1]["offset"], 3);
 }
+
+#[tokio::test]
+async fn q_health_ready_returns_503_until_caught_up_then_200() {
+    // Drop-in for the Yolean/kafka-keyvalue Quarkus binary's
+    // `/q/health/ready` SmallRye-Health endpoint. The
+    // `@yolean/kafka-keyvalue` Node client's `onReady()` polls it
+    // every 3 s; consumer pods that don't see a `200` never become
+    // Ready themselves. Same readiness gate as `/cache/v1`.
+    let cache = Arc::new(CacheState::new());
+    cache.register_mirror_with_topic("userstate", 2, None, true, "userstate", 0);
+    let app = router_with(Arc::clone(&cache));
+
+    let resp = app
+        .clone()
+        .oneshot(Request::get("/q/health/ready").body(Body::empty()).unwrap())
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::SERVICE_UNAVAILABLE);
+    let body: serde_json::Value =
+        serde_json::from_slice(&body_bytes(resp).await).expect("body must be JSON");
+    assert_eq!(body["ready"], "warming");
+    assert_eq!(body["mirrors"][0]["name"], "userstate");
+    assert_eq!(body["mirrors"][0]["status"], "warming");
+    assert_eq!(body["mirrors"][0]["source"]["topic"], "userstate");
+    assert_eq!(body["unhealthy"], serde_json::json!(["userstate"]));
+
+    cache.apply_record("userstate", &rec("userstate", 0, 0, "k0", Some(b"v0")));
+    cache.apply_record("userstate", &rec("userstate", 0, 1, "k1", Some(b"v1")));
+
+    let resp = app
+        .oneshot(Request::get("/q/health/ready").body(Body::empty()).unwrap())
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::OK);
+    let body: serde_json::Value =
+        serde_json::from_slice(&body_bytes(resp).await).expect("body must be JSON");
+    assert_eq!(body["ready"], "ready");
+    assert_eq!(body["mirrors"][0]["status"], "ready");
+    assert_eq!(body["unhealthy"], serde_json::json!([]));
+}
+
+#[tokio::test]
+async fn q_health_ready_body_distinguishes_warming_from_degraded() {
+    // Aggregate discriminator: only Warming when every unhealthy
+    // mirror is still warming up; flips to Degraded once at least one
+    // is in a post-warming non-ready state (lag, source unassigned,
+    // destination lagging).
+    let cache = Arc::new(CacheState::new());
+    cache.register_mirror_with_topic("warming-only", 2, None, false, "t", 0);
+    let app = router_with(Arc::clone(&cache));
+    let resp = app
+        .clone()
+        .oneshot(Request::get("/q/health/ready").body(Body::empty()).unwrap())
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::SERVICE_UNAVAILABLE);
+    let body: serde_json::Value = serde_json::from_slice(&body_bytes(resp).await).unwrap();
+    assert_eq!(body["ready"], "warming");
+
+    // Drive past the warming window so the slot is Ready, then push
+    // the broker end-offset out so it flips to LagBehindSource.
+    cache.apply_record("warming-only", &rec("t", 0, 0, "k0", Some(b"v0")));
+    cache.apply_record("warming-only", &rec("t", 0, 1, "k1", Some(b"v1")));
+    cache.set_broker_end_offset("warming-only", 50);
+    let resp = app
+        .oneshot(Request::get("/q/health/ready").body(Body::empty()).unwrap())
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::SERVICE_UNAVAILABLE);
+    let body: serde_json::Value = serde_json::from_slice(&body_bytes(resp).await).unwrap();
+    assert_eq!(body["ready"], "degraded");
+    assert_eq!(body["mirrors"][0]["status"], "lag_behind_source");
+    assert_eq!(body["mirrors"][0]["source"]["lag"], 48);
+}
+
+#[tokio::test]
+async fn cache_503_body_matches_readiness_mirror_entry() {
+    // The per-mirror cache 503 body must equal the corresponding
+    // `mirrors[i]` element of `/q/health/ready`. A consumer hitting
+    // either endpoint can parse the same shape.
+    let cache = Arc::new(CacheState::new());
+    cache.register_mirror_with_topic("warming", 2, None, false, "t", 7);
+    let app = router_with(Arc::clone(&cache));
+
+    let resp = app
+        .clone()
+        .oneshot(Request::get("/q/health/ready").body(Body::empty()).unwrap())
+        .await
+        .unwrap();
+    let ready_body: serde_json::Value = serde_json::from_slice(&body_bytes(resp).await).unwrap();
+    let expected_entry = &ready_body["mirrors"][0];
+
+    let resp = app
+        .oneshot(
+            Request::get("/cache/v1/warming/keys")
+                .body(Body::empty())
+                .unwrap(),
+        )
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::SERVICE_UNAVAILABLE);
+    let cache_body: serde_json::Value = serde_json::from_slice(&body_bytes(resp).await).unwrap();
+    assert_eq!(
+        &cache_body, expected_entry,
+        "503 body must be the same MirrorReadiness object as /q/health/ready returns"
+    );
+}
+
+#[tokio::test]
+async fn per_mirror_paths_serve_only_that_mirrors_view() {
+    // Two mirrors, each with its own keyspace. Hitting one mirror's
+    // /raw/{key} must not surface the other's keys, and vice-versa.
+    // Neither is `cache-v1-main`; the unprefixed paths must 404.
+    let cache = Arc::new(CacheState::new());
+    cache.register_mirror("a", 0, None, false);
+    cache.register_mirror("b", 0, None, false);
+    cache.apply_record("a", &rec("topic-a", 0, 0, "k-a", Some(b"va")));
+    cache.apply_record("b", &rec("topic-b", 0, 0, "k-b", Some(b"vb")));
+    let app = router_with(Arc::clone(&cache));
+
+    let resp = app
+        .clone()
+        .oneshot(
+            Request::get("/cache/v1/a/raw/k-a")
+                .body(Body::empty())
+                .unwrap(),
+        )
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::OK);
+    assert_eq!(body_bytes(resp).await, b"va");
+
+    // Cross-mirror miss: mirror b doesn't have k-a.
+    let resp = app
+        .clone()
+        .oneshot(
+            Request::get("/cache/v1/b/raw/k-a")
+                .body(Body::empty())
+                .unwrap(),
+        )
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::NOT_FOUND);
+
+    // No cache-v1-main: unprefixed paths route to nothing.
+    let resp = app
+        .oneshot(
+            Request::get("/cache/v1/raw/k-a")
+                .body(Body::empty())
+                .unwrap(),
+        )
+        .await
+        .unwrap();
+    assert_eq!(
+        resp.status(),
+        StatusCode::NOT_FOUND,
+        "no main mirror => unprefixed path not mounted"
+    );
+}
+
+#[tokio::test]
+async fn per_mirror_path_unknown_mirror_is_404() {
+    let cache = Arc::new(CacheState::new());
+    cache.register_mirror("real", 0, None, false);
+    let app = router_with(Arc::clone(&cache));
+    let resp = app
+        .oneshot(
+            Request::get("/cache/v1/missing/raw/anything")
+                .body(Body::empty())
+                .unwrap(),
+        )
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::NOT_FOUND);
+}
+
+#[tokio::test]
+async fn per_mirror_path_503_until_that_mirror_caught_up() {
+    // Per-mirror readiness gates each route independently: one
+    // mirror can already serve while the other is still warming up.
+    let cache = Arc::new(CacheState::new());
+    cache.register_mirror("ready-now", 0, None, false); // hwm 0 => ready
+    cache.register_mirror("warming", 2, None, false); // needs offsets 0..=1
+    let app = router_with(Arc::clone(&cache));
+
+    let resp = app
+        .clone()
+        .oneshot(
+            Request::get("/cache/v1/ready-now/keys")
+                .body(Body::empty())
+                .unwrap(),
+        )
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::OK);
+
+    let resp = app
+        .clone()
+        .oneshot(
+            Request::get("/cache/v1/warming/keys")
+                .body(Body::empty())
+                .unwrap(),
+        )
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::SERVICE_UNAVAILABLE);
+}
+
+#[tokio::test]
+async fn unprefixed_paths_dispatch_to_main_mirror_view() {
+    // Two mirrors; `main-m` is cache-v1-main. The unprefixed
+    // /cache/v1/keys must return main-m's keys only.
+    let cache = Arc::new(CacheState::new());
+    cache.register_mirror("main-m", 0, None, true);
+    cache.register_mirror("other", 0, None, false);
+    cache.apply_record("main-m", &rec("t", 0, 0, "main-key", Some(b"vm")));
+    cache.apply_record("other", &rec("t", 0, 0, "other-key", Some(b"vo")));
+    let app = router_with(Arc::clone(&cache));
+
+    let resp = app
+        .clone()
+        .oneshot(Request::get("/cache/v1/keys").body(Body::empty()).unwrap())
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::OK);
+    assert_eq!(body_bytes(resp).await, b"main-key\n");
+
+    let resp = app
+        .oneshot(
+            Request::get("/cache/v1/raw/other-key")
+                .body(Body::empty())
+                .unwrap(),
+        )
+        .await
+        .unwrap();
+    assert_eq!(
+        resp.status(),
+        StatusCode::NOT_FOUND,
+        "unprefixed path does not fall through to the non-main mirror"
+    );
+}
+
+#[tokio::test]
+async fn q_health_ready_is_not_in_openapi_spec() {
+    // Compat shim, intentionally undocumented; public surface is
+    // `/cache/v1` and `/_admin/v1` only.
+    let cache = Arc::new(CacheState::new());
+    cache.register_mirror("m", 0, None, true);
+    let app = router_with(Arc::clone(&cache));
+    let resp = app
+        .oneshot(Request::get("/openapi.json").body(Body::empty()).unwrap())
+        .await
+        .unwrap();
+    assert_eq!(resp.status(), StatusCode::OK);
+    let body = String::from_utf8(body_bytes(resp).await).unwrap();
+    assert!(
+        !body.contains("/q/health/ready"),
+        "/q/health/ready must stay off the OpenAPI spec; got: {body}"
+    );
+}
diff --git a/crates/mirror-config/Cargo.toml b/crates/mirror-config/Cargo.toml
index 34ecd11..bb66c74 100644
--- a/crates/mirror-config/Cargo.toml
+++ b/crates/mirror-config/Cargo.toml
@@ -13,3 +13,4 @@ serde_json = { workspace = true }
 serde_yaml = { workspace = true }
 schemars = { workspace = true }
 thiserror = { workspace = true }
+url = { workspace = true }
diff --git a/crates/mirror-config/src/lib.rs b/crates/mirror-config/src/lib.rs
index 07747ab..7628eca 100644
--- a/crates/mirror-config/src/lib.rs
+++ b/crates/mirror-config/src/lib.rs
@@ -67,6 +67,16 @@ pub struct KafkaDestination {
     /// the source.
     #[serde(default)]
     pub topic: Option<String>,
+    /// Whether this destination gates the mirror's readiness. When
+    /// `true` (default), the supervisor reports
+    /// `MirrorStatus::DestinationLagging` if this destination falls
+    /// behind the source by more than the configured tolerance,
+    /// and the structured `/q/health/ready` body names the
+    /// destination by `name`. Set `false` for best-effort secondary
+    /// destinations (observability replicas, archival sync) that
+    /// should not flip the mirror's status.
+    #[serde(default = "default_true")]
+    pub affects_readiness: bool,
 }
 
 #[derive(Debug, Clone, PartialEq, Serialize, Deserialize, JsonSchema)]
@@ -79,6 +89,9 @@ pub struct FilesystemDestination {
     pub name: Option<String>,
     /// Absolute path to the destination root directory.
     pub root: PathBuf,
+    /// See [`KafkaDestination::affects_readiness`].
+    #[serde(default = "default_true")]
+    pub affects_readiness: bool,
 }
 
 #[derive(Debug, Clone, PartialEq, Serialize, Deserialize, JsonSchema)]
@@ -99,6 +112,13 @@ pub struct S3Destination {
     /// Key prefix prepended to all written object keys.
     #[serde(default)]
     pub prefix: Option<String>,
+    /// See [`KafkaDestination::affects_readiness`].
+    #[serde(default = "default_true")]
+    pub affects_readiness: bool,
+}
+
+fn default_true() -> bool {
+    true
 }
 
 impl Destination {
@@ -121,6 +141,18 @@ impl Destination {
     pub fn is_blob(&self) -> bool {
         !matches!(self, Destination::Kafka(_))
     }
+
+    /// Whether this destination's progress gates the mirror's
+    /// readiness status. When false, the supervisor still tracks
+    /// `flushed_through` for observability but skips the destination
+    /// when computing `MirrorStatus::DestinationLagging`.
+    pub fn affects_readiness(&self) -> bool {
+        match self {
+            Destination::Kafka(k) => k.affects_readiness,
+            Destination::Filesystem(fs) => fs.affects_readiness,
+            Destination::S3(s3) => s3.affects_readiness,
+        }
+    }
 }
 
 #[derive(Debug, Clone, PartialEq, Serialize, Deserialize, JsonSchema)]
@@ -196,7 +228,7 @@ pub struct Mirror {
     pub http_access: Option<HttpAccess>,
 
     /// Whether mirror-v3 should actually spawn this mirror at
-    /// startup. Defaults to `true`. Plain YAML boolean only —
+    /// startup. Defaults to `true`. Plain YAML boolean only -
     /// `true` / `false` (and the YAML-1.2 case variants
     /// `True`/`False`/`TRUE`/`FALSE`). The YAML-1.1 truthy/falsy
     /// strings (`yes`/`no`/`on`/`off`) are deliberately NOT
@@ -218,6 +250,21 @@ pub struct Mirror {
     /// loudly so a misconfigured deployment doesn't silently idle.
     #[serde(default, skip_serializing_if = "Option::is_none")]
     pub enabled: Option<bool>,
+
+    /// Opt-in outbound webhook notify. Closes the legacy
+    /// `Yolean/kafka-keyvalue` (kkv) "onupdate" gap: when a record
+    /// lands in the mirror's view, POST to one or more downstream
+    /// services so their in-process caches can invalidate and
+    /// re-fetch via `/cache/v1/raw/<key>`.
+    ///
+    /// Today the only `api` variant is `kkv-v1`, which matches the
+    /// legacy kkv wire contract byte-for-byte so the upstream
+    /// `@yolean/kafka-keyvalue` Node client works unmodified.
+    ///
+    /// See `WEBHOOKS.md` at the repo root for the full design,
+    /// trigger modes, outcome matrix, and DNS-A fan-out semantics.
+    #[serde(default, skip_serializing_if = "Option::is_none")]
+    pub notify: Option<Notify>,
 }
 
 impl Mirror {
@@ -228,26 +275,302 @@ impl Mirror {
     }
 }
 
-/// HTTP read-access block. Today the only variant is the KKV-compatible
-/// `/cache/v1` surface; the field is grouped so future APIs can be
-/// added without re-shaping the YAML.
+// ============================================================
+//   Notify (outbound webhook) - kkv-v1 drop-in for now
+// ============================================================
+
+/// Per-mirror outbound notify block. Today only the `kkv-v1` API
+/// variant is supported; future variants (e.g. `nats-v1`, a
+/// `kkv-v2` with auth) hang off the same block without re-shaping.
+#[derive(Debug, Clone, PartialEq, Serialize, Deserialize, JsonSchema)]
+#[serde(deny_unknown_fields, rename_all = "kebab-case")]
+pub struct Notify {
+    pub api: NotifyApi,
+    /// One or more downstream targets. Each target carries its own
+    /// URL and fan-out mode. Multi-target notify fan-out is parallel
+    /// and per-target outcomes resolve independently.
+    pub targets: Vec<NotifyTarget>,
+    #[serde(default)]
+    pub trigger: NotifyTrigger,
+    /// Per-request HTTP timeout. Independent of retry policy: timing
+    /// out is one of the six outcomes whose action is configurable.
+    /// Spec default: 5000 ms.
+    #[serde(default = "default_notify_timeout_ms")]
+    pub timeout_ms: u64,
+    #[serde(default)]
+    pub retry: NotifyRetry,
+    #[serde(default)]
+    pub outcomes: NotifyOutcomes,
+}
+
+/// The wire-contract variant this notify block speaks. Today only
+/// the legacy kkv shape exists. New variants must explicitly opt
+/// in - kkv-v1 is not the default to avoid silently changing
+/// behaviour if we ever add e.g. a kkv-v2 with auth.
 #[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, JsonSchema)]
+#[serde(rename_all = "kebab-case")]
+pub enum NotifyApi {
+    /// `POST /kafka-keyvalue/v1/updates` with the legacy kkv body:
+    /// `{ topic, offsets, updates: { <key>: null } }`. Matches the
+    /// `@yolean/kafka-keyvalue` Node client's
+    /// `getOnUpdateRoute()` / `ON_UPDATE_DEFAULT_PATH`.
+    KkvV1,
+}
+
+#[derive(Debug, Clone, PartialEq, Serialize, Deserialize, JsonSchema)]
 #[serde(deny_unknown_fields, rename_all = "kebab-case")]
-pub struct HttpAccess {
-    pub api: HttpAccessApi,
+pub struct NotifyTarget {
+    /// Full URL of the target. Path defaults to
+    /// `/kafka-keyvalue/v1/updates` under `api: kkv-v1` if `path`
+    /// is unset; explicit override is allowed for non-kkv clients.
+    pub url: String,
+    /// Override the URL's path segment. Defaults to the
+    /// api-variant-defined path (`/kafka-keyvalue/v1/updates`
+    /// for kkv-v1).
+    #[serde(default, skip_serializing_if = "Option::is_none")]
+    pub path: Option<String>,
+    /// How the URL's host is resolved. `none` (default) sends one
+    /// POST to a single keep-alive connection; `dns-a` resolves
+    /// the host to its full A/AAAA record set and POSTs to every
+    /// returned address concurrently - the K8s-headless-Service
+    /// fan-out path without a Kubernetes API dependency.
+    #[serde(default)]
+    pub fan_out: FanOut,
+}
+
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, JsonSchema, Default)]
+#[serde(rename_all = "kebab-case")]
+pub enum FanOut {
+    /// Standard DNS, single keep-alive connection. Adequate for a
+    /// non-K8s target or a single-replica deployment.
+    #[default]
+    None,
+    /// Resolve the URL's host to all A/AAAA records and POST to
+    /// every address concurrently. Headless Kubernetes Services
+    /// return one A-record per pod, giving the same fan-out the
+    /// legacy kkv did via the Endpoints API.
+    DnsA,
+}
+
+#[derive(Debug, Clone, PartialEq, Serialize, Deserialize, JsonSchema)]
+#[serde(deny_unknown_fields, rename_all = "kebab-case")]
+pub struct NotifyTrigger {
+    pub on: TriggerOn,
+    /// Required when `on: source-consume`; forbidden when
+    /// `on: destination-flush` (the destination's own flush
+    /// triggers ARE the debounce in that mode). Defaults to
+    /// `{ max-records: 100, max-time-ms: 250 }`.
+    #[serde(default, skip_serializing_if = "Option::is_none")]
+    pub debounce: Option<NotifyDebounce>,
+}
+
+impl Default for NotifyTrigger {
+    fn default() -> Self {
+        Self {
+            on: TriggerOn::default(),
+            // `Some(...)` so the YAML-omitted case still has the
+            // spec-default {100, 250} window when source-consume
+            // applies. Validator can still reject explicit
+            // `destination-flush + debounce`.
+            debounce: Some(NotifyDebounce::default()),
+        }
+    }
+}
+
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, JsonSchema, Default)]
+#[serde(rename_all = "kebab-case")]
+pub enum TriggerOn {
+    /// POST as soon as the consume loop hands a record to the
+    /// mirror - bounded by the `debounce` window. Default;
+    /// matches legacy kkv behaviour.
+    #[default]
+    SourceConsume,
+    /// POST when *every* destination has durably committed past
+    /// the batch's high-water offset. The notify body's offset
+    /// range matches the flushed snapshot's `from`–`to`. Wrong
+    /// for cache invalidation; right for downstream archival
+    /// hints.
+    DestinationFlush,
+}
+
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, JsonSchema)]
+#[serde(deny_unknown_fields, rename_all = "kebab-case")]
+pub struct NotifyDebounce {
+    pub max_records: u64,
+    pub max_time_ms: u64,
+}
+
+impl Default for NotifyDebounce {
+    fn default() -> Self {
+        Self {
+            max_records: 100,
+            max_time_ms: 250,
+        }
+    }
+}
+
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, JsonSchema)]
+#[serde(deny_unknown_fields, rename_all = "kebab-case")]
+pub struct NotifyRetry {
+    pub max_attempts: u32,
+    pub backoff_ms: u64,
+}
+
+impl Default for NotifyRetry {
+    fn default() -> Self {
+        Self {
+            max_attempts: 5,
+            backoff_ms: 100,
+        }
+    }
+}
+
+fn default_notify_timeout_ms() -> u64 {
+    5000
+}
+
+/// The six request outcomes and what each one means for the mirror.
+/// Per-field omission falls back to the spec-default for that
+/// outcome only (one outcome being explicit doesn't force the
+/// others to be).
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, JsonSchema)]
+#[serde(deny_unknown_fields, rename_all = "kebab-case")]
+pub struct NotifyOutcomes {
+    #[serde(default = "default_outcome_timeout")]
+    pub timeout: NotifyOutcome,
+    #[serde(default = "default_outcome_connrefused")]
+    pub connrefused: NotifyOutcome,
+    /// HTTP 2xx - the only success outcome.
+    #[serde(rename = "2xx", default = "default_outcome_2xx")]
+    pub two_xx: NotifyOutcome,
+    /// HTTP 3xx - almost always misconfiguration on a webhook.
+    #[serde(rename = "3xx", default = "default_outcome_3xx")]
+    pub three_xx: NotifyOutcome,
+    /// HTTP 4xx - receiver says "your request is wrong";
+    /// retrying the same payload doesn't help.
+    #[serde(rename = "4xx", default = "default_outcome_4xx")]
+    pub four_xx: NotifyOutcome,
+    /// HTTP 5xx - receiver is transiently broken; retry per
+    /// policy and fail on exhaustion.
+    #[serde(rename = "5xx", default = "default_outcome_5xx")]
+    pub five_xx: NotifyOutcome,
+}
+
+impl Default for NotifyOutcomes {
+    fn default() -> Self {
+        Self {
+            timeout: default_outcome_timeout(),
+            connrefused: default_outcome_connrefused(),
+            two_xx: default_outcome_2xx(),
+            three_xx: default_outcome_3xx(),
+            four_xx: default_outcome_4xx(),
+            five_xx: default_outcome_5xx(),
+        }
+    }
+}
+
+fn default_outcome_timeout() -> NotifyOutcome {
+    NotifyOutcome {
+        retry: true,
+        final_: FinalAction::Fail,
+    }
+}
+fn default_outcome_connrefused() -> NotifyOutcome {
+    NotifyOutcome {
+        retry: true,
+        final_: FinalAction::Fail,
+    }
+}
+fn default_outcome_2xx() -> NotifyOutcome {
+    NotifyOutcome {
+        retry: false,
+        final_: FinalAction::Accept,
+    }
+}
+fn default_outcome_3xx() -> NotifyOutcome {
+    NotifyOutcome {
+        retry: false,
+        final_: FinalAction::Fail,
+    }
+}
+fn default_outcome_4xx() -> NotifyOutcome {
+    NotifyOutcome {
+        retry: false,
+        final_: FinalAction::Fail,
+    }
+}
+fn default_outcome_5xx() -> NotifyOutcome {
+    NotifyOutcome {
+        retry: true,
+        final_: FinalAction::Fail,
+    }
+}
+
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, JsonSchema)]
+#[serde(deny_unknown_fields, rename_all = "kebab-case")]
+pub struct NotifyOutcome {
+    /// If `true`, the request is retried per [`NotifyRetry`] before
+    /// [`Self::final_`] is applied. If `false`, the action in
+    /// [`Self::final_`] is taken on the first attempt.
+    pub retry: bool,
+    /// What happens once retries (if any) are exhausted.
+    #[serde(rename = "final")]
+    pub final_: FinalAction,
 }
 
-/// Variants of the read API surface mirror-v3 will host. Each opt-in
-/// mirror declares which one applies to it; today only `cache-v1`
-/// exists (a drop-in for `Yolean/kafka-keyvalue`'s `/cache/v1`).
 #[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, JsonSchema)]
 #[serde(rename_all = "kebab-case")]
-pub enum HttpAccessApi {
-    /// `/cache/v1/raw/{key}`, `/cache/v1/keys`, `/cache/v1/values`,
-    /// `/cache/v1/offset/{topic}/{partition}`. See the `mirror-cache`
-    /// crate for behavior and the committed OpenAPI 3.1 spec in
-    /// `schemas/mirror-v3.cache.openapi.json`.
-    CacheV1,
+pub enum FinalAction {
+    /// Treat the batch as delivered, advance.
+    Accept,
+    /// Log WARN, drop the batch, advance.
+    Skip,
+    /// Mirror task errors out; orchestrator restarts; mirror
+    /// replays from durable state on restart.
+    Fail,
+}
+
+/// HTTP read-access block. Multiple API surfaces can be enabled on
+/// the same mirror; each is configured by its presence under its
+/// own key. The map shape (rather than the original `{ api: ... }`
+/// enum) lets a mirror opt into more than one API and keeps room
+/// for per-API knobs without further config reshaping.
+#[derive(Debug, Clone, Default, PartialEq, Eq, Serialize, Deserialize, JsonSchema)]
+#[serde(deny_unknown_fields, rename_all = "kebab-case")]
+pub struct HttpAccess {
+    /// `/cache/v1/{mirror}/raw/{key}` etc. mounted at the mirror's
+    /// own name. Required if `cache-v1-main` is set. See the
+    /// `mirror-cache` crate for behavior and the committed OpenAPI
+    /// 3.1 spec in `schemas/mirror-v3.cache.openapi.json`.
+    #[serde(default, skip_serializing_if = "Option::is_none")]
+    pub cache_v1: Option<CacheV1Config>,
+    /// `/cache/v1/raw/{key}` etc. mounted at the unprefixed path,
+    /// dispatching to this mirror's per-mirror view. At most one
+    /// mirror in the whole config may set this; the validator
+    /// rejects more than one so a `cache-v1-main` consumer sees a
+    /// single deterministic view. Migration aid; once every consumer
+    /// has moved to `/cache/v1/{mirror}/...` it can be removed.
+    #[serde(default, skip_serializing_if = "Option::is_none")]
+    pub cache_v1_main: Option<CacheV1MainConfig>,
+}
+
+/// Per-API configuration block for `cache-v1`. Empty today, populated
+/// as the field is given operator-tunable knobs.
+#[derive(Debug, Clone, Default, PartialEq, Eq, Serialize, Deserialize, JsonSchema)]
+#[serde(deny_unknown_fields)]
+pub struct CacheV1Config {}
+
+/// Per-API configuration block for `cache-v1-main`. Empty today.
+#[derive(Debug, Clone, Default, PartialEq, Eq, Serialize, Deserialize, JsonSchema)]
+#[serde(deny_unknown_fields)]
+pub struct CacheV1MainConfig {}
+
+impl HttpAccess {
+    /// `true` if any API surface is enabled. Used at validator and
+    /// supervisor sites that don't care which one.
+    pub fn any_enabled(&self) -> bool {
+        self.cache_v1.is_some() || self.cache_v1_main.is_some()
+    }
 }
 
 #[derive(Debug, Clone, PartialEq, Serialize, Deserialize, JsonSchema)]
@@ -351,7 +674,7 @@ pub enum Compaction {
 #[serde(rename_all = "kebab-case")]
 pub enum DestinationFormat {
     /// Apache Parquet. Columnar, embedded schema, compressed.
-    /// Standard data-lake format — readable by DuckDB / Athena /
+    /// Standard data-lake format - readable by DuckDB / Athena /
     /// Spark out of the box.
     #[default]
     Parquet,
@@ -570,16 +893,59 @@ fn validate(cfg: &Config) -> Result<(), LoadError> {
         }
         validate_mirror(m)?;
     }
+    // Cross-mirror: `cache-v1-main` mounts the unprefixed
+    // /cache/v1/... routes onto exactly one mirror's view. Two
+    // mains would race over the same paths so the supervisor would
+    // never know which mirror to dispatch to; reject up front.
+    let mains: Vec<&str> = cfg
+        .mirrors
+        .iter()
+        .filter(|m| {
+            m.http_access
+                .as_ref()
+                .and_then(|h| h.cache_v1_main.as_ref())
+                .is_some()
+        })
+        .map(|m| m.name.as_str())
+        .collect();
+    if mains.len() > 1 {
+        return Err(LoadError::Validation(format!(
+            "`http-access.cache-v1-main` may be set on at most one mirror; \
+             found on: {mains:?}"
+        )));
+    }
     Ok(())
 }
 
+/// Path segments the `/cache/v1/...` router already binds at the
+/// top of the per-mirror tree. A mirror named after one of these
+/// would make `/cache/v1/{mirror}/raw/{key}` ambiguous against the
+/// literal `/cache/v1/keys` etc., so the validator refuses.
+const RESERVED_MIRROR_NAMES_AT_CACHE_V1: &[&str] = &["raw", "offset", "keys", "values"];
+
 fn validate_mirror(m: &Mirror) -> Result<(), LoadError> {
+    // Destinations-empty is allowed ONLY when notify is set with at
+    // least one target (the "notify-only mirror" shape - see
+    // WEBHOOKS.md). Other rules in this function are then either
+    // skipped (everything destination-shaped) or applied with
+    // tighter restrictions (e.g. http-access forbidden).
     if m.destinations.is_empty() {
-        return Err(LoadError::Validation(format!(
-            "mirror {:?}: `destinations` must contain at least one entry",
-            m.name
-        )));
+        let Some(notify) = m.notify.as_ref() else {
+            return Err(LoadError::Validation(format!(
+                "mirror {:?}: `destinations` must contain at least one entry, \
+                 unless `notify` is set (notify-only mirrors are allowed)",
+                m.name
+            )));
+        };
+        if notify.targets.is_empty() {
+            return Err(LoadError::Validation(format!(
+                "mirror {:?}: notify-only mirror requires `notify.targets` to be non-empty",
+                m.name
+            )));
+        }
+        return validate_notify_only(m, notify);
     }
+
     // Per-destination identifiers: explicit `name` is required when a
     // mirror has more than one destination (otherwise the default
     // `mirror.name` would collide). With exactly one destination,
@@ -614,7 +980,10 @@ fn validate_mirror(m: &Mirror) -> Result<(), LoadError> {
             ("compression", m.compression.is_some()),
             ("compaction", m.compaction.is_some()),
             ("flush", m.flush.is_some()),
-            ("http-access", m.http_access.is_some()),
+            (
+                "http-access",
+                m.http_access.as_ref().is_some_and(HttpAccess::any_enabled),
+            ),
         ] {
             if present {
                 return Err(LoadError::Validation(format!(
@@ -659,7 +1028,9 @@ fn validate_mirror(m: &Mirror) -> Result<(), LoadError> {
                 )));
             }
         }
-        if m.http_access.is_some() && matches!(keys.kind, ColumnType::Bytes) {
+        if m.http_access.as_ref().is_some_and(HttpAccess::any_enabled)
+            && matches!(keys.kind, ColumnType::Bytes)
+        {
             return Err(LoadError::Validation(format!(
                 "mirror {:?}: `http-access` requires `keys.type` ∈ {{utf8, json, json-parseable}}; \
                  /cache/v1 routes keys through URL path segments",
@@ -667,9 +1038,190 @@ fn validate_mirror(m: &Mirror) -> Result<(), LoadError> {
             )));
         }
     }
+
+    if let Some(http) = m.http_access.as_ref() {
+        // `cache-v1-main` mounts the unprefixed /cache/v1/... routes
+        // onto this mirror's per-mirror view; it has no value without
+        // the underlying per-mirror surface (and there is no separate
+        // legacy data path).
+        if http.cache_v1_main.is_some() && http.cache_v1.is_none() {
+            return Err(LoadError::Validation(format!(
+                "mirror {:?}: `http-access.cache-v1-main` requires `http-access.cache-v1` \
+                 on the same mirror",
+                m.name
+            )));
+        }
+        // The /cache/v1/{mirror}/raw/{key} router uses {mirror} as a
+        // path parameter directly under /cache/v1/. Names like
+        // `keys` would collide with the literal /cache/v1/keys path
+        // serving cache-v1-main.
+        if http.cache_v1.is_some() && RESERVED_MIRROR_NAMES_AT_CACHE_V1.contains(&m.name.as_str()) {
+            return Err(LoadError::Validation(format!(
+                "mirror {:?}: name collides with a `/cache/v1/...` literal segment ({:?}); \
+                 rename the mirror to enable `http-access.cache-v1`",
+                m.name, RESERVED_MIRROR_NAMES_AT_CACHE_V1
+            )));
+        }
+    }
+
+    // Notify on a mirror with destinations: per WEBHOOKS.md, the
+    // notify body says "go re-read via /cache/v1/raw/<key>". That's
+    // only meaningful when the per-mirror `cache-v1` API is enabled.
+    if let Some(notify) = m.notify.as_ref() {
+        let has_cache_v1 = m.http_access.as_ref().is_some_and(|h| h.cache_v1.is_some());
+        if !has_cache_v1 {
+            return Err(LoadError::Validation(format!(
+                "mirror {:?}: `notify` requires `http-access.cache-v1` on the same \
+                 mirror (the notify body tells consumers to re-read via /cache/v1)",
+                m.name
+            )));
+        }
+        validate_notify_shared(m, notify)?;
+    }
     Ok(())
 }
 
+/// Validation rules that apply to every notify block regardless of
+/// whether the mirror has destinations. URL parses, targets
+/// non-empty, debounce sanity, retry sanity, timeout sanity.
+fn validate_notify_shared(m: &Mirror, notify: &Notify) -> Result<(), LoadError> {
+    if notify.targets.is_empty() {
+        return Err(LoadError::Validation(format!(
+            "mirror {:?}: `notify.targets` must contain at least one entry",
+            m.name
+        )));
+    }
+    for (i, t) in notify.targets.iter().enumerate() {
+        match url::Url::parse(&t.url) {
+            Ok(u) => {
+                let scheme = u.scheme();
+                if scheme != "http" && scheme != "https" {
+                    return Err(LoadError::Validation(format!(
+                        "mirror {:?}: notify.targets[{i}].url must use scheme http or https, \
+                         got {scheme:?}",
+                        m.name
+                    )));
+                }
+                if u.host_str().map(str::is_empty).unwrap_or(true) {
+                    return Err(LoadError::Validation(format!(
+                        "mirror {:?}: notify.targets[{i}].url has no host",
+                        m.name
+                    )));
+                }
+            }
+            Err(e) => {
+                return Err(LoadError::Validation(format!(
+                    "mirror {:?}: notify.targets[{i}].url is not a valid URL: {e}",
+                    m.name
+                )));
+            }
+        }
+    }
+    if notify.timeout_ms < 1 {
+        return Err(LoadError::Validation(format!(
+            "mirror {:?}: `notify.timeout-ms` must be >= 1",
+            m.name
+        )));
+    }
+    if notify.retry.max_attempts < 1 {
+        return Err(LoadError::Validation(format!(
+            "mirror {:?}: `notify.retry.max-attempts` must be >= 1",
+            m.name
+        )));
+    }
+    if notify.retry.backoff_ms < 1 {
+        return Err(LoadError::Validation(format!(
+            "mirror {:?}: `notify.retry.backoff-ms` must be >= 1",
+            m.name
+        )));
+    }
+    match notify.trigger.on {
+        TriggerOn::SourceConsume => {
+            // `debounce` is required (the constructor default
+            // populates it; explicit `debounce: null` is rejected).
+            let debounce = notify.trigger.debounce.as_ref().ok_or_else(|| {
+                LoadError::Validation(format!(
+                    "mirror {:?}: `notify.trigger.debounce` is required when \
+                     `trigger.on: source-consume`",
+                    m.name
+                ))
+            })?;
+            if debounce.max_records < 1 {
+                return Err(LoadError::Validation(format!(
+                    "mirror {:?}: `notify.trigger.debounce.max-records` must be >= 1",
+                    m.name
+                )));
+            }
+            if debounce.max_time_ms < 1 {
+                return Err(LoadError::Validation(format!(
+                    "mirror {:?}: `notify.trigger.debounce.max-time-ms` must be >= 1",
+                    m.name
+                )));
+            }
+        }
+        TriggerOn::DestinationFlush => {
+            // The destination's own flush triggers ARE the debounce
+            // in this mode. Explicit debounce is redundant noise; we
+            // could tolerate it, but rejecting catches typos and
+            // makes the spec's "no `debounce` block applies" rule
+            // observable.
+            if notify.trigger.debounce.is_some() {
+                return Err(LoadError::Validation(format!(
+                    "mirror {:?}: `notify.trigger.debounce` is forbidden when \
+                     `trigger.on: destination-flush`; the destination flush triggers are the \
+                     debounce in that mode",
+                    m.name
+                )));
+            }
+            // The spec also rejects `destination-flush` on kafka-only
+            // mirrors - kafka commits per-record and has no
+            // observable batch flushes. That rule is enforced
+            // transitively here: notify requires http-access, and
+            // http-access is incompatible with kafka-only destinations
+            // (see `has_blob` checks above), so any kafka-only mirror
+            // with a notify block is already rejected with a clearer
+            // message before this point. No separate check needed.
+        }
+    }
+    Ok(())
+}
+
+/// Extra restrictions on top of [`validate_notify_shared`] when the
+/// mirror has no destinations: notify is the only side-effect, so
+/// destination-shaped fields are all forbidden, http-access is
+/// forbidden, and trigger.on must be source-consume.
+fn validate_notify_only(m: &Mirror, notify: &Notify) -> Result<(), LoadError> {
+    for (field, present) in [
+        ("format", m.format.is_some()),
+        ("compression", m.compression.is_some()),
+        ("keys", m.keys.is_some()),
+        ("values", m.values.is_some()),
+        ("compaction", m.compaction.is_some()),
+        ("flush", m.flush.is_some()),
+        ("timestamp-mode", m.timestamp_mode.is_some()),
+        (
+            "http-access",
+            m.http_access.as_ref().is_some_and(HttpAccess::any_enabled),
+        ),
+    ] {
+        if present {
+            return Err(LoadError::Validation(format!(
+                "mirror {:?}: notify-only mirrors (no destinations) cannot set `{field}`; \
+                 there is nothing for it to apply to",
+                m.name
+            )));
+        }
+    }
+    if matches!(notify.trigger.on, TriggerOn::DestinationFlush) {
+        return Err(LoadError::Validation(format!(
+            "mirror {:?}: notify-only mirrors must use `trigger.on: source-consume` \
+             (no destinations to flush)",
+            m.name
+        )));
+    }
+    validate_notify_shared(m, notify)
+}
+
 fn raw_destination_name(d: &Destination) -> Option<&str> {
     match d {
         Destination::Kafka(k) => k.name.as_deref(),
diff --git a/crates/mirror-config/tests/loading.rs b/crates/mirror-config/tests/loading.rs
index 4f0923a..acb8eff 100644
--- a/crates/mirror-config/tests/loading.rs
+++ b/crates/mirror-config/tests/loading.rs
@@ -1,7 +1,7 @@
 use mirror_config::{
-    load_from_str, ColumnConfig, ColumnType, Compaction, Config, Destination, DestinationFormat,
-    FilesystemDestination, FlushTriggers, HttpAccess, HttpAccessApi, KafkaDestination, KafkaSource,
-    Mirror, S3Destination, TimestampMode,
+    load_from_str, CacheV1Config, ColumnConfig, ColumnType, Compaction, Config, Destination,
+    DestinationFormat, FilesystemDestination, FlushTriggers, HttpAccess, KafkaDestination,
+    KafkaSource, Mirror, S3Destination, TimestampMode,
 };
 use std::path::PathBuf;
 
@@ -35,6 +35,7 @@ fn parses_minimal_kafka_config() {
                     name: None,
                     bootstrap_servers: "redpanda:9092".into(),
                     topic: None,
+                    affects_readiness: true,
                 })],
                 format: None,
                 compression: None,
@@ -45,6 +46,7 @@ fn parses_minimal_kafka_config() {
                 timestamp_mode: None,
                 http_access: None,
                 enabled: None,
+                notify: None,
             }],
         }
     );
@@ -119,6 +121,7 @@ mirrors:
         Destination::Filesystem(FilesystemDestination {
             name: None,
             root: PathBuf::from("/var/mirror-v3"),
+            affects_readiness: true,
         })
     );
     let m = &cfg.mirrors[0];
@@ -166,10 +169,40 @@ mirrors:
             region: "us-east-1".into(),
             bucket: "mirror-v3".into(),
             prefix: Some("archive/".into()),
+            affects_readiness: true,
         })
     );
 }
 
+#[test]
+fn affects_readiness_defaults_true_and_overrides() {
+    let yaml = r#"
+mirrors:
+  - name: dual
+    source: { bootstrap-servers: source:9092 }
+    topic: dual
+    partition: 0
+    destinations:
+      - type: kafka
+        name: primary
+        bootstrap-servers: primary:9092
+      - type: kafka
+        name: ghost
+        bootstrap-servers: ghost:9092
+        affects-readiness: false
+"#;
+    let cfg = load_from_str(yaml).expect("must parse");
+    let dests = &cfg.mirrors[0].destinations;
+    assert!(
+        dests[0].affects_readiness(),
+        "default must be true when omitted"
+    );
+    assert!(
+        !dests[1].affects_readiness(),
+        "explicit affects-readiness: false must round-trip"
+    );
+}
+
 #[test]
 fn tee_fs_and_s3_with_explicit_names_parses() {
     // The PoC payoff: one mirror, two destinations, distinct names.
@@ -596,7 +629,7 @@ mirrors:
       - type: filesystem
         root: /tmp/mirror
     http-access:
-      api: cache-v1
+      cache-v1: {}
     flush:
       max-time-ms: 5000
       max-bytes: 1000
@@ -606,7 +639,8 @@ mirrors:
     assert_eq!(
         cfg.mirrors[0].http_access,
         Some(HttpAccess {
-            api: HttpAccessApi::CacheV1
+            cache_v1: Some(CacheV1Config {}),
+            cache_v1_main: None,
         })
     );
 }
@@ -623,7 +657,7 @@ mirrors:
       - type: kafka
         bootstrap-servers: redpanda:9092
     http-access:
-      api: cache-v1
+      cache-v1: {}
 "#;
     let err = load_from_str(yaml).expect_err("http-access on kafka-only mirror must be rejected");
     let msg = format!("{err}");
@@ -646,7 +680,7 @@ mirrors:
         root: /tmp/mirror
     keys: { type: bytes }
     http-access:
-      api: cache-v1
+      cache-v1: {}
     flush:
       max-time-ms: 5000
       max-bytes: 1000
@@ -672,7 +706,7 @@ mirrors:
       - type: filesystem
         root: /tmp/mirror
     http-access:
-      api: cache-v1
+      cache-v1: {}
     flush:
       max-time-ms: 5000
       max-bytes: 1000
@@ -785,3 +819,118 @@ mirrors:
     assert_eq!(cfg.mirrors[0].timestamp_mode, Some(TimestampMode::Source));
     assert_eq!(cfg.mirrors[0].format, Some(DestinationFormat::Parquet));
 }
+
+#[test]
+fn http_access_cache_v1_main_requires_cache_v1() {
+    // Without the per-mirror surface there's no view for the
+    // unprefixed /cache/v1/... paths to dispatch to.
+    let yaml = r#"
+mirrors:
+  - name: ops
+    source: { bootstrap-servers: kafka:9092 }
+    topic: ops
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /tmp/mirror
+    http-access:
+      cache-v1-main: {}
+    flush: { max-time-ms: 5000, max-bytes: 1000, max-offsets: 100 }
+"#;
+    let err = load_from_str(yaml).expect_err("cache-v1-main alone must be rejected");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("cache-v1-main") && msg.contains("requires `http-access.cache-v1`"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn http_access_cache_v1_main_at_most_one_mirror() {
+    let yaml = r#"
+mirrors:
+  - name: ops
+    source: { bootstrap-servers: kafka:9092 }
+    topic: ops
+    partition: 0
+    destinations: [{ type: filesystem, root: /tmp/ops }]
+    http-access: { cache-v1: {}, cache-v1-main: {} }
+    flush: { max-time-ms: 5000, max-bytes: 1000, max-offsets: 100 }
+  - name: users
+    source: { bootstrap-servers: kafka:9092 }
+    topic: users
+    partition: 0
+    destinations: [{ type: filesystem, root: /tmp/users }]
+    http-access: { cache-v1: {}, cache-v1-main: {} }
+    flush: { max-time-ms: 5000, max-bytes: 1000, max-offsets: 100 }
+"#;
+    let err = load_from_str(yaml).expect_err("two cache-v1-main mirrors must be rejected");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("cache-v1-main") && msg.contains("at most one"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn http_access_cache_v1_main_one_mirror_ok() {
+    // Singleton is allowed; sibling mirror enables only cache-v1.
+    let yaml = r#"
+mirrors:
+  - name: ops
+    source: { bootstrap-servers: kafka:9092 }
+    topic: ops
+    partition: 0
+    destinations: [{ type: filesystem, root: /tmp/ops }]
+    http-access: { cache-v1: {}, cache-v1-main: {} }
+    flush: { max-time-ms: 5000, max-bytes: 1000, max-offsets: 100 }
+  - name: users
+    source: { bootstrap-servers: kafka:9092 }
+    topic: users
+    partition: 0
+    destinations: [{ type: filesystem, root: /tmp/users }]
+    http-access: { cache-v1: {} }
+    flush: { max-time-ms: 5000, max-bytes: 1000, max-offsets: 100 }
+"#;
+    let cfg = load_from_str(yaml).expect("must parse");
+    assert!(cfg.mirrors[0]
+        .http_access
+        .as_ref()
+        .unwrap()
+        .cache_v1_main
+        .is_some());
+    assert!(cfg.mirrors[1]
+        .http_access
+        .as_ref()
+        .unwrap()
+        .cache_v1_main
+        .is_none());
+}
+
+#[test]
+fn http_access_rejects_mirror_name_colliding_with_literal_path_segment() {
+    // Mirror named `keys` would make /cache/v1/keys/raw/<key> race
+    // against the literal /cache/v1/keys served for cache-v1-main.
+    for name in ["raw", "offset", "keys", "values"] {
+        let yaml = format!(
+            r#"
+mirrors:
+  - name: {name}
+    source: {{ bootstrap-servers: kafka:9092 }}
+    topic: t
+    partition: 0
+    destinations: [{{ type: filesystem, root: /tmp/m }}]
+    http-access: {{ cache-v1: {{}} }}
+    flush: {{ max-time-ms: 5000, max-bytes: 1000, max-offsets: 100 }}
+"#
+        );
+        let err = load_from_str(&yaml)
+            .err()
+            .unwrap_or_else(|| panic!("mirror name {name:?} must be rejected"));
+        let msg = format!("{err}");
+        assert!(
+            msg.contains("collides") && msg.contains(name),
+            "name {name:?}, got: {msg}"
+        );
+    }
+}
diff --git a/crates/mirror-config/tests/notify.rs b/crates/mirror-config/tests/notify.rs
new file mode 100644
index 0000000..5f2e925
--- /dev/null
+++ b/crates/mirror-config/tests/notify.rs
@@ -0,0 +1,611 @@
+//! Parse + validation tests for the `notify` block (WEBHOOKS.md).
+//!
+//! Each rule from "Validation" in WEBHOOKS.md is one test. The
+//! positive-path tests are also worth keeping because they pin
+//! the spec's defaults - if a future commit changes
+//! `notify.timeout-ms`'s default from 5000, `defaults_apply_when_omitted`
+//! fails and the operator-facing semantics get reviewed.
+
+use mirror_config::{
+    load_from_str, FinalAction, NotifyApi, NotifyDebounce, NotifyOutcome, NotifyRetry, TriggerOn,
+};
+
+/// Helper: minimal mirror with destinations + http-access + a kkv-v1
+/// notify block. Used by the positive-path tests so each assertion
+/// only varies the field under test.
+const MINIMAL_WITH_NOTIFY: &str = r#"
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events-stream
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/mirror
+    format: parquet
+    compression: zstd-1
+    http-access: { cache-v1: {} }
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://events-cache:8080
+"#;
+
+#[test]
+fn minimal_notify_block_parses_with_all_defaults() {
+    let cfg = load_from_str(MINIMAL_WITH_NOTIFY).expect("must parse");
+    let m = &cfg.mirrors[0];
+    let notify = m.notify.as_ref().expect("notify must be present");
+
+    assert_eq!(notify.api, NotifyApi::KkvV1);
+    assert_eq!(notify.targets.len(), 1);
+    assert_eq!(notify.targets[0].url, "http://events-cache:8080");
+    assert_eq!(notify.targets[0].path, None);
+    assert_eq!(notify.targets[0].fan_out, mirror_config::FanOut::None);
+
+    // Spec-default trigger + debounce.
+    assert_eq!(notify.trigger.on, TriggerOn::SourceConsume);
+    assert_eq!(
+        notify.trigger.debounce,
+        Some(NotifyDebounce {
+            max_records: 100,
+            max_time_ms: 250
+        })
+    );
+
+    // Spec-default timeout / retry.
+    assert_eq!(notify.timeout_ms, 5000);
+    assert_eq!(
+        notify.retry,
+        NotifyRetry {
+            max_attempts: 5,
+            backoff_ms: 100
+        }
+    );
+
+    // Spec-default outcomes table.
+    let o = notify.outcomes;
+    assert_eq!(o.timeout, ok_retry_fail());
+    assert_eq!(o.connrefused, ok_retry_fail());
+    assert_eq!(o.two_xx, no_retry_accept());
+    assert_eq!(o.three_xx, no_retry_fail());
+    assert_eq!(o.four_xx, no_retry_fail());
+    assert_eq!(o.five_xx, ok_retry_fail());
+}
+
+#[test]
+fn explicit_outcomes_override_per_field() {
+    // Operators can override only the outcomes they care about; the
+    // rest still fall back to spec defaults. Test sets 4xx to skip,
+    // expects others to stay default.
+    let yaml = format!(
+        "{MINIMAL_WITH_NOTIFY}      outcomes:\n        4xx: {{ retry: false, final: skip }}\n"
+    );
+    let cfg = load_from_str(&yaml).expect("must parse");
+    let o = cfg.mirrors[0].notify.as_ref().unwrap().outcomes;
+    assert_eq!(
+        o.four_xx,
+        NotifyOutcome {
+            retry: false,
+            final_: FinalAction::Skip
+        }
+    );
+    // Others kept their defaults.
+    assert_eq!(o.timeout, ok_retry_fail());
+    assert_eq!(o.two_xx, no_retry_accept());
+}
+
+#[test]
+fn destination_flush_trigger_parses_without_debounce() {
+    let yaml = format!("{MINIMAL_WITH_NOTIFY}      trigger:\n        on: destination-flush\n");
+    let cfg = load_from_str(&yaml).expect("must parse");
+    let trigger = &cfg.mirrors[0].notify.as_ref().unwrap().trigger;
+    assert_eq!(trigger.on, TriggerOn::DestinationFlush);
+    assert_eq!(trigger.debounce, None);
+}
+
+#[test]
+fn target_path_and_fanout_parse_when_set() {
+    let yaml = r#"
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/mirror
+    http-access: { cache-v1: {} }
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://my-headless-service:8080
+          path: /custom/path
+          fan-out: dns-a
+"#;
+    let cfg = load_from_str(yaml).expect("must parse");
+    let t = &cfg.mirrors[0].notify.as_ref().unwrap().targets[0];
+    assert_eq!(t.path.as_deref(), Some("/custom/path"));
+    assert_eq!(t.fan_out, mirror_config::FanOut::DnsA);
+}
+
+// ============================================================
+//   Validation failures
+// ============================================================
+
+#[test]
+fn notify_without_http_access_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/mirror
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://events-cache:8080
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("notify") && msg.contains("http-access"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn notify_with_empty_targets_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/mirror
+    http-access: { cache-v1: {} }
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
+    notify:
+      api: kkv-v1
+      targets: []
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("notify.targets") && msg.contains("at least one"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn notify_target_with_invalid_url_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/mirror
+    http-access: { cache-v1: {} }
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
+    notify:
+      api: kkv-v1
+      targets:
+        - url: "not a url at all"
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("notify.targets[0].url") && msg.contains("not a valid URL"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn notify_target_with_non_http_scheme_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/mirror
+    http-access: { cache-v1: {} }
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
+    notify:
+      api: kkv-v1
+      targets:
+        - url: ftp://still-a-url-but-wrong-scheme:21
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("scheme http or https") && msg.contains("ftp"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn destination_flush_trigger_with_explicit_debounce_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/mirror
+    http-access: { cache-v1: {} }
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://events-cache:8080
+      trigger:
+        on: destination-flush
+        debounce: { max-records: 100, max-time-ms: 250 }
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("debounce") && msg.contains("destination-flush"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn debounce_zero_max_records_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/mirror
+    http-access: { cache-v1: {} }
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://events-cache:8080
+      trigger:
+        on: source-consume
+        debounce: { max-records: 0, max-time-ms: 250 }
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("debounce.max-records") && msg.contains(">= 1"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn zero_timeout_ms_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/mirror
+    http-access: { cache-v1: {} }
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://events-cache:8080
+      timeout-ms: 0
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("timeout-ms") && msg.contains(">= 1"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn zero_retry_max_attempts_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/mirror
+    http-access: { cache-v1: {} }
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://events-cache:8080
+      retry:
+        max-attempts: 0
+        backoff-ms: 100
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("retry.max-attempts") && msg.contains(">= 1"),
+        "got: {msg}"
+    );
+}
+
+// ============================================================
+//   Notify-only mirrors (destinations: [])
+// ============================================================
+
+#[test]
+fn notify_only_mirror_parses() {
+    let yaml = r#"
+mirrors:
+  - name: invalidator
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations: []
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://cache-target:8080
+          fan-out: dns-a
+"#;
+    let cfg = load_from_str(yaml).expect("must parse");
+    let m = &cfg.mirrors[0];
+    assert!(m.destinations.is_empty());
+    assert!(m.notify.is_some());
+}
+
+#[test]
+fn destinations_empty_without_notify_still_rejected() {
+    // Regression: the pre-WEBHOOKS rule (destinations must be
+    // non-empty) survives unless notify is present.
+    let yaml = r#"
+mirrors:
+  - name: empty
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations: []
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("destinations") && msg.contains("at least one"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn notify_only_with_destination_flush_trigger_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: invalidator
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations: []
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://cache-target:8080
+      trigger:
+        on: destination-flush
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("notify-only") && msg.contains("source-consume"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn notify_only_with_http_access_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: invalidator
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations: []
+    http-access: { cache-v1: {} }
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://cache-target:8080
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("notify-only") && msg.contains("http-access"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn notify_only_with_format_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: invalidator
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations: []
+    format: parquet
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://cache-target:8080
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("notify-only") && msg.contains("format"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn notify_only_with_flush_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: invalidator
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations: []
+    flush:
+      max-time-ms: 5000
+      max-bytes: 1000
+      max-offsets: 100
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://cache-target:8080
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("notify-only") && msg.contains("flush"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn notify_only_with_empty_targets_rejected() {
+    let yaml = r#"
+mirrors:
+  - name: invalidator
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations: []
+    notify:
+      api: kkv-v1
+      targets: []
+"#;
+    let err = load_from_str(yaml).expect_err("must reject");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("notify-only") && msg.contains("targets"),
+        "got: {msg}"
+    );
+}
+
+// ============================================================
+//   Helpers
+// ============================================================
+
+fn ok_retry_fail() -> NotifyOutcome {
+    NotifyOutcome {
+        retry: true,
+        final_: FinalAction::Fail,
+    }
+}
+
+fn no_retry_fail() -> NotifyOutcome {
+    NotifyOutcome {
+        retry: false,
+        final_: FinalAction::Fail,
+    }
+}
+
+fn no_retry_accept() -> NotifyOutcome {
+    NotifyOutcome {
+        retry: false,
+        final_: FinalAction::Accept,
+    }
+}
+
+#[test]
+fn destination_flush_with_only_kafka_destination_is_rejected_transitively() {
+    // Per WEBHOOKS.md: "A mirror with no blob destinations (kafka-
+    // only) cannot use `destination-flush`". The validator enforces
+    // this transitively: notify requires http-access, http-access
+    // requires ≥1 blob destination - so kafka-only + notify is
+    // already rejected, regardless of trigger mode. This test pins
+    // that the rejection happens.
+    let yaml = r#"
+mirrors:
+  - name: events
+    source: { bootstrap-servers: kafka:9092 }
+    topic: events
+    partition: 0
+    destinations:
+      - type: kafka
+        bootstrap-servers: kafka:9092
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://target:8080
+      trigger:
+        on: destination-flush
+"#;
+    let err = load_from_str(yaml).expect_err("kafka-only + notify must be rejected");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("notify") || msg.contains("http-access"),
+        "got: {msg}"
+    );
+}
+
+#[test]
+fn destination_flush_with_filesystem_destination_is_accepted() {
+    let yaml = format!("{MINIMAL_WITH_NOTIFY}      trigger:\n        on: destination-flush\n");
+    let cfg = load_from_str(&yaml).expect("must parse");
+    assert_eq!(
+        cfg.mirrors[0].notify.as_ref().unwrap().trigger.on,
+        TriggerOn::DestinationFlush
+    );
+}
diff --git a/crates/mirror-core/src/cache.rs b/crates/mirror-core/src/cache.rs
index 58895b6..7be54d3 100644
--- a/crates/mirror-core/src/cache.rs
+++ b/crates/mirror-core/src/cache.rs
@@ -1,12 +1,14 @@
-//! Shared in-memory cache view for `http-access: { api: cache-v1 }`
+//! Per-mirror in-memory cache views for `http-access: { cache-v1: {} }`
 //! mirrors.
 //!
-//! mirror-v3's KKV-compatibility mode keeps a merged `key → latest
-//! value` map of every record consumed by every opt-in mirror. This
-//! module owns the cross-task state behind an `Arc<CacheState>`: the
-//! sinks update it from the consume loop (per-record, *not* per-flush
-//! — freshness is independent of bucket-write cadence), and the HTTP
-//! handlers in `mirror-cache` read from it.
+//! Each opt-in mirror owns its own `key → latest value` map and
+//! `(topic, partition) → offset` map; the sinks update those from
+//! the consume loop (per-record, *not* per-flush — freshness is
+//! independent of bucket-write cadence), and the HTTP handlers in
+//! `mirror-cache` read them out under
+//! `/cache/v1/{mirror}/...`. A single mirror may additionally
+//! enable `cache-v1-main`, in which case `mirror-cache` mounts the
+//! unprefixed `/cache/v1/...` paths onto that mirror's view.
 //!
 //! ## Monotonicity
 //!
@@ -21,12 +23,14 @@
 //! Each participating mirror declares a `bootstrap_hwm` at sink
 //! open (`fetch_high_watermark` against the source partition). Once a
 //! mirror's last-applied offset has caught up to its bootstrap
-//! watermark, it is "ready"; once *every* registered mirror is
-//! ready, [`CacheState::is_ready`] flips to `true` and stays true.
-//! HTTP handlers gate on this; they return 503 until it flips.
+//! watermark, it is "ready"; per-mirror HTTP handlers gate on
+//! [`CacheState::is_mirror_ready`] and return 503 until that mirror
+//! flips. The aggregate [`CacheState::is_ready`] flips only when
+//! *every* registered mirror is ready, and backs the `/q/health/ready`
+//! drop-in.
 
 use std::collections::HashMap;
-use std::sync::atomic::{AtomicBool, Ordering};
+use std::sync::atomic::{AtomicBool, AtomicU64, Ordering};
 use std::sync::{Arc, RwLock};
 
 use indexmap::IndexMap;
@@ -65,33 +69,121 @@ pub struct TopicPartitionOffset {
     pub offset: u64,
 }
 
-/// Per-mirror readiness slot. The supervisor (mirror-bin) creates
-/// one per opt-in mirror at startup, populates `bootstrap_hwm`, and
-/// stores the slot in [`CacheState`]. The sink's per-record path
-/// flips the slot to `caught_up` once its last-seen offset has
-/// crossed `bootstrap_hwm`.
+/// Enum status for a registered mirror. Carries the names + lag
+/// values needed for the structured `/q/health/ready` body so an
+/// on-call engineer can grep the response for the unhealthy source
+/// or destination.
+#[derive(Debug, Clone, PartialEq, Eq)]
+pub enum MirrorStatus {
+    /// Has not yet reached `bootstrap_hwm` for the first time since
+    /// this process started. Cache HTTP returns 503; notify
+    /// dispatcher continues to suppress per the per-record
+    /// threshold check.
+    Warming,
+    /// Source assignment OK, lag within tolerance, no gating
+    /// destination is behind. Cache HTTP returns 200.
+    Ready,
+    /// Source-side lag exceeds the readiness tolerance. Cache HTTP
+    /// returns 503. `lag = broker_end_offset - last_applied_offset`.
+    LagBehindSource { lag: u64 },
+    /// The Kafka consumer's `assignment()` doesn't include this
+    /// mirror's (topic, partition). Set by the supervisor's
+    /// assignment poller (lands in commit 8); cleared when the
+    /// partition reappears.
+    SourceUnassigned { topic: String, partition: u32 },
+    /// A gating destination is behind on its `flushed_through`.
+    /// Reported by the supervisor's per-destination ack tracker
+    /// (mirror-bin); never set by `CacheState` itself.
+    DestinationLagging { name: String, lag: u64 },
+}
+
+/// One mirror's row in a [`CacheState::status_snapshot`] result.
+/// Serialised verbatim into the structured `/q/health/ready` body
+/// and into the per-mirror cache 503 body, so a downstream consumer
+/// can parse a single shape across both endpoints.
+#[derive(Debug, Clone, PartialEq, Eq)]
+pub struct MirrorStatusSnapshot {
+    pub name: String,
+    pub topic: String,
+    pub partition: u32,
+    pub source_assigned: bool,
+    pub last_applied_offset: u64,
+    pub broker_end_offset: u64,
+    pub status: MirrorStatus,
+}
+
 #[derive(Debug)]
-struct MirrorReadiness {
+struct MirrorSlot {
     bootstrap_hwm: u64,
-    caught_up: AtomicBool,
+    /// Offset strictly below which the notify dispatcher suppresses
+    /// records. Computed at register time as
+    /// `max(last_committed_offset, bootstrap_hwm if no commit)`:
+    ///
+    ///   * Fresh deploy (no broker-committed offset for the group):
+    ///     `suppression_threshold = bootstrap_hwm`. Records during
+    ///     the first replay-to-current window don't fan webhooks
+    ///     out to consumers.
+    ///   * Returning deploy (group has a previously-committed
+    ///     offset `C`): `suppression_threshold = C`. Records `[C,
+    ///     bootstrap_hwm)` represent the between-pods gap and DO
+    ///     fire webhooks — the previous pod was supposed to deliver
+    ///     them but exited before doing so. Records below `C` are
+    ///     suppressed because the previous pod already delivered
+    ///     them.
+    ///
+    /// Set once at registration; read-only thereafter. Stored as
+    /// `u64` rather than `AtomicU64` because it never mutates.
+    suppression_threshold: u64,
+    /// Source-partition identity. Used by the assignment-loss path
+    /// and the structured readiness response body.
+    topic: String,
+    partition: u32,
+    /// Atomically updated by [`apply_record`]. The slot's view of
+    /// "highest source offset I've applied" for this mirror,
+    /// independent of the per-`TopicPartition` `offsets` map (which
+    /// has finer granularity but isn't read on the readiness path).
+    last_applied_offset: AtomicU64,
+    /// Broker end offset for the mirror's source partition. Initial
+    /// value `bootstrap_hwm`; updated by the supervisor's end-offset
+    /// poller (commit 8). Used by the readiness predicate as
+    /// `lag = broker_end_offset - last_applied_offset`.
+    broker_end_offset: AtomicU64,
+    /// `true` when the Kafka consumer reports the mirror's
+    /// `(topic, partition)` in its `assignment()`. Set by the
+    /// supervisor's assignment poller (commit 8); flipped to `false`
+    /// transitions the slot to [`MirrorStatus::SourceUnassigned`].
+    source_assigned: AtomicBool,
+    /// Cached current status. Recomputed by the supervisor or by
+    /// `apply_record` whenever an input atom changes. The HTTP
+    /// handlers take a read lock here on every probe.
+    status: RwLock<MirrorStatus>,
+    /// `key → latest-value` for this mirror only. Iteration order is
+    /// insertion order (the position a key gets the *first* time
+    /// it's seen). Overwrites don't change position. Tombstones
+    /// shift subsequent keys down.
+    view: RwLock<IndexMap<String, Vec<u8>>>,
+    /// Last-seen source offset per (topic, partition) within this
+    /// mirror. Monotonic.
+    offsets: RwLock<HashMap<TopicPartition, u64>>,
 }
 
 #[derive(Debug, Default)]
 pub struct CacheState {
-    /// Merged key → latest-value across every opt-in mirror.
-    /// Iteration order is **insertion order**: the position a key
-    /// gets the *first* time it's seen. Overwrites don't change
-    /// position. Tombstones shift subsequent keys down to fill the
-    /// gap. Clients that want a sorted listing sort client-side.
-    view: RwLock<IndexMap<String, Vec<u8>>>,
-    /// Last-seen source offset per (topic, partition). Monotonic.
-    offsets: RwLock<HashMap<TopicPartition, u64>>,
-    /// Per-mirror readiness slots, keyed by the mirror's
-    /// configuration name (unique per process).
-    mirrors: RwLock<HashMap<String, MirrorReadiness>>,
-    /// Sticky global ready flag. Flips to `true` once every
-    /// registered mirror has caught up; never flips back.
-    ready: AtomicBool,
+    /// Per-mirror slots, keyed by the mirror's configuration name
+    /// (unique per process).
+    mirrors: RwLock<HashMap<String, MirrorSlot>>,
+    /// Name of the mirror that opted into `cache-v1-main`, if any.
+    /// `mirror-cache` consults this to decide whether to mount the
+    /// unprefixed `/cache/v1/...` routes and which slot to dispatch
+    /// them to. Sticky for the lifetime of the process — set at
+    /// startup, never re-assigned. Validator enforces at-most-one.
+    main_mirror: RwLock<Option<String>>,
+    /// Lag (in offsets) tolerated before [`MirrorStatus::Ready`]
+    /// flips to [`MirrorStatus::LagBehindSource`]. Default is
+    /// `0` (any positive lag fires); the supervisor overrides via
+    /// [`Self::with_readiness_lag_tolerance`] from
+    /// `MIRROR_V3_READINESS_LAG`.
+    readiness_lag_tolerance: u64,
 }
 
 impl CacheState {
@@ -99,6 +191,15 @@ impl CacheState {
         Self::default()
     }
 
+    /// Override the per-`MirrorSlot` lag tolerance. The supervisor
+    /// reads `MIRROR_V3_READINESS_LAG` and calls this before
+    /// registering any mirror. Tests use it to construct a slot that
+    /// tolerates a deliberately-injected lag value.
+    pub fn with_readiness_lag_tolerance(mut self, tolerance: u64) -> Self {
+        self.readiness_lag_tolerance = tolerance;
+        self
+    }
+
     /// Register an opt-in mirror with its source-partition high
     /// watermark captured at startup. Must be called once per mirror
     /// before any `apply_record` for that mirror runs.
@@ -106,38 +207,126 @@ impl CacheState {
     /// `bootstrap_hwm` is the Kafka high-watermark (one past the last
     /// existing offset). An empty topic has `bootstrap_hwm = 0` and
     /// the mirror is immediately considered caught up.
-    pub fn register_mirror(&self, mirror_name: &str, bootstrap_hwm: u64) {
-        let caught_up = bootstrap_hwm == 0;
-        {
-            let mut m = self.mirrors.write().expect("cache mirrors poisoned");
-            m.insert(
-                mirror_name.to_string(),
-                MirrorReadiness {
-                    bootstrap_hwm,
-                    caught_up: AtomicBool::new(caught_up),
-                },
-            );
-        }
-        if caught_up {
-            self.recheck_ready();
+    ///
+    /// `last_committed_offset` is the value the supervisor read from
+    /// the broker's `__consumer_offsets` for this group at startup
+    /// (`Source::fetch_committed_offset`). `Some(c)` means the prior
+    /// pod committed through `c` and webhook suppression resumes at
+    /// `c` rather than at `bootstrap_hwm`; `None` is a fresh group
+    /// and suppression uses `bootstrap_hwm`.
+    ///
+    /// `is_main` selects this mirror as the one `cache-v1-main`
+    /// mounts the unprefixed `/cache/v1/...` paths onto; the
+    /// validator enforces at-most-one, so the supervisor's last call
+    /// wins if it ever passes multiple `true`s (defensive — should
+    /// never happen).
+    pub fn register_mirror(
+        &self,
+        mirror_name: &str,
+        bootstrap_hwm: u64,
+        last_committed_offset: Option<u64>,
+        is_main: bool,
+    ) {
+        self.register_mirror_with_topic(
+            mirror_name,
+            bootstrap_hwm,
+            last_committed_offset,
+            is_main,
+            "",
+            0,
+        );
+    }
+
+    /// Same as [`Self::register_mirror`] plus the source identity
+    /// (`topic`, `partition`). The identity is surfaced in the
+    /// [`MirrorStatus::SourceUnassigned`] body so the structured
+    /// readiness response names the partition that disappeared.
+    /// `register_mirror` calls this with placeholder identity so
+    /// tests that don't care can keep the shorter signature.
+    pub fn register_mirror_with_topic(
+        &self,
+        mirror_name: &str,
+        bootstrap_hwm: u64,
+        last_committed_offset: Option<u64>,
+        is_main: bool,
+        topic: &str,
+        partition: u32,
+    ) {
+        // Returning-deploy commit wins when present; otherwise the
+        // fresh-deploy fallback skips historical backlog up to the
+        // broker's high-watermark.
+        let suppression_threshold = last_committed_offset.unwrap_or(bootstrap_hwm);
+        // Empty topic (`bootstrap_hwm = 0`) is immediately ready;
+        // every other case starts in `Warming` and transitions via
+        // `apply_record` / the supervisor's pollers.
+        let initial_status = if bootstrap_hwm == 0 {
+            MirrorStatus::Ready
+        } else {
+            MirrorStatus::Warming
+        };
+        let mut m = self.mirrors.write().expect("cache mirrors poisoned");
+        m.insert(
+            mirror_name.to_string(),
+            MirrorSlot {
+                bootstrap_hwm,
+                suppression_threshold,
+                topic: topic.to_string(),
+                partition,
+                last_applied_offset: AtomicU64::new(0),
+                broker_end_offset: AtomicU64::new(bootstrap_hwm),
+                source_assigned: AtomicBool::new(true),
+                status: RwLock::new(initial_status),
+                view: RwLock::new(IndexMap::new()),
+                offsets: RwLock::new(HashMap::new()),
+            },
+        );
+        drop(m);
+        if is_main {
+            *self
+                .main_mirror
+                .write()
+                .expect("cache main_mirror poisoned") = Some(mirror_name.to_string());
         }
     }
 
-    /// Apply a record from the source consume loop to the in-memory
-    /// view and offset map. The supervisor passes `mirror_name` so we
-    /// can flip the mirror's readiness slot once the bootstrap
-    /// watermark is reached.
+    /// True iff the notify dispatcher should drop a record at
+    /// `source_offset` for `mirror_name`. Compared against the
+    /// per-mirror `suppression_threshold` set at register time. An
+    /// unknown mirror returns `false` (no info, don't suppress) so
+    /// the legacy behaviour of "fire if not registered" is
+    /// preserved.
+    pub fn is_record_suppressed(&self, mirror_name: &str, source_offset: u64) -> bool {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        mirrors
+            .get(mirror_name)
+            .map(|slot| source_offset < slot.suppression_threshold)
+            .unwrap_or(false)
+    }
+
+    /// Apply a record from the source consume loop to the named
+    /// mirror's in-memory view and offset map. Flips the mirror's
+    /// readiness slot once the bootstrap watermark is reached.
     ///
     /// Monotonic: if `record.source_offset` is not strictly greater
-    /// than the partition's last-applied offset (rewind / replay),
-    /// this is a no-op for both the view and the offset map.
+    /// than the partition's last-applied offset on this mirror
+    /// (rewind / replay), the call is a no-op for both the view and
+    /// the offset map.
     pub fn apply_record(&self, mirror_name: &str, record: &Record) {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        let Some(slot) = mirrors.get(mirror_name) else {
+            // No registered slot for this mirror; sinks that route
+            // through a `CacheBinding` are wired to one that always
+            // matches. Treat an unknown name as a no-op rather than
+            // panic so a future refactor that decouples destinations
+            // from registration can't crash the consume loop.
+            return;
+        };
         let tp = TopicPartition {
             topic: record.topic.clone(),
             partition: record.partition as u32,
         };
         {
-            let mut offsets = self.offsets.write().expect("cache offsets poisoned");
+            let mut offsets = slot.offsets.write().expect("mirror offsets poisoned");
             if let Some(&last) = offsets.get(&tp) {
                 if record.source_offset <= last {
                     return; // monotonic guard — never rewind the cache
@@ -158,97 +347,258 @@ impl CacheState {
             // production. Skip silently rather than panicking.
             None => return,
         };
-        let mut view = self.view.write().expect("cache view poisoned");
-        match record.value.as_ref() {
-            Some(v) => {
-                // IndexMap::insert keeps the existing position on
-                // overwrite and appends only on first sighting —
-                // which is the contract clients want for `/keys`
-                // ordering ("new keys appear at the end").
-                view.insert(key, v.clone());
-            }
-            None => {
-                // shift_remove preserves the relative order of the
-                // remaining entries; swap_remove would be faster but
-                // shuffle the trailing key into the gap, breaking
-                // determinism.
-                view.shift_remove(&key);
+        {
+            let mut view = slot.view.write().expect("mirror view poisoned");
+            match record.value.as_ref() {
+                Some(v) => {
+                    // IndexMap::insert keeps the existing position on
+                    // overwrite and appends only on first sighting —
+                    // which is the contract clients want for `/keys`
+                    // ordering ("new keys appear at the end").
+                    view.insert(key, v.clone());
+                }
+                None => {
+                    // shift_remove preserves the relative order of
+                    // the remaining entries; swap_remove would be
+                    // faster but shuffle the trailing key into the
+                    // gap, breaking determinism.
+                    view.shift_remove(&key);
+                }
             }
         }
-        drop(view);
-        // Readiness check after the view update so observers seeing
-        // ready=true also see the record applied.
-        if !self.ready.load(Ordering::Acquire) {
-            self.maybe_flip_mirror_ready(mirror_name, record.source_offset);
-        }
+        // Advance the per-mirror `last_applied_offset` and recompute
+        // the status. Both the per-`TopicPartition` `offsets` map
+        // above and this atom are kept; the atom is what the
+        // readiness predicate reads.
+        slot.last_applied_offset
+            .fetch_max(record.source_offset + 1, Ordering::AcqRel);
+        Self::recompute_status_locked(slot, self.readiness_lag_tolerance);
     }
 
-    fn maybe_flip_mirror_ready(&self, mirror_name: &str, last_offset: u64) {
-        let mut all_ready = true;
-        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
-        if let Some(slot) = mirrors.get(mirror_name) {
-            // The slot can have been flipped to caught_up either by
-            // register (empty topic) or by a previous record on the
-            // same mirror. Either way: once the mirror's
-            // last-applied offset hits `bootstrap_hwm - 1`, flip.
-            if !slot.caught_up.load(Ordering::Acquire) && last_offset + 1 >= slot.bootstrap_hwm {
-                slot.caught_up.store(true, Ordering::Release);
-            }
+    /// Compute the current status of a slot from its atomic
+    /// counters. Called by every input mutator: `apply_record`,
+    /// `set_broker_end_offset`, `mark_source_assigned`. Holds the
+    /// status RwLock briefly.
+    ///
+    /// Order of precedence (highest wins):
+    ///   1. `SourceUnassigned` — the consume loop is effectively dead
+    ///      until the partition reappears in the assignment.
+    ///   2. `Warming` — never caught up to `bootstrap_hwm` since
+    ///      process start.
+    ///   3. `DestinationLagging` — already encoded in the current
+    ///      status by the mirror-bin setter; preserved here so
+    ///      destination-side state doesn't get clobbered by a
+    ///      source-side recompute.
+    ///   4. `LagBehindSource` — lag exceeds tolerance.
+    ///   5. `Ready`.
+    fn recompute_status_locked(slot: &MirrorSlot, tolerance: u64) {
+        let mut current = slot.status.write().expect("status poisoned");
+        // Preserve a destination-lagging signal — only mirror-bin's
+        // destination-lag setter can set or clear that variant. The
+        // source-side recompute leaves it alone so a destination
+        // problem isn't masked by a fresh source-side ack.
+        if matches!(*current, MirrorStatus::DestinationLagging { .. }) {
+            return;
         }
-        for slot in mirrors.values() {
-            if !slot.caught_up.load(Ordering::Acquire) {
-                all_ready = false;
-                break;
-            }
+        if !slot.source_assigned.load(Ordering::Acquire) {
+            *current = MirrorStatus::SourceUnassigned {
+                topic: slot.topic.clone(),
+                partition: slot.partition,
+            };
+            return;
         }
-        drop(mirrors);
-        if all_ready {
-            self.ready.store(true, Ordering::Release);
+        let last_applied = slot.last_applied_offset.load(Ordering::Acquire);
+        let broker_end = slot.broker_end_offset.load(Ordering::Acquire);
+        if last_applied < slot.bootstrap_hwm {
+            *current = MirrorStatus::Warming;
+            return;
+        }
+        let lag = broker_end.saturating_sub(last_applied);
+        if lag > tolerance {
+            *current = MirrorStatus::LagBehindSource { lag };
+        } else {
+            *current = MirrorStatus::Ready;
         }
     }
 
-    fn recheck_ready(&self) {
+    /// Set the broker's current end offset for `mirror_name`. The
+    /// supervisor's end-offset poller (commit 8) calls this every
+    /// `MIRROR_V3_READINESS_POLL_MS`; the resulting recompute may
+    /// flip the slot into [`MirrorStatus::LagBehindSource`] or back
+    /// to [`MirrorStatus::Ready`].
+    pub fn set_broker_end_offset(&self, mirror_name: &str, end_offset: u64) {
         let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
-        let all_ready = mirrors
-            .values()
-            .all(|s| s.caught_up.load(Ordering::Acquire));
-        drop(mirrors);
-        if all_ready {
-            self.ready.store(true, Ordering::Release);
-        }
+        let Some(slot) = mirrors.get(mirror_name) else {
+            return;
+        };
+        // Monotonic — broker end-offset only advances.
+        slot.broker_end_offset
+            .fetch_max(end_offset, Ordering::AcqRel);
+        Self::recompute_status_locked(slot, self.readiness_lag_tolerance);
+    }
+
+    /// Mark the source partition as unassigned. The supervisor's
+    /// assignment poller (commit 8) calls this when
+    /// `consumer.assignment()` no longer includes the mirror's
+    /// partition.
+    pub fn mark_source_unassigned(&self, mirror_name: &str) {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        let Some(slot) = mirrors.get(mirror_name) else {
+            return;
+        };
+        slot.source_assigned.store(false, Ordering::Release);
+        Self::recompute_status_locked(slot, self.readiness_lag_tolerance);
+    }
+
+    /// Mark the source partition as re-assigned. Inverse of
+    /// [`Self::mark_source_unassigned`].
+    pub fn mark_source_assigned(&self, mirror_name: &str) {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        let Some(slot) = mirrors.get(mirror_name) else {
+            return;
+        };
+        slot.source_assigned.store(true, Ordering::Release);
+        Self::recompute_status_locked(slot, self.readiness_lag_tolerance);
+    }
+
+    /// Record that a gating destination is behind. The supervisor's
+    /// per-destination lag check sets this; clearing it requires a
+    /// follow-up call to [`Self::clear_destination_lagging`].
+    pub fn mark_destination_lagging(&self, mirror_name: &str, dest_name: &str, lag: u64) {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        let Some(slot) = mirrors.get(mirror_name) else {
+            return;
+        };
+        let mut s = slot.status.write().expect("status poisoned");
+        *s = MirrorStatus::DestinationLagging {
+            name: dest_name.to_string(),
+            lag,
+        };
+    }
+
+    /// Clear a destination-lagging signal and let the next
+    /// source-side recompute pick a fresh status. The supervisor
+    /// calls this when every gating destination is back within
+    /// tolerance.
+    pub fn clear_destination_lagging(&self, mirror_name: &str) {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        let Some(slot) = mirrors.get(mirror_name) else {
+            return;
+        };
+        // Reset to Warming so the next recompute picks the right
+        // source-side status. Direct write here so the existing
+        // DestinationLagging guard in `recompute_status_locked`
+        // doesn't see a stale DestinationLagging.
+        *slot.status.write().expect("status poisoned") = MirrorStatus::Warming;
+        Self::recompute_status_locked(slot, self.readiness_lag_tolerance);
     }
 
-    /// Cross-cluster readiness gate. Sticky once flipped to `true`.
+    /// Cross-mirror readiness gate. Non-sticky: returns `true` iff
+    /// at least one mirror is registered and every registered
+    /// mirror currently reports [`MirrorStatus::Ready`].
     pub fn is_ready(&self) -> bool {
-        self.ready.load(Ordering::Acquire)
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        !mirrors.is_empty()
+            && mirrors.values().all(|slot| {
+                matches!(
+                    *slot.status.read().expect("status poisoned"),
+                    MirrorStatus::Ready
+                )
+            })
+    }
+
+    /// Per-mirror readiness gate. Returns `true` iff `mirror_name`
+    /// is registered AND its current status is
+    /// [`MirrorStatus::Ready`]. Non-sticky: a mirror that drops out
+    /// of Ready (lag, assignment loss, destination problem) flips
+    /// this to `false`.
+    pub fn is_mirror_ready(&self, mirror_name: &str) -> bool {
+        self.status_for(mirror_name)
+            .is_some_and(|s| matches!(s, MirrorStatus::Ready))
+    }
+
+    /// Snapshot the current status for a registered mirror. Returns
+    /// `None` if the name is unknown. Used by the structured
+    /// `/q/health/ready` body and by tests.
+    pub fn status_for(&self, mirror_name: &str) -> Option<MirrorStatus> {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        mirrors
+            .get(mirror_name)
+            .map(|slot| slot.status.read().expect("status poisoned").clone())
+    }
+
+    /// Snapshot every registered mirror's per-mirror readiness state
+    /// in a single pass. Used by the structured `/q/health/ready`
+    /// HTTP handler and by the per-mirror cache 503 body, both of
+    /// which want a consistent view across mirrors without taking
+    /// the slot lock multiple times.
+    ///
+    /// Entries are emitted in arbitrary order; the caller sorts when
+    /// stable ordering matters (the readiness handler does).
+    pub fn status_snapshot(&self) -> Vec<MirrorStatusSnapshot> {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        mirrors
+            .iter()
+            .map(|(name, slot)| MirrorStatusSnapshot {
+                name: name.clone(),
+                topic: slot.topic.clone(),
+                partition: slot.partition,
+                source_assigned: slot.source_assigned.load(Ordering::Acquire),
+                last_applied_offset: slot.last_applied_offset.load(Ordering::Acquire),
+                broker_end_offset: slot.broker_end_offset.load(Ordering::Acquire),
+                status: slot.status.read().expect("status poisoned").clone(),
+            })
+            .collect()
     }
 
-    /// Lookup for `GET /cache/v1/raw/{key}`. Returns `None` if the
-    /// key is absent (404 territory).
-    pub fn get_value(&self, key: &str) -> Option<Vec<u8>> {
-        let view = self.view.read().expect("cache view poisoned");
+    /// Name of the mirror that opted into `cache-v1-main`, or
+    /// `None` if no mirror selected the singleton. The cache HTTP
+    /// router uses this to decide whether to mount the unprefixed
+    /// `/cache/v1/...` paths and which slot to dispatch them to.
+    pub fn main_mirror(&self) -> Option<String> {
+        self.main_mirror
+            .read()
+            .expect("cache main_mirror poisoned")
+            .clone()
+    }
+
+    /// Lookup for `GET /cache/v1/{mirror}/raw/{key}`. Returns `None`
+    /// when the mirror has no such key (404 territory) and also when
+    /// `mirror_name` is unknown — the HTTP handler maps unknown
+    /// mirrors to 404 anyway, so the call sites stay tight.
+    pub fn get_value_for(&self, mirror_name: &str, key: &str) -> Option<Vec<u8>> {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        let slot = mirrors.get(mirror_name)?;
+        let view = slot.view.read().expect("mirror view poisoned");
         view.get(key).cloned()
     }
 
-    /// Snapshot of every key currently in the merged view, in
-    /// insertion order (first-sighting). Materializes under a single
-    /// read lock so callers see a consistent set.
-    pub fn snapshot_keys(&self) -> Vec<String> {
-        let view = self.view.read().expect("cache view poisoned");
-        view.keys().cloned().collect()
+    /// Snapshot of every key currently in the named mirror's view,
+    /// in insertion order. Returns `None` if the mirror is unknown.
+    pub fn snapshot_keys_for(&self, mirror_name: &str) -> Option<Vec<String>> {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        let slot = mirrors.get(mirror_name)?;
+        let view = slot.view.read().expect("mirror view poisoned");
+        Some(view.keys().cloned().collect())
     }
 
-    /// Snapshot of every value currently in the merged view, in the
-    /// same order as [`snapshot_keys`](Self::snapshot_keys).
-    pub fn snapshot_values(&self) -> Vec<Vec<u8>> {
-        let view = self.view.read().expect("cache view poisoned");
-        view.values().cloned().collect()
+    /// Snapshot of every value in the named mirror's view, in the
+    /// same order as [`Self::snapshot_keys_for`]. `None` for unknown
+    /// mirrors.
+    pub fn snapshot_values_for(&self, mirror_name: &str) -> Option<Vec<Vec<u8>>> {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        let slot = mirrors.get(mirror_name)?;
+        let view = slot.view.read().expect("mirror view poisoned");
+        Some(view.values().cloned().collect())
     }
 
-    /// Last-seen offset for one source (topic, partition), or `None`
-    /// if no record has been applied to that partition yet.
-    pub fn get_offset(&self, topic: &str, partition: u32) -> Option<u64> {
-        let offsets = self.offsets.read().expect("cache offsets poisoned");
+    /// Last-seen offset within `mirror_name` for one source
+    /// (topic, partition). `None` if the mirror is unknown or has
+    /// not seen a record on that partition yet.
+    pub fn get_offset_for(&self, mirror_name: &str, topic: &str, partition: u32) -> Option<u64> {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        let slot = mirrors.get(mirror_name)?;
+        let offsets = slot.offsets.read().expect("mirror offsets poisoned");
         offsets
             .get(&TopicPartition {
                 topic: topic.to_string(),
@@ -257,10 +607,13 @@ impl CacheState {
             .copied()
     }
 
-    /// Snapshot of every `(topic, partition) → offset` entry, sorted
-    /// for deterministic header output.
-    pub fn snapshot_offsets(&self) -> Vec<TopicPartitionOffset> {
-        let offsets = self.offsets.read().expect("cache offsets poisoned");
+    /// Snapshot of `(topic, partition) → offset` entries for the
+    /// named mirror, sorted for deterministic header output. `None`
+    /// if the mirror is unknown.
+    pub fn snapshot_offsets_for(&self, mirror_name: &str) -> Option<Vec<TopicPartitionOffset>> {
+        let mirrors = self.mirrors.read().expect("cache mirrors poisoned");
+        let slot = mirrors.get(mirror_name)?;
+        let offsets = slot.offsets.read().expect("mirror offsets poisoned");
         let mut out: Vec<TopicPartitionOffset> = offsets
             .iter()
             .map(|(tp, off)| TopicPartitionOffset {
@@ -270,7 +623,7 @@ impl CacheState {
             })
             .collect();
         out.sort_by(|a, b| a.topic.cmp(&b.topic).then(a.partition.cmp(&b.partition)));
-        out
+        Some(out)
     }
 }
 
@@ -292,6 +645,34 @@ mod tests {
         }
     }
 
+    #[test]
+    fn is_mirror_ready_reports_per_mirror_status() {
+        // Per-mirror gate is the kkv-v1 notifier's suppression knob:
+        // it lets one mirror start emitting webhooks while another is
+        // still warming up against its bootstrap_hwm. Verify the three
+        // states the notifier cares about: unknown name, registered
+        // but pre-hwm, registered and caught up.
+        let s = CacheState::new();
+        assert!(
+            !s.is_mirror_ready("unknown"),
+            "unknown name must report false so an uninstrumented \
+             notifier can't accidentally fire"
+        );
+        s.register_mirror("warming", 3, None, false);
+        assert!(!s.is_mirror_ready("warming"), "hwm 3, no records yet");
+        s.apply_record("warming", &rec("warming", 0, 0, "k0", Some(b"v")));
+        s.apply_record("warming", &rec("warming", 0, 1, "k1", Some(b"v")));
+        assert!(!s.is_mirror_ready("warming"), "still 1 offset short of hwm");
+        s.apply_record("warming", &rec("warming", 0, 2, "k2", Some(b"v")));
+        assert!(s.is_mirror_ready("warming"), "offset hwm-1 flips the slot");
+        // Independent slot stays at its own state.
+        s.register_mirror("empty", 0, None, false);
+        assert!(
+            s.is_mirror_ready("empty"),
+            "hwm 0 = immediately ready, independent of other mirrors"
+        );
+    }
+
     #[test]
     fn empty_state_starts_not_ready_with_no_mirrors_registered() {
         // With zero registered mirrors there's nothing to wait for;
@@ -299,21 +680,22 @@ mod tests {
         // there's no useful cache yet).
         let s = CacheState::new();
         assert!(!s.is_ready());
-        assert!(s.snapshot_keys().is_empty());
-        assert!(s.snapshot_offsets().is_empty());
+        assert!(s.main_mirror().is_none());
+        assert!(s.snapshot_keys_for("missing").is_none());
+        assert!(s.snapshot_offsets_for("missing").is_none());
     }
 
     #[test]
     fn register_empty_topic_marks_mirror_ready_immediately() {
         let s = CacheState::new();
-        s.register_mirror("ops", 0);
+        s.register_mirror("ops", 0, None, false);
         assert!(s.is_ready(), "empty topic = hwm 0 = immediately ready");
     }
 
     #[test]
     fn readiness_flips_only_after_bootstrap_hwm_reached() {
         let s = CacheState::new();
-        s.register_mirror("ops", 3); // need offsets 0..=2
+        s.register_mirror("ops", 3, None, false); // need offsets 0..=2
         assert!(!s.is_ready());
         s.apply_record("ops", &rec("ops", 0, 0, "k0", Some(b"v0")));
         assert!(!s.is_ready());
@@ -326,8 +708,8 @@ mod tests {
     #[test]
     fn multiple_mirrors_all_must_catch_up() {
         let s = CacheState::new();
-        s.register_mirror("a", 2);
-        s.register_mirror("b", 1);
+        s.register_mirror("a", 2, None, false);
+        s.register_mirror("b", 1, None, false);
         assert!(!s.is_ready());
         s.apply_record("a", &rec("topic-a", 0, 0, "ka0", Some(b"va0")));
         s.apply_record("a", &rec("topic-a", 0, 1, "ka1", Some(b"va1")));
@@ -339,33 +721,33 @@ mod tests {
     #[test]
     fn tombstone_removes_key() {
         let s = CacheState::new();
-        s.register_mirror("ops", 2);
+        s.register_mirror("ops", 2, None, false);
         s.apply_record("ops", &rec("ops", 0, 0, "user-1", Some(br#"{"v":1}"#)));
         assert_eq!(
-            s.get_value("user-1").as_deref(),
+            s.get_value_for("ops", "user-1").as_deref(),
             Some(br#"{"v":1}"#.as_ref())
         );
         s.apply_record("ops", &rec("ops", 0, 1, "user-1", None)); // tombstone
-        assert!(s.get_value("user-1").is_none());
+        assert!(s.get_value_for("ops", "user-1").is_none());
     }
 
     #[test]
     fn rewind_does_not_overwrite_or_remove() {
         let s = CacheState::new();
-        s.register_mirror("ops", 1);
+        s.register_mirror("ops", 1, None, false);
         s.apply_record("ops", &rec("ops", 0, 0, "k", Some(b"first")));
         s.apply_record("ops", &rec("ops", 0, 1, "k", Some(b"second")));
         // Now feed a record with an older offset (simulated rewind).
         s.apply_record("ops", &rec("ops", 0, 0, "k", Some(b"first-again")));
         assert_eq!(
-            s.get_value("k").as_deref(),
+            s.get_value_for("ops", "k").as_deref(),
             Some(b"second".as_ref()),
             "rewind must not overwrite the latest value"
         );
         // Equal-offset record is also rejected.
         s.apply_record("ops", &rec("ops", 0, 1, "k", None));
         assert_eq!(
-            s.get_value("k").as_deref(),
+            s.get_value_for("ops", "k").as_deref(),
             Some(b"second".as_ref()),
             "equal-offset replay must not tombstone"
         );
@@ -374,11 +756,11 @@ mod tests {
     #[test]
     fn snapshot_offsets_is_deterministic_order() {
         let s = CacheState::new();
-        s.register_mirror("m", 10);
+        s.register_mirror("m", 10, None, false);
         s.apply_record("m", &rec("z-topic", 1, 5, "k", Some(b"v")));
         s.apply_record("m", &rec("a-topic", 3, 4, "k2", Some(b"v")));
         s.apply_record("m", &rec("a-topic", 1, 6, "k3", Some(b"v")));
-        let snap = s.snapshot_offsets();
+        let snap = s.snapshot_offsets_for("m").unwrap();
         let order: Vec<_> = snap
             .iter()
             .map(|tpo| (tpo.topic.clone(), tpo.partition))
@@ -396,23 +778,23 @@ mod tests {
     #[test]
     fn snapshot_keys_in_insertion_order() {
         let s = CacheState::new();
-        s.register_mirror("m", 0);
+        s.register_mirror("m", 0, None, false);
         s.apply_record("m", &rec("t", 0, 0, "c", Some(b"v")));
         s.apply_record("m", &rec("t", 0, 1, "a", Some(b"v")));
         s.apply_record("m", &rec("t", 0, 2, "b", Some(b"v")));
-        assert_eq!(s.snapshot_keys(), vec!["c", "a", "b"]);
+        assert_eq!(s.snapshot_keys_for("m").unwrap(), vec!["c", "a", "b"]);
     }
 
     #[test]
     fn overwrite_keeps_position_in_listing() {
         let s = CacheState::new();
-        s.register_mirror("m", 0);
+        s.register_mirror("m", 0, None, false);
         s.apply_record("m", &rec("t", 0, 0, "x", Some(b"v0")));
         s.apply_record("m", &rec("t", 0, 1, "y", Some(b"v1")));
         s.apply_record("m", &rec("t", 0, 2, "x", Some(b"v0-updated")));
-        assert_eq!(s.snapshot_keys(), vec!["x", "y"]);
+        assert_eq!(s.snapshot_keys_for("m").unwrap(), vec!["x", "y"]);
         assert_eq!(
-            s.snapshot_values(),
+            s.snapshot_values_for("m").unwrap(),
             vec![b"v0-updated".to_vec(), b"v1".to_vec()]
         );
     }
@@ -420,11 +802,259 @@ mod tests {
     #[test]
     fn tombstone_preserves_order_of_remaining() {
         let s = CacheState::new();
-        s.register_mirror("m", 0);
+        s.register_mirror("m", 0, None, false);
         s.apply_record("m", &rec("t", 0, 0, "a", Some(b"va")));
         s.apply_record("m", &rec("t", 0, 1, "b", Some(b"vb")));
         s.apply_record("m", &rec("t", 0, 2, "c", Some(b"vc")));
         s.apply_record("m", &rec("t", 0, 3, "b", None)); // tombstone middle
-        assert_eq!(s.snapshot_keys(), vec!["a", "c"]);
+        assert_eq!(s.snapshot_keys_for("m").unwrap(), vec!["a", "c"]);
+    }
+
+    #[test]
+    fn per_mirror_views_are_independent() {
+        // Two mirrors writing through their own slots: a key in
+        // mirror A must not show up in mirror B's view, and an
+        // unregistered mirror name returns None across the board.
+        let s = CacheState::new();
+        s.register_mirror("a", 0, None, false);
+        s.register_mirror("b", 0, None, false);
+        s.apply_record("a", &rec("topic-a", 0, 0, "k-a", Some(b"va")));
+        s.apply_record("b", &rec("topic-b", 0, 0, "k-b", Some(b"vb")));
+        assert_eq!(s.get_value_for("a", "k-a").as_deref(), Some(b"va".as_ref()));
+        assert!(s.get_value_for("a", "k-b").is_none());
+        assert_eq!(s.get_value_for("b", "k-b").as_deref(), Some(b"vb".as_ref()));
+        assert!(s.get_value_for("missing", "anything").is_none());
+        assert!(s.snapshot_keys_for("missing").is_none());
+    }
+
+    #[test]
+    fn register_mirror_tracks_main_mirror_singleton() {
+        let s = CacheState::new();
+        assert!(s.main_mirror().is_none());
+        s.register_mirror("ops", 0, None, false);
+        assert!(
+            s.main_mirror().is_none(),
+            "is_main=false does not assign the singleton"
+        );
+        s.register_mirror("users", 0, None, true);
+        assert_eq!(s.main_mirror().as_deref(), Some("users"));
+    }
+}
+
+#[cfg(test)]
+mod threshold_tests {
+    use super::*;
+
+    #[test]
+    fn fresh_deploy_suppresses_below_bootstrap_hwm() {
+        let s = CacheState::new();
+        s.register_mirror("m", 10, None, false);
+        for off in 0..10 {
+            assert!(
+                s.is_record_suppressed("m", off),
+                "fresh deploy must suppress offset {off} (< hwm 10)"
+            );
+        }
+        assert!(
+            !s.is_record_suppressed("m", 10),
+            "offset == hwm must NOT be suppressed (first live record)"
+        );
+        assert!(!s.is_record_suppressed("m", 50));
+    }
+
+    #[test]
+    fn returning_deploy_suppresses_below_committed_offset() {
+        let s = CacheState::new();
+        s.register_mirror("m", 10, Some(5), false);
+        for off in 0..5 {
+            assert!(
+                s.is_record_suppressed("m", off),
+                "returning deploy must suppress offset {off} below committed 5"
+            );
+        }
+        for off in 5..15 {
+            assert!(
+                !s.is_record_suppressed("m", off),
+                "offset {off} must fire (>= committed 5)"
+            );
+        }
+    }
+
+    #[test]
+    fn unknown_mirror_is_not_suppressed() {
+        let s = CacheState::new();
+        assert!(
+            !s.is_record_suppressed("never-registered", 0),
+            "unknown mirror returns false (no info, don't suppress)"
+        );
+    }
+
+    #[test]
+    fn empty_topic_no_committed_suppresses_nothing() {
+        let s = CacheState::new();
+        s.register_mirror("m", 0, None, false);
+        assert!(!s.is_record_suppressed("m", 0));
+        assert!(!s.is_record_suppressed("m", 99));
+    }
+}
+
+#[cfg(test)]
+mod status_transition_tests {
+    use super::*;
+
+    fn rec(topic: &str, partition: i32, offset: u64, key: &str) -> Record {
+        Record {
+            topic: topic.into(),
+            partition,
+            source_offset: offset,
+            timestamp_ms: Some(1_700_000_000_000),
+            timestamp_type: crate::TimestampType::CreateTime,
+            key: Some(key.as_bytes().to_vec()),
+            value: Some(b"v".to_vec()),
+            headers: Vec::<crate::Header>::new(),
+        }
+    }
+
+    #[test]
+    fn empty_topic_starts_ready() {
+        let s = CacheState::new();
+        s.register_mirror_with_topic("m", 0, None, false, "t", 0);
+        assert_eq!(s.status_for("m"), Some(MirrorStatus::Ready));
+        assert!(s.is_mirror_ready("m"));
+        assert!(s.is_ready(), "aggregate is true once every mirror is Ready");
+    }
+
+    #[test]
+    fn non_empty_topic_starts_warming_and_flips_on_catch_up() {
+        let s = CacheState::new();
+        s.register_mirror_with_topic("m", 5, None, false, "t", 0);
+        assert_eq!(s.status_for("m"), Some(MirrorStatus::Warming));
+        assert!(!s.is_mirror_ready("m"));
+
+        // Apply offsets 0..3 — still Warming because last_applied (= 4 after offset 3 sets `last_applied_offset = 4`) is below bootstrap_hwm 5.
+        for off in 0..4 {
+            s.apply_record("m", &rec("t", 0, off, &format!("k{off}")));
+        }
+        assert_eq!(s.status_for("m"), Some(MirrorStatus::Warming));
+
+        // Apply offset 4 — last_applied = 5, which equals bootstrap_hwm → Ready.
+        s.apply_record("m", &rec("t", 0, 4, "k4"));
+        assert_eq!(s.status_for("m"), Some(MirrorStatus::Ready));
+        assert!(s.is_mirror_ready("m"));
+    }
+
+    #[test]
+    fn poller_pushes_lag_then_recovers() {
+        // After warming, the broker advances. With tolerance=0, even
+        // one offset of lag flips the slot to LagBehindSource. A
+        // follow-up apply_record at the new end offset recovers to
+        // Ready.
+        let s = CacheState::new();
+        s.register_mirror_with_topic("m", 1, None, false, "t", 0);
+        s.apply_record("m", &rec("t", 0, 0, "k0")); // catch up; last_applied = 1
+        assert_eq!(s.status_for("m"), Some(MirrorStatus::Ready));
+
+        s.set_broker_end_offset("m", 5);
+        assert_eq!(
+            s.status_for("m"),
+            Some(MirrorStatus::LagBehindSource { lag: 4 })
+        );
+        assert!(!s.is_mirror_ready("m"));
+        assert!(!s.is_ready());
+
+        s.apply_record("m", &rec("t", 0, 1, "k1"));
+        s.apply_record("m", &rec("t", 0, 2, "k2"));
+        s.apply_record("m", &rec("t", 0, 3, "k3"));
+        s.apply_record("m", &rec("t", 0, 4, "k4"));
+        assert_eq!(s.status_for("m"), Some(MirrorStatus::Ready));
+        assert!(s.is_mirror_ready("m"));
+    }
+
+    #[test]
+    fn source_unassigned_overrides_other_states() {
+        let s = CacheState::new();
+        s.register_mirror_with_topic("m", 0, None, false, "user-states", 7);
+        assert_eq!(s.status_for("m"), Some(MirrorStatus::Ready));
+
+        s.mark_source_unassigned("m");
+        match s.status_for("m") {
+            Some(MirrorStatus::SourceUnassigned { topic, partition }) => {
+                assert_eq!(topic, "user-states");
+                assert_eq!(partition, 7);
+            }
+            other => panic!("expected SourceUnassigned, got {other:?}"),
+        }
+        assert!(!s.is_mirror_ready("m"));
+
+        // Source comes back; recompute returns to Ready (empty
+        // topic, no lag).
+        s.mark_source_assigned("m");
+        assert_eq!(s.status_for("m"), Some(MirrorStatus::Ready));
+    }
+
+    #[test]
+    fn destination_lagging_is_set_and_cleared_externally() {
+        let s = CacheState::new();
+        s.register_mirror_with_topic("m", 0, None, false, "t", 0);
+        assert_eq!(s.status_for("m"), Some(MirrorStatus::Ready));
+
+        s.mark_destination_lagging("m", "users-gcs", 42);
+        match s.status_for("m") {
+            Some(MirrorStatus::DestinationLagging { name, lag }) => {
+                assert_eq!(name, "users-gcs");
+                assert_eq!(lag, 42);
+            }
+            other => panic!("expected DestinationLagging, got {other:?}"),
+        }
+        assert!(!s.is_mirror_ready("m"));
+
+        // An incoming apply_record must NOT clobber DestinationLagging.
+        s.apply_record("m", &rec("t", 0, 0, "k0"));
+        assert!(matches!(
+            s.status_for("m"),
+            Some(MirrorStatus::DestinationLagging { .. })
+        ));
+
+        // Clearing returns to source-side state.
+        s.clear_destination_lagging("m");
+        assert_eq!(s.status_for("m"), Some(MirrorStatus::Ready));
+    }
+
+    #[test]
+    fn aggregate_is_ready_ands_every_slot() {
+        let s = CacheState::new();
+        s.register_mirror_with_topic("ready", 0, None, false, "t1", 0);
+        s.register_mirror_with_topic("warming", 5, None, false, "t2", 0);
+        assert!(
+            !s.is_ready(),
+            "aggregate is false while one slot is Warming"
+        );
+        for off in 0..5 {
+            s.apply_record("warming", &rec("t2", 0, off, &format!("k{off}")));
+        }
+        assert!(s.is_ready(), "aggregate flips to true when both Ready");
+    }
+
+    #[test]
+    fn aggregate_is_not_ready_when_no_mirrors_are_registered() {
+        let s = CacheState::new();
+        assert!(
+            !s.is_ready(),
+            "aggregate is false when nothing has been registered"
+        );
+    }
+
+    #[test]
+    fn lag_tolerance_lets_a_small_lag_stay_ready() {
+        let s = CacheState::new().with_readiness_lag_tolerance(10);
+        s.register_mirror_with_topic("m", 1, None, false, "t", 0);
+        s.apply_record("m", &rec("t", 0, 0, "k0")); // Ready, lag=0
+        s.set_broker_end_offset("m", 8); // lag=7 <= 10
+        assert_eq!(s.status_for("m"), Some(MirrorStatus::Ready));
+        s.set_broker_end_offset("m", 100); // lag=99 > 10
+        assert_eq!(
+            s.status_for("m"),
+            Some(MirrorStatus::LagBehindSource { lag: 99 })
+        );
     }
 }
diff --git a/crates/mirror-core/src/lib.rs b/crates/mirror-core/src/lib.rs
index e956cab..2feece5 100644
--- a/crates/mirror-core/src/lib.rs
+++ b/crates/mirror-core/src/lib.rs
@@ -15,19 +15,22 @@
 //!    `next_expected_offset()` and require it to still equal what we
 //!    expect. This catches external topic resets / out-of-band writes.
 
+use std::sync::Arc;
+
 use async_trait::async_trait;
 use thiserror::Error;
 
 pub mod cache;
 pub mod mock;
 pub mod tee;
+pub mod testing;
 
-pub use cache::{CacheBinding, CacheState};
+pub use cache::{CacheBinding, CacheState, MirrorStatus, MirrorStatusSnapshot};
 pub use tee::TeeSink;
 
 /// Per-mirror Prometheus labels. `topic` and `partition` together
 /// uniquely identify the data stream and join cleanly with broker-
-/// side exporters (kafka_exporter, etc.) — the mirror's operator-
+/// side exporters (kafka_exporter, etc.) - the mirror's operator-
 /// chosen `name` is *not* a metric label, it lives in `tracing`
 /// logs only.
 #[derive(Debug, Clone)]
@@ -210,7 +213,7 @@ pub trait Source: Send {
     async fn seek(&mut self, next_offset: u64) -> Result<(), SourceError>;
 
     /// Wait up to an implementation-defined poll timeout for the next
-    /// record. `Ok(None)` means the window elapsed without one — the
+    /// record. `Ok(None)` means the window elapsed without one - the
     /// loop will use that as a heartbeat to revalidate the sink.
     async fn poll_one(&mut self) -> Result<Option<Record>, SourceError>;
 
@@ -223,10 +226,59 @@ pub trait Source: Send {
     async fn low_watermark(&mut self) -> Result<u64, SourceError> {
         Ok(0)
     }
+
+    /// Highest offset still retained by the source (Kafka "high
+    /// watermark"; i.e. `last_offset + 1` if the source has any
+    /// records, or `0` if it's empty). The run loop doesn't query
+    /// this today - the default `Ok(u64::MAX)` is the
+    /// "always-satisfiable" sentinel, so future spec changes (e.g.
+    /// "fatal if sink_next_expected > source_high_watermark") can be
+    /// added without breaking sources that don't implement it.
+    ///
+    /// Implementations should query the broker rather than caching
+    /// (same contract as [`Self::low_watermark`]). The Kafka source
+    /// wraps the existing `mirror_kafka::fetch_high_watermark` helper.
+    async fn high_watermark(&mut self) -> Result<u64, SourceError> {
+        Ok(u64::MAX)
+    }
+
+    /// Mark every source offset strictly below `through` as
+    /// processed. For Kafka, this stages the offset for a subsequent
+    /// `commit_consumer_state` call so a restart of the same
+    /// `group.id` resumes there rather than at the broker's high
+    /// watermark.
+    ///
+    /// Implementations should buffer in memory; the actual broker
+    /// write is driven by the supervisor's periodic commit task. The
+    /// default no-op is correct for mocks and any source without a
+    /// notion of committed state.
+    ///
+    /// Idempotent: callers may pass the same `through` repeatedly.
+    /// Monotonic: implementations must ignore a `through` value
+    /// lower than the last one observed (the supervisor only ever
+    /// advances forward, but the contract makes that explicit so a
+    /// buggy caller can't rewind committed state).
+    async fn commit_through(&mut self, through: u64) -> Result<(), SourceError> {
+        let _ = through;
+        Ok(())
+    }
+
+    /// Read the broker's `__consumer_offsets` for this source's
+    /// (`group.id`, topic, partition). Used at startup to seed the
+    /// suppression threshold and the readiness gate. `Ok(None)`
+    /// means "no committed offset yet" (a fresh group); the default
+    /// is `Ok(None)` for mocks and any source without committed
+    /// state.
+    ///
+    /// Not part of the run loop's hot path; called once per mirror
+    /// at supervisor startup.
+    async fn fetch_committed_offset(&mut self) -> Result<Option<u64>, SourceError> {
+        Ok(None)
+    }
 }
 
 /// A destination for exactly-once mirroring. The sink owns the truth
-/// about "where we are" — the loop trusts `next_expected_offset`.
+/// about "where we are" - the loop trusts `next_expected_offset`.
 #[async_trait]
 pub trait Sink: Send {
     /// The source offset the destination will accept next. Must be
@@ -292,8 +344,132 @@ pub trait Sink: Send {
         let _ = low_watermark;
         Ok(())
     }
+
+    /// Install a [`FlushObserver`] that will be invoked every time
+    /// this sink durably commits a batch. Used by the
+    /// `notify.trigger.on: destination-flush` dispatch path to learn
+    /// when records are durable on the destination side without
+    /// scraping logs or polling `next_expected_offset`.
+    ///
+    /// Default no-op - sinks without observable flushes (Kafka,
+    /// mocks, in-memory) keep this default and the observer simply
+    /// never fires for them. Blob sinks (FS, S3) override and call
+    /// `observer.on_flushed(from, to)` after every successful
+    /// flush, where `to` is the highest source offset in the
+    /// just-flushed batch and `from` is the lowest. Only one
+    /// observer is supported per sink instance; later installs
+    /// replace earlier ones.
+    fn set_flush_observer(&mut self, _observer: Arc<dyn FlushObserver>) {}
+
+    /// Install a [`WriteObserver`] that fires after every successful
+    /// `write`. Default no-op for sinks where the per-record signal
+    /// is uninteresting or already covered by [`FlushObserver`]
+    /// (FS/S3 buffer multiple records into one flush; the flush
+    /// observer is the right granularity there). Kafka destination
+    /// sinks override and fire on every accepted record, so the
+    /// supervisor's per-destination ack tracker advances per write.
+    fn set_write_observer(&mut self, _observer: Arc<dyn WriteObserver>) {}
+}
+
+/// Observer notified when a sink durably commits a batch. Lives in
+/// `mirror-core` so [`Sink`] implementations (blob and tee) can
+/// invoke it without depending on the notify crate. The webhook
+/// dispatcher in `mirror-notify-kkv` implements this trait.
+///
+/// Synchronous on purpose: a flush is rare relative to records, and
+/// the observer is expected to do something cheap - typically
+/// enqueueing the `(from, to)` pair into an `mpsc` channel that a
+/// dedicated async task drains. Doing the HTTP POST inline would
+/// block the flush path and serialise destinations behind the
+/// receiver's latency.
+pub trait FlushObserver: Send + Sync {
+    /// `from` is the lowest source offset in the just-flushed batch
+    /// (inclusive). `to` is the highest (inclusive). For a tee over
+    /// multiple inner sinks the values are the *combined* advance
+    /// (the min across inner sinks); the observer fires only when
+    /// that min strictly increases.
+    fn on_flushed(&self, from: u64, to: u64);
+}
+
+/// Observer notified after a sink successfully writes a record.
+/// Parallel to [`FlushObserver`] but for per-record signals; Kafka
+/// destination sinks fire this after each accepted produce. Blob
+/// sinks buffer writes so they use `FlushObserver` instead.
+///
+/// Synchronous; implementations are expected to do something cheap
+/// (typically: bump an `AtomicU64` on the supervisor's per-
+/// destination ack tracker).
+pub trait WriteObserver: Send + Sync {
+    /// `source_offset` is the offset the record carried; the
+    /// destination is durable through `source_offset + 1` by the
+    /// time this fires.
+    fn on_written(&self, source_offset: u64);
+}
+
+/// Acknowledgement sink. Receives "everything strictly below
+/// `through` has been delivered" signals from either:
+/// * a notify dispatcher (after a successful drain / POST), or
+/// * a supervisor-installed [`FlushObserver`] / [`WriteObserver`]
+///   shim that translates per-destination flush / write events into
+///   `note_through` calls.
+///
+/// The supervisor's per-mirror ack tracker is the canonical
+/// implementation. The trait lives in `mirror-core` so notify
+/// dispatchers (in `mirror-notify-kkv`) can take a
+/// `Box<dyn AckSink>` without depending on `mirror-bin`.
+///
+/// Synchronous and idempotent. Implementations must guard against
+/// regressions (callers may not be monotonic at the trait surface;
+/// the AckTracker keeps a running maximum).
+pub trait AckSink: Send + Sync {
+    fn note_through(&self, through: u64);
+}
+
+/// Per-mirror observer of records as they flow through the loop.
+/// Used to drive the opt-in `api: kkv-v1` outbound webhook surface
+/// (see `WEBHOOKS.md`) without coupling the run loop to HTTP.
+///
+/// Contract:
+/// - `on_record` is called **after** `sink.write(record)` succeeds.
+///   The loop has already validated the source-offset gate, so the
+///   record is guaranteed to be at the destination's authoritative
+///   next-offset. A `NotifyError` returned here aborts the loop and
+///   surfaces as [`MirrorError::Notify`] - same fail-fast contract as
+///   [`SinkError`].
+/// - `shutdown` is called once on graceful exit, after the final
+///   `sink.flush`. Implementations should drain any buffered webhook
+///   batches synchronously before returning.
+///
+/// Implementations live outside `mirror-core` so this crate stays
+/// HTTP-free. The default impl (no-op) is used by every mirror that
+/// doesn't opt into a `notify:` block in config.
+#[async_trait]
+pub trait Notifier: Send {
+    /// Observe a record that was just successfully written to the
+    /// destination chain. `record` carries the same fields the sink
+    /// saw; implementations should clone what they need and return
+    /// promptly so they don't block the consume loop.
+    async fn on_record(&mut self, record: &Record) -> Result<(), NotifyError> {
+        let _ = record;
+        Ok(())
+    }
+
+    /// Called once on graceful shutdown, after the final `sink.flush`.
+    /// Implementations with debounce/buffer state should flush it here.
+    async fn shutdown(&mut self) -> Result<(), NotifyError> {
+        Ok(())
+    }
 }
 
+/// Zero-cost [`Notifier`] used by every mirror that doesn't configure
+/// a `notify:` block. Keeps the run loop's signature generic without
+/// forcing every caller to plumb a real notifier.
+#[derive(Debug, Default, Clone, Copy)]
+pub struct NoOpNotifier;
+
+#[async_trait]
+impl Notifier for NoOpNotifier {}
+
 #[derive(Debug, Error)]
 pub enum SourceError {
     #[error("source transport: {0}")]
@@ -308,12 +484,29 @@ pub enum SinkError {
     Transport(String),
 }
 
+/// Error produced by a [`Notifier`]. `Transport` carries a single
+/// underlying failure (timeout, connrefused, http status…); `Exhausted`
+/// signals that the retry budget was spent without success - the
+/// `final` action in the `notify.outcomes.*` config table (`fail` for
+/// this variant) decides whether the run loop should propagate the
+/// error up. The notifier itself encodes that decision: an `accept` /
+/// `skip` outcome simply returns `Ok(())` and never surfaces here.
+#[derive(Debug, Error)]
+pub enum NotifyError {
+    #[error("notify transport: {0}")]
+    Transport(String),
+    #[error("notify retries exhausted after {attempts} attempt(s): {last_error}")]
+    Exhausted { attempts: u32, last_error: String },
+}
+
 #[derive(Debug, Error)]
 pub enum MirrorError {
     #[error(transparent)]
     Source(#[from] SourceError),
     #[error(transparent)]
     Sink(#[from] SinkError),
+    #[error(transparent)]
+    Notify(#[from] NotifyError),
     /// Source delivered an offset *below* `expected`. Always a hard
     /// error: a Kafka client bug, a producer that rewound, or a
     /// destination chain that has somehow advanced past the broker.
@@ -322,7 +515,7 @@ pub enum MirrorError {
     /// Source delivered an offset *above* `expected`. Hard error in
     /// append mode (would leave a gap in the destination chain).
     /// Recoverable under `compaction: log`: the run loop aligns the
-    /// sink to the delivered offset and continues — the broker's
+    /// sink to the delivered offset and continues - the broker's
     /// `LogStartOffset` reports 0 for a `cleanup.policy=compact`
     /// topic even when the earliest deliverable record is much later
     /// (compaction deduplicates by key but does not advance the
@@ -340,7 +533,7 @@ pub enum MirrorError {
     /// next-expected-offset, and the sink is not willing to skip
     /// records (i.e. it's not a compaction:log destination). This
     /// fires at bootstrap on a compacted or delete-records-trimmed
-    /// source topic when the mirror is configured for append mode —
+    /// source topic when the mirror is configured for append mode -
     /// it would leave a gap in the destination chain, which append
     /// mode forbids.
     #[error(
@@ -357,7 +550,7 @@ pub enum MirrorError {
 }
 
 /// How often the loop emits an INFO-level "heartbeat" log line. This
-/// is the operator's `kubectl logs` heartbeat — without it, a quiet
+/// is the operator's `kubectl logs` heartbeat - without it, a quiet
 /// mirror (no source traffic, or buffered records that haven't
 /// tripped a flush trigger yet) looks indistinguishable from a stuck
 /// one. Override via the `MIRROR_V3_HEARTBEAT_SECS` env var; set to
@@ -384,7 +577,9 @@ pub fn heartbeat_interval_from_env() -> std::time::Duration {
 ///
 /// Heartbeat interval is read from the environment; pass a fixed
 /// interval via [`run_mirror_with_heartbeat`] if you need explicit
-/// control (e.g. tests that want to disable heartbeats).
+/// control (e.g. tests that want to disable heartbeats). Callers that
+/// need to observe records (e.g. webhook fan-out) use
+/// [`run_mirror_with_notifier`].
 pub async fn run_mirror<S, K, F>(source: S, sink: K, shutdown: F) -> Result<(), MirrorError>
 where
     S: Source,
@@ -395,14 +590,37 @@ where
 }
 
 pub async fn run_mirror_with_heartbeat<S, K, F>(
+    source: S,
+    sink: K,
+    shutdown: F,
+    heartbeat_interval: std::time::Duration,
+) -> Result<(), MirrorError>
+where
+    S: Source,
+    K: Sink,
+    F: std::future::Future<Output = ()> + Send,
+{
+    run_mirror_with_notifier(source, sink, NoOpNotifier, shutdown, heartbeat_interval).await
+}
+
+/// Same as [`run_mirror_with_heartbeat`] but with a caller-supplied
+/// [`Notifier`]. The loop calls `notifier.on_record(&record)` after
+/// every successful `sink.write`, and `notifier.shutdown()` once after
+/// the final `sink.flush` on graceful exit. `NotifyError`s propagate
+/// as [`MirrorError::Notify`] and abort the loop - the notifier itself
+/// is responsible for distinguishing "retryable, eventually accept"
+/// from "fail loudly" per the `notify.outcomes.*` table.
+pub async fn run_mirror_with_notifier<S, K, N, F>(
     mut source: S,
     mut sink: K,
+    mut notifier: N,
     shutdown: F,
     heartbeat_interval: std::time::Duration,
 ) -> Result<(), MirrorError>
 where
     S: Source,
     K: Sink,
+    N: Notifier,
     F: std::future::Future<Output = ()> + Send,
 {
     let sink_start = sink.next_expected_offset().await?;
@@ -484,6 +702,7 @@ where
             _ = &mut shutdown => {
                 tracing::info!("shutdown requested; flushing sink");
                 sink.flush().await?;
+                notifier.shutdown().await?;
                 return Ok(());
             }
             _ = async {
@@ -546,7 +765,7 @@ where
                                 // log level here scales with millions
                                 // of lines per restart. Observability
                                 // for gap rate is the dedicated
-                                // counter below — plot a rate or
+                                // counter below - plot a rate or
                                 // alert on a threshold rather than
                                 // reading logs. The startup `loop
                                 // start … compaction="log"` INFO
@@ -567,6 +786,12 @@ where
                                 });
                             }
                         }
+                        // Clone the record so the notifier can observe
+                        // it after the sink has consumed ownership.
+                        // One clone per accepted record is dwarfed by
+                        // the sink I/O cost; if profiling ever flags
+                        // it, add a `Notifier::wants_records` gate.
+                        let record_for_notify = record.clone();
                         sink.write(record).await?;
                         expected = expected
                             .checked_add(1)
@@ -586,6 +811,11 @@ where
                             "partition" => partition.clone(),
                         )
                         .increment(1);
+                        // Notifier observes only after the destination
+                        // chain has accepted the record. A failure
+                        // here aborts the loop and surfaces as
+                        // `MirrorError::Notify`.
+                        notifier.on_record(&record_for_notify).await?;
                     }
                     None => {
                         let current = sink.next_expected_offset().await?;
@@ -635,7 +865,7 @@ mod column_type_tests {
 
     #[test]
     fn json_does_not_parse_payload() {
-        // Valid UTF-8 but not parseable JSON — Json must accept it.
+        // Valid UTF-8 but not parseable JSON - Json must accept it.
         assert!(ColumnType::Json
             .validate("value", 0, Some(b"{this is not json"))
             .is_ok());
diff --git a/crates/mirror-core/src/mock.rs b/crates/mirror-core/src/mock.rs
index 26bf151..f4f9bc2 100644
--- a/crates/mirror-core/src/mock.rs
+++ b/crates/mirror-core/src/mock.rs
@@ -1,13 +1,14 @@
 //! Hand-written mocks for testing the mirror loop.
 //!
-//! These are public so downstream crates (notably the e2e harness in
-//! Phase 2) can reuse them, but the API is `#[doc(hidden)]`-ish: it
-//! exists to be shaped by the tests next to it.
+//! These are public so downstream crates (notably the e2e harness)
+//! can reuse them, but the API is `#[doc(hidden)]`-ish: it exists to
+//! be shaped by the tests next to it.
 
 use async_trait::async_trait;
 use std::collections::VecDeque;
+use std::sync::Arc;
 
-use crate::{Record, Sink, SinkError, Source, SourceError, TimestampType};
+use crate::{Record, Sink, SinkError, Source, SourceError, TimestampType, WriteObserver};
 
 /// Scriptable [`Source`] that returns canned events. Records seek
 /// calls and poll results so tests can assert on them.
@@ -15,6 +16,7 @@ pub struct MockSource {
     events: VecDeque<MockSourceEvent>,
     pub seeks: Vec<u64>,
     pub low_watermark: u64,
+    pub high_watermark: u64,
 }
 
 pub enum MockSourceEvent {
@@ -34,6 +36,10 @@ impl MockSource {
             events: events.into_iter().collect(),
             seeks: Vec::new(),
             low_watermark: 0,
+            // Default `u64::MAX` matches the trait's default; no
+            // spec currently rejects on HWM, so the sentinel value
+            // is "always satisfiable."
+            high_watermark: u64::MAX,
         }
     }
 
@@ -43,6 +49,16 @@ impl MockSource {
         self.low_watermark = low_watermark;
         self
     }
+
+    /// Configure the value returned by [`Source::high_watermark`].
+    /// Used by tests for spec changes that introduce a "sink can't
+    /// exceed source HWM" gate. The default is `u64::MAX` (the
+    /// trait's "always-satisfiable" sentinel) so unrelated tests
+    /// aren't affected.
+    pub fn with_high_watermark(mut self, high_watermark: u64) -> Self {
+        self.high_watermark = high_watermark;
+        self
+    }
 }
 
 #[async_trait]
@@ -68,6 +84,10 @@ impl Source for MockSource {
     async fn low_watermark(&mut self) -> Result<u64, SourceError> {
         Ok(self.low_watermark)
     }
+
+    async fn high_watermark(&mut self) -> Result<u64, SourceError> {
+        Ok(self.high_watermark)
+    }
 }
 
 async fn futures_pending() {
@@ -100,6 +120,10 @@ pub struct MockSink {
     /// to false (append-mode behaviour) and is set true by tests
     /// simulating a compaction:log destination.
     pub allows_compacted_source: bool,
+    /// Observer fired after every successful `write`. Tests use this
+    /// to assert the per-write ack hook is wired correctly through
+    /// whichever code path is under test.
+    pub write_observer: Option<Arc<dyn WriteObserver>>,
 }
 
 impl MockSink {
@@ -110,6 +134,7 @@ impl MockSink {
             write_error: None,
             running_position: offset,
             allows_compacted_source: false,
+            write_observer: None,
         }
     }
 
@@ -153,8 +178,12 @@ impl Sink for MockSink {
                 actual: record.source_offset,
             });
         }
+        let offset = record.source_offset;
         self.running_position += 1;
         self.writes.push(record);
+        if let Some(obs) = self.write_observer.as_ref() {
+            obs.on_written(offset);
+        }
         Ok(())
     }
 
@@ -168,6 +197,10 @@ impl Sink for MockSink {
         self.running_position = low_watermark;
         Ok(())
     }
+
+    fn set_write_observer(&mut self, observer: Arc<dyn WriteObserver>) {
+        self.write_observer = Some(observer);
+    }
 }
 
 /// Convenience constructor for tests.
diff --git a/crates/mirror-core/src/tee.rs b/crates/mirror-core/src/tee.rs
index 3fdbccb..82a58a4 100644
--- a/crates/mirror-core/src/tee.rs
+++ b/crates/mirror-core/src/tee.rs
@@ -1,4 +1,4 @@
-//! `TeeSink` — fan one source consumer's records out to N inner sinks
+//! `TeeSink`: fan one source consumer's records out to N inner sinks
 //! while preserving every inner sink's end-offset invariant.
 //!
 //! ## Why "per-sink heads"
@@ -8,7 +8,7 @@
 //! per-record. At any wall-clock moment three concurrent sinks fed
 //! from the same loop have **different durable positions**. Restart
 //! from that heterogeneous state would crash any inner sink that
-//! couldn't silently drop re-presented records — the Kafka end-offset
+//! couldn't silently drop re-presented records; the Kafka end-offset
 //! gate, in particular, would refuse.
 //!
 //! `TeeSink` solves this by tracking a `head` per inner sink. The tee
@@ -44,11 +44,13 @@
 //! is returned. The supervisor exits non-zero, but the surviving
 //! sinks' tails are durable.
 
+use std::sync::Arc;
+
 use async_trait::async_trait;
 use futures::future::join_all;
 
 use crate::cache::CacheBinding;
-use crate::{Record, Sink, SinkError};
+use crate::{FlushObserver, Record, Sink, SinkError};
 
 /// One inner sink plus the source offset it will accept next.
 struct InnerSink {
@@ -70,7 +72,7 @@ impl TeeSink {
     /// starting head. The optional cache binding is applied (once
     /// per record) at the top of [`Self::write`].
     ///
-    /// `names` must be unique and in the same order as `sinks` — they
+    /// `names` must be unique and in the same order as `sinks`; they
     /// appear in error/heartbeat logs so an operator can attribute a
     /// per-sink failure back to the destination element in YAML.
     pub async fn open(
@@ -123,7 +125,7 @@ impl Sink for TeeSink {
     async fn next_expected_offset(&mut self) -> Result<u64, SinkError> {
         // Re-query every inner sink so the per-sink heads stay
         // honest. This is only called at startup and on idle by the
-        // run loop, so the O(N) query cost is bounded — it doesn't
+        // run loop, so the O(N) query cost is bounded; it doesn't
         // run per record.
         for inner in self.inners.iter_mut() {
             let head = inner.sink.next_expected_offset().await?;
@@ -174,7 +176,7 @@ impl Sink for TeeSink {
 
         // Concurrent write fanout. We `join_all` over per-sink
         // futures so the slowest inner sink's per-record latency
-        // dominates the tee's per-record cost — sequential calls
+        // dominates the tee's per-record cost; sequential calls
         // would 1000× the fast sinks' wait time for no reason.
         let mut futs = Vec::with_capacity(indices.len());
         // Take the slots' sinks temporarily so we can drive them
@@ -220,7 +222,7 @@ impl Sink for TeeSink {
 
     async fn flush(&mut self) -> Result<(), SinkError> {
         // Concurrent flush. Per-sink errors are logged; the first
-        // error is returned. The other sinks still flush — losing
+        // error is returned. The other sinks still flush; losing
         // sink A's tail buffer should not cost us sink B's tail too.
         let mut futs = Vec::with_capacity(self.inners.len());
         let mut taken: Vec<(usize, String, Box<dyn Sink>)> = Vec::with_capacity(self.inners.len());
@@ -302,6 +304,97 @@ impl Sink for TeeSink {
         }
         Ok(())
     }
+
+    fn set_flush_observer(&mut self, observer: Arc<dyn FlushObserver>) {
+        if self.inners.len() == 1 {
+            // Length-1 tee (the common case for single-destination
+            // mirrors): forward the observer to the only inner sink
+            // unchanged. `from`/`to` flow through verbatim.
+            self.inners[0].sink.set_flush_observer(observer);
+            return;
+        }
+        // Multi-destination: wrap the outer observer with a per-sink
+        // relay + a min-coordinator. The outer observer fires only
+        // when *every* inner sink has committed past a watermark -
+        // matching the spec's "fire when ALL destinations have
+        // committed past the batch's high-water offset".
+        let coordinator = Arc::new(MinFlushCoordinator::new(self.inners.len(), observer));
+        for (sink_index, inner) in self.inners.iter_mut().enumerate() {
+            inner.sink.set_flush_observer(Arc::new(PerSinkRelay {
+                sink_index,
+                coordinator: Arc::clone(&coordinator),
+            }));
+        }
+    }
+}
+
+/// Per-sink wrapper that funnels every inner sink's `on_flushed`
+/// into the shared [`MinFlushCoordinator`]. Used only when the tee
+/// has more than one inner sink.
+struct PerSinkRelay {
+    sink_index: usize,
+    coordinator: Arc<MinFlushCoordinator>,
+}
+
+impl FlushObserver for PerSinkRelay {
+    fn on_flushed(&self, _from: u64, to: u64) {
+        // `from` reported by the inner sink is its own local batch
+        // boundary, not meaningful at the combined-advance level.
+        // The coordinator synthesises a `from` from the previously-
+        // fired watermark.
+        self.coordinator.note(self.sink_index, to);
+    }
+}
+
+/// Tracks per-sink "highest flushed `to`" and fires the outer
+/// observer when `min(per-sink) > last-fired`. Synchronous, std
+/// `Mutex` (the FS/S3 flush sites are async-context but invoke
+/// `on_flushed` synchronously; the coordinator holds locks only
+/// long enough to compute new min and decide to fire).
+struct MinFlushCoordinator {
+    per_sink_flushed_to: std::sync::Mutex<Vec<u64>>,
+    last_fired_to: std::sync::Mutex<Option<u64>>,
+    outer: Arc<dyn FlushObserver>,
+}
+
+impl MinFlushCoordinator {
+    fn new(num_sinks: usize, outer: Arc<dyn FlushObserver>) -> Self {
+        Self {
+            per_sink_flushed_to: std::sync::Mutex::new(vec![0; num_sinks]),
+            last_fired_to: std::sync::Mutex::new(None),
+            outer,
+        }
+    }
+
+    fn note(&self, sink_index: usize, to: u64) {
+        let new_min = {
+            let mut per_sink = self.per_sink_flushed_to.lock().unwrap();
+            if to > per_sink[sink_index] {
+                per_sink[sink_index] = to;
+            }
+            *per_sink.iter().min().unwrap()
+        };
+        // First-fire case: no `last_fired_to` yet, so `from` is the
+        // tee's *initial* combined head; `0` is acceptable for the
+        // bootstrap fire (the receiver only cares about `to`).
+        let to_fire = {
+            let mut last = self.last_fired_to.lock().unwrap();
+            match *last {
+                Some(prev) if new_min > prev => {
+                    *last = Some(new_min);
+                    Some((prev, new_min))
+                }
+                None if new_min > 0 => {
+                    *last = Some(new_min);
+                    Some((0, new_min))
+                }
+                _ => None,
+            }
+        };
+        if let Some((from, to)) = to_fire {
+            self.outer.on_flushed(from, to);
+        }
+    }
 }
 
 /// Owned, no-op sink used as a placeholder when the tee temporarily
@@ -336,6 +429,11 @@ mod tests {
         fail_on_offset: Option<u64>,
         allow_compacted: bool,
         aligned_to: Arc<Mutex<Option<u64>>>,
+        /// The observer the tee installed via `set_flush_observer`,
+        /// if any. Tests fire it explicitly via [`Self::simulate_flush`]
+        /// to drive the tee's per-sink coordinator without needing
+        /// real disk I/O.
+        observer: Arc<Mutex<Option<Arc<dyn crate::FlushObserver>>>>,
     }
 
     impl Recording {
@@ -343,10 +441,12 @@ mod tests {
             let accepted = Arc::new(Mutex::new(Vec::new()));
             let flush_count = Arc::new(Mutex::new(0));
             let aligned_to = Arc::new(Mutex::new(None));
+            let observer = Arc::new(Mutex::new(None));
             let recorder = Recorder {
                 accepted: Arc::clone(&accepted),
                 flush_count: Arc::clone(&flush_count),
                 aligned_to: Arc::clone(&aligned_to),
+                observer: Arc::clone(&observer),
             };
             (
                 Self {
@@ -356,6 +456,7 @@ mod tests {
                     fail_on_offset: None,
                     allow_compacted: false,
                     aligned_to,
+                    observer,
                 },
                 recorder,
             )
@@ -375,6 +476,7 @@ mod tests {
         accepted: Arc<Mutex<Vec<u64>>>,
         flush_count: Arc<Mutex<u32>>,
         aligned_to: Arc<Mutex<Option<u64>>>,
+        observer: Arc<Mutex<Option<Arc<dyn crate::FlushObserver>>>>,
     }
 
     impl Recorder {
@@ -387,6 +489,14 @@ mod tests {
         fn aligned(&self) -> Option<u64> {
             *self.aligned_to.lock().unwrap()
         }
+        /// Fire the observer the tee installed via
+        /// `set_flush_observer`, simulating a real on-disk flush.
+        /// Tests use this instead of doing real I/O.
+        fn simulate_flush(&self, from: u64, to: u64) {
+            if let Some(obs) = self.observer.lock().unwrap().as_ref() {
+                obs.on_flushed(from, to);
+            }
+        }
     }
 
     #[async_trait]
@@ -421,6 +531,9 @@ mod tests {
             self.starting_head = low_watermark;
             Ok(())
         }
+        fn set_flush_observer(&mut self, observer: Arc<dyn crate::FlushObserver>) {
+            *self.observer.lock().unwrap() = Some(observer);
+        }
     }
 
     fn boxed(s: Recording) -> Box<dyn Sink> {
@@ -498,7 +611,7 @@ mod tests {
         let (a, _ra) = Recording::new(0);
         let (b, _rb) = Recording::new(0);
         let cache_state = Arc::new(CacheState::new());
-        cache_state.register_mirror("m", 0);
+        cache_state.register_mirror("m", 0, None, false);
         let binding = CacheBinding {
             state: Arc::clone(&cache_state),
             mirror_name: "m".into(),
@@ -525,7 +638,7 @@ mod tests {
         // here we just confirm a single record produced a single
         // visible key.
         assert_eq!(
-            cache_state.snapshot_keys(),
+            cache_state.snapshot_keys_for("m").unwrap(),
             vec!["k0".to_string()],
             "exactly one key materialised from one record"
         );
@@ -573,4 +686,91 @@ mod tests {
         let head = tee.next_expected_offset().await.unwrap();
         assert_eq!(head, 42, "after align, min(heads) = low_watermark");
     }
+
+    // ---- FlushObserver wiring through TeeSink ----
+
+    #[derive(Default)]
+    struct RecordingObserver {
+        fires: Mutex<Vec<(u64, u64)>>,
+    }
+
+    impl crate::FlushObserver for RecordingObserver {
+        fn on_flushed(&self, from: u64, to: u64) {
+            self.fires.lock().unwrap().push((from, to));
+        }
+    }
+
+    #[tokio::test]
+    async fn length_one_tee_forwards_observer_unchanged() {
+        let (inner, recorder) = Recording::new(0);
+        let mut tee = TeeSink::open(vec![("only".into(), boxed(inner))], None)
+            .await
+            .unwrap();
+        let obs = Arc::new(RecordingObserver::default());
+        tee.set_flush_observer(obs.clone() as Arc<dyn crate::FlushObserver>);
+
+        // Simulate two FS-style flushes via the recorder's helper.
+        recorder.simulate_flush(0, 9);
+        recorder.simulate_flush(10, 19);
+
+        let fires = obs.fires.lock().unwrap().clone();
+        assert_eq!(
+            fires,
+            vec![(0, 9), (10, 19)],
+            "length-1 tee passes (from, to) through verbatim"
+        );
+    }
+
+    #[tokio::test]
+    async fn multi_sink_tee_fires_only_when_min_advances() {
+        let (a, ra) = Recording::new(0);
+        let (b, rb) = Recording::new(0);
+        let mut tee = TeeSink::open(vec![("a".into(), boxed(a)), ("b".into(), boxed(b))], None)
+            .await
+            .unwrap();
+        let obs = Arc::new(RecordingObserver::default());
+        tee.set_flush_observer(obs.clone() as Arc<dyn crate::FlushObserver>);
+
+        // a flushes 0..9. b hasn't flushed yet → min is still 0,
+        // outer must not fire.
+        ra.simulate_flush(0, 9);
+        assert!(
+            obs.fires.lock().unwrap().is_empty(),
+            "outer must wait for the laggard"
+        );
+
+        // b flushes 0..4. min(9, 4) = 4; fire (0, 4).
+        rb.simulate_flush(0, 4);
+        assert_eq!(obs.fires.lock().unwrap().clone(), vec![(0, 4)]);
+
+        // b catches up to 9. min(9, 9) = 9; fire (4, 9).
+        rb.simulate_flush(5, 9);
+        assert_eq!(obs.fires.lock().unwrap().clone(), vec![(0, 4), (4, 9)]);
+
+        // a races ahead to 19. min(19, 9) = 9; no advance, no fire.
+        ra.simulate_flush(10, 19);
+        assert_eq!(obs.fires.lock().unwrap().clone(), vec![(0, 4), (4, 9)]);
+    }
+
+    #[tokio::test]
+    async fn multi_sink_tee_does_not_re_fire_for_already_seen_watermark() {
+        // Idempotence: a sink reporting the same `to` twice (which
+        // can happen if FS/S3 re-flushes an empty boundary in some
+        // future refactor) must not cause a duplicate outer fire.
+        let (a, ra) = Recording::new(0);
+        let (b, rb) = Recording::new(0);
+        let mut tee = TeeSink::open(vec![("a".into(), boxed(a)), ("b".into(), boxed(b))], None)
+            .await
+            .unwrap();
+        let obs = Arc::new(RecordingObserver::default());
+        tee.set_flush_observer(obs.clone() as Arc<dyn crate::FlushObserver>);
+
+        ra.simulate_flush(0, 5);
+        rb.simulate_flush(0, 5);
+        // First fire at (0, 5).
+        assert_eq!(obs.fires.lock().unwrap().clone(), vec![(0, 5)]);
+        // a re-reports 5; min doesn't advance; no fire.
+        ra.simulate_flush(0, 5);
+        assert_eq!(obs.fires.lock().unwrap().clone(), vec![(0, 5)]);
+    }
 }
diff --git a/crates/mirror-core/src/testing.rs b/crates/mirror-core/src/testing.rs
new file mode 100644
index 0000000..cefc7f5
--- /dev/null
+++ b/crates/mirror-core/src/testing.rs
@@ -0,0 +1,300 @@
+//! Test-only helpers for TDD-style spec authoring.
+//!
+//! The existing [`crate::mock`] types ([`crate::mock::MockSink`],
+//! [`crate::mock::MockSource`]) cover the common case where a spec
+//! test just needs to script events and scripted positions.
+//!
+//! This module adds primitives for the *uncommon* case: a spec test
+//! that needs a `Sink` or `Source` with behaviour the existing
+//! mocks don't model directly; typically because the spec is being
+//! TDD'd before the implementation exists, and the test wants to
+//! express "next_expected_offset returns 150 and write fails with
+//! UnexpectedPosition" without anyone adding a new builder method
+//! to MockSink first.
+//!
+//! ## When to reach for `BlanketMockSink`
+//!
+//! - You're writing a test for a spec change that hasn't been
+//!   implemented yet, and you want the test to compile and fail
+//!   loudly (the "red" of red-green-refactor) without changing
+//!   shared mock APIs.
+//! - You need a Sink whose behaviour changes across calls (each
+//!   `next_expected_offset` returns a different value, `write`
+//!   succeeds the first time but errors the second, …).
+//! - The existing `MockSink` builder doesn't expose the override
+//!   you need *and* the override is genuinely test-only (i.e. it
+//!   would be wrong to add it to the production-facing mock API).
+//!
+//! ## When NOT to
+//!
+//! For straightforward "sink starts at offset N, accepts contiguous
+//! writes" the plain [`crate::mock::MockSink`] is cheaper to read.
+//! Reach for `BlanketMockSink` only when the closures' flexibility
+//! is actually paying for itself.
+
+use std::sync::Mutex;
+
+use async_trait::async_trait;
+
+use crate::{Record, Sink, SinkError};
+
+/// A `Sink` whose every trait method is a closure the test owns.
+///
+/// Built via the [`BlanketMockSink::builder`] entrypoint and the
+/// `with_*` methods. Each closure is `FnMut`, so it can capture
+/// mutable state (call counters, scripted return sequences, etc.)
+/// from the test's stack frame.
+///
+/// All recorded calls are accessible via the [`BlanketMockSink::calls`]
+/// accessor for post-hoc assertions.
+pub struct BlanketMockSink {
+    on_next_expected_offset: Box<dyn FnMut() -> Result<u64, SinkError> + Send>,
+    on_write: Box<dyn FnMut(Record) -> Result<(), SinkError> + Send>,
+    on_flush: Box<dyn FnMut() -> Result<(), SinkError> + Send>,
+    on_allows_compacted_source: bool,
+    on_align_to_source_low_watermark: Box<dyn FnMut(u64) -> Result<(), SinkError> + Send>,
+    /// Recorded calls, in order, for the test to assert on.
+    calls: Mutex<Vec<Call>>,
+}
+
+/// Trace of one trait-method invocation, for post-hoc assertion.
+#[derive(Debug, Clone, PartialEq, Eq)]
+pub enum Call {
+    NextExpectedOffset,
+    Write { source_offset: u64 },
+    Flush,
+    AllowsCompactedSource,
+    AlignToSourceLowWatermark { low_watermark: u64 },
+}
+
+impl Default for BlanketMockSink {
+    fn default() -> Self {
+        Self {
+            on_next_expected_offset: Box::new(|| Ok(0)),
+            on_write: Box::new(|_| Ok(())),
+            on_flush: Box::new(|| Ok(())),
+            on_allows_compacted_source: false,
+            on_align_to_source_low_watermark: Box::new(|_| Ok(())),
+            calls: Mutex::new(Vec::new()),
+        }
+    }
+}
+
+impl BlanketMockSink {
+    /// Start a builder from defaults: every method returns `Ok` and
+    /// `allows_compacted_source` is `false`. Override individually
+    /// with `with_*`.
+    pub fn builder() -> Self {
+        Self::default()
+    }
+
+    /// `next_expected_offset` returns this fixed value on every call.
+    /// For varying values across calls use [`Self::with_next_expected_offset_fn`]
+    /// or [`Self::with_next_expected_offset_sequence`].
+    pub fn with_next_expected_offset(mut self, value: u64) -> Self {
+        self.on_next_expected_offset = Box::new(move || Ok(value));
+        self
+    }
+
+    /// `next_expected_offset` returns each value in `values` in turn,
+    /// then errors with a transport error once exhausted. Useful for
+    /// "first call returns X, second call returns Y" idle-drift tests.
+    pub fn with_next_expected_offset_sequence(mut self, values: Vec<u64>) -> Self {
+        let mut iter = values.into_iter();
+        self.on_next_expected_offset = Box::new(move || match iter.next() {
+            Some(v) => Ok(v),
+            None => Err(SinkError::Transport(
+                "BlanketMockSink: next_expected_offset sequence exhausted".into(),
+            )),
+        });
+        self
+    }
+
+    /// Full closure override for `next_expected_offset`. The closure
+    /// is invoked on every call; capture state via the closure to
+    /// implement test-specific behaviour.
+    pub fn with_next_expected_offset_fn<F>(mut self, f: F) -> Self
+    where
+        F: FnMut() -> Result<u64, SinkError> + Send + 'static,
+    {
+        self.on_next_expected_offset = Box::new(f);
+        self
+    }
+
+    /// `write` returns this error on every call. Useful for "the sink
+    /// rejects everything" tests; for selective rejection use
+    /// [`Self::with_write_fn`].
+    pub fn with_write_always_errors(mut self, err: SinkError) -> Self {
+        // SinkError isn't Clone, so we wrap in Mutex<Option<_>> and
+        // re-emit by reconstructing the variant from a recorded copy.
+        let stored = std::sync::Arc::new(Mutex::new(Some(err)));
+        self.on_write = Box::new(move |_| {
+            let mut slot = stored.lock().unwrap();
+            // Reconstruct an equivalent error each call; match on
+            // the originally-stored variant if it's still there;
+            // synthesise a Transport variant after the first call so
+            // SinkError doesn't need to be Clone.
+            match slot.take() {
+                Some(e) => Err(e),
+                None => Err(SinkError::Transport(
+                    "BlanketMockSink::with_write_always_errors (subsequent call)".into(),
+                )),
+            }
+        });
+        self
+    }
+
+    /// Full closure override for `write`. The closure receives the
+    /// `Record` and returns `Result<(), SinkError>`. Capture mutable
+    /// state in the closure for per-call decisions.
+    pub fn with_write_fn<F>(mut self, f: F) -> Self
+    where
+        F: FnMut(Record) -> Result<(), SinkError> + Send + 'static,
+    {
+        self.on_write = Box::new(f);
+        self
+    }
+
+    /// Full closure override for `flush`.
+    pub fn with_flush_fn<F>(mut self, f: F) -> Self
+    where
+        F: FnMut() -> Result<(), SinkError> + Send + 'static,
+    {
+        self.on_flush = Box::new(f);
+        self
+    }
+
+    /// Set the value returned by `allows_compacted_source`. Plain
+    /// boolean because the trait method isn't async.
+    pub fn with_allows_compacted_source(mut self, value: bool) -> Self {
+        self.on_allows_compacted_source = value;
+        self
+    }
+
+    /// Full closure override for `align_to_source_low_watermark`.
+    pub fn with_align_to_source_low_watermark_fn<F>(mut self, f: F) -> Self
+    where
+        F: FnMut(u64) -> Result<(), SinkError> + Send + 'static,
+    {
+        self.on_align_to_source_low_watermark = Box::new(f);
+        self
+    }
+
+    /// Snapshot of trait-method calls in invocation order.
+    pub fn calls(&self) -> Vec<Call> {
+        self.calls.lock().unwrap().clone()
+    }
+}
+
+#[async_trait]
+impl Sink for BlanketMockSink {
+    async fn next_expected_offset(&mut self) -> Result<u64, SinkError> {
+        self.calls.lock().unwrap().push(Call::NextExpectedOffset);
+        (self.on_next_expected_offset)()
+    }
+
+    async fn write(&mut self, record: Record) -> Result<(), SinkError> {
+        self.calls.lock().unwrap().push(Call::Write {
+            source_offset: record.source_offset,
+        });
+        (self.on_write)(record)
+    }
+
+    async fn flush(&mut self) -> Result<(), SinkError> {
+        self.calls.lock().unwrap().push(Call::Flush);
+        (self.on_flush)()
+    }
+
+    fn allows_compacted_source(&self) -> bool {
+        self.calls.lock().unwrap().push(Call::AllowsCompactedSource);
+        self.on_allows_compacted_source
+    }
+
+    async fn align_to_source_low_watermark(&mut self, low_watermark: u64) -> Result<(), SinkError> {
+        self.calls
+            .lock()
+            .unwrap()
+            .push(Call::AlignToSourceLowWatermark { low_watermark });
+        (self.on_align_to_source_low_watermark)(low_watermark)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::TimestampType;
+
+    fn rec(offset: u64) -> Record {
+        Record {
+            topic: "t".into(),
+            partition: 0,
+            source_offset: offset,
+            timestamp_ms: Some(1),
+            timestamp_type: TimestampType::CreateTime,
+            key: Some(b"k".to_vec()),
+            value: Some(b"v".to_vec()),
+            headers: vec![],
+        }
+    }
+
+    #[tokio::test]
+    async fn defaults_return_ok_zero_and_record_calls() {
+        let mut s = BlanketMockSink::builder();
+        assert_eq!(s.next_expected_offset().await.unwrap(), 0);
+        s.write(rec(0)).await.unwrap();
+        s.flush().await.unwrap();
+        assert!(!s.allows_compacted_source());
+        s.align_to_source_low_watermark(42).await.unwrap();
+        assert_eq!(
+            s.calls(),
+            vec![
+                Call::NextExpectedOffset,
+                Call::Write { source_offset: 0 },
+                Call::Flush,
+                Call::AllowsCompactedSource,
+                Call::AlignToSourceLowWatermark { low_watermark: 42 },
+            ]
+        );
+    }
+
+    #[tokio::test]
+    async fn next_expected_sequence_advances_per_call() {
+        let mut s = BlanketMockSink::builder().with_next_expected_offset_sequence(vec![10, 20, 30]);
+        assert_eq!(s.next_expected_offset().await.unwrap(), 10);
+        assert_eq!(s.next_expected_offset().await.unwrap(), 20);
+        assert_eq!(s.next_expected_offset().await.unwrap(), 30);
+        // Fourth call: sequence exhausted -> transport error.
+        match s.next_expected_offset().await {
+            Err(SinkError::Transport(msg)) => assert!(msg.contains("exhausted")),
+            other => panic!("expected exhaustion error, got {other:?}"),
+        }
+    }
+
+    #[tokio::test]
+    async fn closure_can_capture_mutable_state() {
+        // The decision depends on captured state (the call counter),
+        // not just the record's intrinsics; this is the test's
+        // whole point. Reject the 3rd write call regardless of which
+        // offset it carries.
+        let mut written = 0u32;
+        let mut s = BlanketMockSink::builder().with_write_fn(move |r| {
+            written += 1;
+            if written == 3 {
+                Err(SinkError::UnexpectedPosition {
+                    expected: 99,
+                    actual: r.source_offset,
+                })
+            } else {
+                Ok(())
+            }
+        });
+        s.write(rec(10)).await.unwrap();
+        s.write(rec(11)).await.unwrap();
+        match s.write(rec(12)).await {
+            Err(SinkError::UnexpectedPosition { expected, actual }) => {
+                assert_eq!((expected, actual), (99, 12));
+            }
+            other => panic!("got {other:?}"),
+        }
+    }
+}
diff --git a/crates/mirror-core/tests/notifier_invariants.rs b/crates/mirror-core/tests/notifier_invariants.rs
new file mode 100644
index 0000000..5d65be9
--- /dev/null
+++ b/crates/mirror-core/tests/notifier_invariants.rs
@@ -0,0 +1,394 @@
+//! Invariant tests for the [`Notifier`] hook in `run_mirror`.
+//!
+//! These pin the contract every notifier implementation must honour:
+//!   * `on_record` fires exactly once per successful `sink.write`,
+//!     in source-offset order, *after* the destination has accepted
+//!     the record.
+//!   * `shutdown` fires once on graceful exit, *after* `sink.flush`.
+//!   * `NotifyError` returned from either hook aborts the loop and
+//!     surfaces as [`MirrorError::Notify`].
+//!   * The hook never fires on the rejection paths
+//!     (source-went-backwards, sink write error, etc.).
+
+use std::sync::{Arc, Mutex};
+
+use async_trait::async_trait;
+use mirror_core::mock::{rec, MockSink, MockSource, MockSourceEvent};
+use mirror_core::{
+    run_mirror_with_notifier, MirrorError, Notifier, NotifyError, Record, Sink, SinkError,
+};
+
+fn drive<F>(future: F) -> Result<(), MirrorError>
+where
+    F: std::future::IntoFuture<Output = Result<(), MirrorError>>,
+{
+    let rt = tokio::runtime::Builder::new_current_thread()
+        .enable_time()
+        .build()
+        .unwrap();
+    rt.block_on(async move { future.into_future().await })
+}
+
+fn never() -> std::future::Pending<()> {
+    std::future::pending::<()>()
+}
+
+fn no_heartbeat() -> std::time::Duration {
+    std::time::Duration::ZERO
+}
+
+/// Records every `on_record` and `shutdown` call. Configurable to
+/// return a `NotifyError` on a specific record offset, or on shutdown.
+#[derive(Default)]
+struct RecordingNotifier {
+    log: Arc<Mutex<Vec<NotifierEvent>>>,
+    fail_on_offset: Option<u64>,
+    fail_on_shutdown: bool,
+}
+
+#[derive(Debug, PartialEq, Eq, Clone)]
+enum NotifierEvent {
+    OnRecord(u64),
+    Shutdown,
+}
+
+impl RecordingNotifier {
+    fn new() -> Self {
+        Self::default()
+    }
+
+    fn fail_on(mut self, offset: u64) -> Self {
+        self.fail_on_offset = Some(offset);
+        self
+    }
+
+    fn fail_on_shutdown(mut self) -> Self {
+        self.fail_on_shutdown = true;
+        self
+    }
+
+    fn log_handle(&self) -> Arc<Mutex<Vec<NotifierEvent>>> {
+        Arc::clone(&self.log)
+    }
+}
+
+#[async_trait]
+impl Notifier for RecordingNotifier {
+    async fn on_record(&mut self, record: &Record) -> Result<(), NotifyError> {
+        self.log
+            .lock()
+            .unwrap()
+            .push(NotifierEvent::OnRecord(record.source_offset));
+        if Some(record.source_offset) == self.fail_on_offset {
+            return Err(NotifyError::Transport(format!(
+                "boom at offset {}",
+                record.source_offset
+            )));
+        }
+        Ok(())
+    }
+
+    async fn shutdown(&mut self) -> Result<(), NotifyError> {
+        self.log.lock().unwrap().push(NotifierEvent::Shutdown);
+        if self.fail_on_shutdown {
+            return Err(NotifyError::Exhausted {
+                attempts: 5,
+                last_error: "shutdown drain failed".into(),
+            });
+        }
+        Ok(())
+    }
+}
+
+#[test]
+fn on_record_fires_once_per_successful_write_in_offset_order() {
+    let source = MockSource::new([
+        MockSourceEvent::Record(rec(10)),
+        MockSourceEvent::Record(rec(11)),
+        MockSourceEvent::Record(rec(12)),
+        MockSourceEvent::Error("stop".into()),
+    ]);
+    let sink = MockSink::starting_at(10);
+    let notifier = RecordingNotifier::new();
+    let log = notifier.log_handle();
+
+    let result = drive(run_mirror_with_notifier(
+        source,
+        sink,
+        notifier,
+        never(),
+        no_heartbeat(),
+    ));
+    assert!(matches!(result, Err(MirrorError::Source(_))));
+
+    let log = log.lock().unwrap().clone();
+    assert_eq!(
+        log,
+        vec![
+            NotifierEvent::OnRecord(10),
+            NotifierEvent::OnRecord(11),
+            NotifierEvent::OnRecord(12),
+        ],
+        "notifier must observe every accepted record in offset order, and only those"
+    );
+}
+
+#[test]
+fn shutdown_fires_after_flush_on_graceful_exit() {
+    use std::sync::atomic::{AtomicUsize, Ordering};
+
+    let flush_count = Arc::new(AtomicUsize::new(0));
+    let order = Arc::new(Mutex::new(Vec::<&'static str>::new()));
+
+    struct OrderingSink {
+        position: u64,
+        flush_count: Arc<AtomicUsize>,
+        order: Arc<Mutex<Vec<&'static str>>>,
+    }
+    #[async_trait]
+    impl Sink for OrderingSink {
+        async fn next_expected_offset(&mut self) -> Result<u64, SinkError> {
+            Ok(self.position)
+        }
+        async fn write(&mut self, _record: Record) -> Result<(), SinkError> {
+            self.position += 1;
+            Ok(())
+        }
+        async fn flush(&mut self) -> Result<(), SinkError> {
+            self.flush_count.fetch_add(1, Ordering::SeqCst);
+            self.order.lock().unwrap().push("sink.flush");
+            Ok(())
+        }
+    }
+
+    struct OrderingNotifier {
+        order: Arc<Mutex<Vec<&'static str>>>,
+        log: Arc<Mutex<Vec<NotifierEvent>>>,
+    }
+    #[async_trait]
+    impl Notifier for OrderingNotifier {
+        async fn on_record(&mut self, record: &Record) -> Result<(), NotifyError> {
+            self.log
+                .lock()
+                .unwrap()
+                .push(NotifierEvent::OnRecord(record.source_offset));
+            Ok(())
+        }
+        async fn shutdown(&mut self) -> Result<(), NotifyError> {
+            self.order.lock().unwrap().push("notifier.shutdown");
+            self.log.lock().unwrap().push(NotifierEvent::Shutdown);
+            Ok(())
+        }
+    }
+
+    let log = Arc::new(Mutex::new(Vec::<NotifierEvent>::new()));
+    let source = MockSource::new([MockSourceEvent::Hang]);
+    let sink = OrderingSink {
+        position: 0,
+        flush_count: Arc::clone(&flush_count),
+        order: Arc::clone(&order),
+    };
+    let notifier = OrderingNotifier {
+        order: Arc::clone(&order),
+        log: Arc::clone(&log),
+    };
+
+    // Shutdown future already ready -> biased select takes shutdown
+    // branch immediately on first iteration.
+    let result = drive(run_mirror_with_notifier(
+        source,
+        sink,
+        notifier,
+        async {},
+        no_heartbeat(),
+    ));
+    assert!(matches!(result, Ok(())), "expected Ok, got {result:?}");
+    assert_eq!(flush_count.load(Ordering::SeqCst), 1);
+    assert_eq!(
+        order.lock().unwrap().clone(),
+        vec!["sink.flush", "notifier.shutdown"],
+        "sink.flush must run before notifier.shutdown so the destination is durable before the webhook drain"
+    );
+}
+
+#[test]
+fn notify_error_from_on_record_propagates_as_mirror_error() {
+    let source = MockSource::new([
+        MockSourceEvent::Record(rec(0)),
+        MockSourceEvent::Record(rec(1)), // never reached
+    ]);
+    let sink = MockSink::starting_at(0);
+    let notifier = RecordingNotifier::new().fail_on(0);
+    let log = notifier.log_handle();
+
+    let result = drive(run_mirror_with_notifier(
+        source,
+        sink,
+        notifier,
+        never(),
+        no_heartbeat(),
+    ));
+    match result {
+        Err(MirrorError::Notify(NotifyError::Transport(msg))) => {
+            assert!(msg.contains("offset 0"), "got: {msg}");
+        }
+        other => panic!("expected MirrorError::Notify(Transport), got {other:?}"),
+    }
+    let log = log.lock().unwrap().clone();
+    assert_eq!(
+        log,
+        vec![NotifierEvent::OnRecord(0)],
+        "loop must abort after the failing on_record, never observing offset 1"
+    );
+}
+
+#[test]
+fn notify_error_from_shutdown_propagates_as_mirror_error() {
+    let source = MockSource::new([MockSourceEvent::Hang]);
+    let sink = MockSink::starting_at(0);
+    let notifier = RecordingNotifier::new().fail_on_shutdown();
+
+    let result = drive(run_mirror_with_notifier(
+        source,
+        sink,
+        notifier,
+        async {},
+        no_heartbeat(),
+    ));
+    match result {
+        Err(MirrorError::Notify(NotifyError::Exhausted {
+            attempts,
+            last_error,
+        })) => {
+            assert_eq!(attempts, 5);
+            assert_eq!(last_error, "shutdown drain failed");
+        }
+        other => panic!("expected MirrorError::Notify(Exhausted), got {other:?}"),
+    }
+}
+
+#[test]
+fn on_record_does_not_fire_when_sink_write_fails() {
+    let source = MockSource::new([MockSourceEvent::Record(rec(0))]);
+    let sink = MockSink::starting_at(0).with_write_error(SinkError::Transport("disk full".into()));
+    let notifier = RecordingNotifier::new();
+    let log = notifier.log_handle();
+
+    let result = drive(run_mirror_with_notifier(
+        source,
+        sink,
+        notifier,
+        never(),
+        no_heartbeat(),
+    ));
+    assert!(matches!(
+        result,
+        Err(MirrorError::Sink(SinkError::Transport(_)))
+    ));
+    assert!(
+        log.lock().unwrap().is_empty(),
+        "notifier must not observe a record the destination rejected"
+    );
+}
+
+#[test]
+fn on_record_does_not_fire_on_source_went_backwards() {
+    // Source delivers 10 then 9. Loop must error before ever calling
+    // sink.write; and therefore before on_record.
+    let source = MockSource::new([
+        MockSourceEvent::Record(rec(10)),
+        MockSourceEvent::Record(rec(9)),
+    ]);
+    let sink = MockSink::starting_at(10).with_allows_compacted_source(true);
+    let notifier = RecordingNotifier::new();
+    let log = notifier.log_handle();
+
+    let result = drive(run_mirror_with_notifier(
+        source,
+        sink,
+        notifier,
+        never(),
+        no_heartbeat(),
+    ));
+    assert!(matches!(
+        result,
+        Err(MirrorError::SourceWentBackwards { .. })
+    ));
+    // The first record (offset 10) IS accepted and observed; the
+    // backwards record (offset 9) must not be.
+    let log = log.lock().unwrap().clone();
+    assert_eq!(log, vec![NotifierEvent::OnRecord(10)]);
+}
+
+/// Compaction-tolerant sink: accepts forward gaps when
+/// `allows_compacted_source = true`, mirroring the real FS/S3 sinks.
+/// `MockSink` is too strict for the gap test below.
+struct CompactionLogSink {
+    position: u64,
+}
+#[async_trait]
+impl Sink for CompactionLogSink {
+    async fn next_expected_offset(&mut self) -> Result<u64, SinkError> {
+        Ok(self.position)
+    }
+    async fn write(&mut self, record: Record) -> Result<(), SinkError> {
+        if record.source_offset < self.position {
+            return Err(SinkError::UnexpectedPosition {
+                expected: self.position,
+                actual: record.source_offset,
+            });
+        }
+        // Forward gap accepted under compaction:log; tracker jumps
+        // to the delivered offset + 1.
+        self.position = record.source_offset + 1;
+        Ok(())
+    }
+    fn allows_compacted_source(&self) -> bool {
+        true
+    }
+    async fn align_to_source_low_watermark(&mut self, low_watermark: u64) -> Result<(), SinkError> {
+        self.position = low_watermark;
+        Ok(())
+    }
+}
+
+#[test]
+fn on_record_fires_for_gapped_offsets_under_compaction_log() {
+    // Mirrors `compaction_log_accepts_repeated_gaps_mid_stream` in
+    // loop_invariants.rs: under compaction:log the loop must accept
+    // forward gaps, and the notifier must see each accepted offset
+    // (KKV semantics: every committed record is a stale-key
+    // invalidation event downstream).
+    let source = MockSource::new([
+        MockSourceEvent::Record(rec(461)),
+        MockSourceEvent::Record(rec(466)),
+        MockSourceEvent::Record(rec(470)),
+        MockSourceEvent::Error("stop".into()),
+    ])
+    .with_low_watermark(0);
+    let sink = CompactionLogSink { position: 0 };
+    let notifier = RecordingNotifier::new();
+    let log = notifier.log_handle();
+
+    let result = drive(run_mirror_with_notifier(
+        source,
+        sink,
+        notifier,
+        never(),
+        no_heartbeat(),
+    ));
+    assert!(
+        matches!(result, Err(MirrorError::Source(_))),
+        "got: {result:?}"
+    );
+
+    let log = log.lock().unwrap().clone();
+    assert_eq!(
+        log,
+        vec![
+            NotifierEvent::OnRecord(461),
+            NotifierEvent::OnRecord(466),
+            NotifierEvent::OnRecord(470),
+        ]
+    );
+}
diff --git a/crates/mirror-core/tests/palette_demo.rs b/crates/mirror-core/tests/palette_demo.rs
new file mode 100644
index 0000000..5cc1fb8
--- /dev/null
+++ b/crates/mirror-core/tests/palette_demo.rs
@@ -0,0 +1,237 @@
+//! Demonstration of the test-helper palette in `mirror_core::testing`.
+//!
+//! Every test in this file uses ONLY the published palette
+//! ([`mirror_core::mock`] + [`mirror_core::testing`]). The point is to
+//! prove that the palette is rich enough to express the common
+//! shapes of spec tests *without* a contributor having to extend the
+//! mock infrastructure first.
+//!
+//! See `TESTING.md` at the repo root for the catalogue of layers and
+//! which one a given spec change belongs in.
+
+use mirror_core::mock::{rec, MockSource, MockSourceEvent};
+use mirror_core::testing::{BlanketMockSink, Call};
+use mirror_core::{run_mirror, MirrorError, SinkError};
+
+fn drive<F>(future: F) -> Result<(), MirrorError>
+where
+    F: std::future::IntoFuture<Output = Result<(), MirrorError>>,
+{
+    let rt = tokio::runtime::Builder::new_current_thread()
+        .enable_time()
+        .build()
+        .unwrap();
+    rt.block_on(async move { future.into_future().await })
+}
+
+fn never() -> std::future::Pending<()> {
+    std::future::pending::<()>()
+}
+
+/// Demonstration #1; encode the committed `SourceWentBackwards`
+/// invariant entirely through the palette.
+///
+/// The point isn't the test result (`mirror-core/tests/loop_invariants.rs`
+/// already has this case). The point is the *shape*: declarative
+/// mock setup + drive + match on the error variant, with no
+/// `InspectorSink`-style state plumbing.
+#[test]
+fn palette_encodes_source_went_backwards() {
+    // Sink reports it's at offset 5; the loop's `expected` starts
+    // here.
+    let sink = BlanketMockSink::builder()
+        .with_next_expected_offset(5)
+        // The loop's per-record gate fires BEFORE delegating to
+        // sink.write(), so the closure here is never reached for
+        // the offending record. It still has to be present for
+        // any preceding records the loop accepts; default returns
+        // Ok, which is fine.
+        ;
+
+    // Source delivers 5 (matches expected) then 3 (goes backwards).
+    let source = MockSource::new([
+        MockSourceEvent::Record(rec(5)),
+        MockSourceEvent::Record(rec(3)),
+    ]);
+
+    let result = drive(run_mirror(source, sink, never()));
+    match result {
+        Err(MirrorError::SourceWentBackwards { expected, got }) => {
+            assert_eq!((expected, got), (6, 3));
+        }
+        other => panic!("expected SourceWentBackwards, got {other:?}"),
+    }
+}
+
+/// Demonstration #2; encode an *idle-drift* invariant where the
+/// sink's `next_expected_offset` changes across calls.
+///
+/// The existing `MockSink::with_position_program` already supports
+/// scripted positions; this test deliberately uses `BlanketMockSink`'s
+/// closure-driven sequence instead, to show the equivalence:
+/// `with_next_expected_offset_sequence` covers the same shape with
+/// fewer assumptions about MockSink's structure. A future spec test
+/// that needed e.g. "the third call returns an error, not just a
+/// different value" would use `with_next_expected_offset_fn` directly.
+#[test]
+fn palette_encodes_destination_drift_via_sequence() {
+    // Startup call returns 10; idle re-check (after the Idle event)
+    // returns 15; out-of-band write detected.
+    let sink = BlanketMockSink::builder().with_next_expected_offset_sequence(vec![10, 15]);
+
+    let source = MockSource::new([
+        MockSourceEvent::Record(rec(10)),
+        MockSourceEvent::Idle,
+        MockSourceEvent::Hang,
+    ]);
+
+    let result = drive(run_mirror(source, sink, never()));
+    match result {
+        Err(MirrorError::DestinationDrift { expected, actual }) => {
+            assert_eq!((expected, actual), (11, 15));
+        }
+        other => panic!("expected DestinationDrift, got {other:?}"),
+    }
+}
+
+/// Demonstration #3; encode a per-record decision via `with_write_fn`.
+///
+/// Scenario: the spec under test is "the sink rejects exactly the
+/// fifth record." The closure captures a counter, decides per call.
+/// No new mock method needed.
+#[test]
+fn palette_encodes_per_record_sink_decision() {
+    // The closure captures a counter that drives the per-call
+    // decision; that's the demonstration. The fifth write call
+    // (regardless of record offset) is rejected.
+    let mut written = 0u32;
+    let sink = BlanketMockSink::builder()
+        .with_next_expected_offset(0)
+        .with_write_fn(move |r| {
+            written += 1;
+            if written == 5 {
+                Err(SinkError::UnexpectedPosition {
+                    expected: written as u64 - 1,
+                    actual: r.source_offset,
+                })
+            } else {
+                Ok(())
+            }
+        });
+
+    let source = MockSource::new([
+        MockSourceEvent::Record(rec(0)),
+        MockSourceEvent::Record(rec(1)),
+        MockSourceEvent::Record(rec(2)),
+        MockSourceEvent::Record(rec(3)),
+        MockSourceEvent::Record(rec(4)), // the 5th write; rejected
+    ]);
+
+    let result = drive(run_mirror(source, sink, never()));
+    match result {
+        Err(MirrorError::Sink(SinkError::UnexpectedPosition { expected, actual })) => {
+            assert_eq!((expected, actual), (4, 4));
+        }
+        other => panic!("expected sink UnexpectedPosition on 5th write, got {other:?}"),
+    }
+}
+
+/// Demonstration #4; inspect call ordering after the loop exits.
+///
+/// `BlanketMockSink::calls()` returns the full trait-method
+/// invocation history. Useful when the spec is about *what order*
+/// the loop calls methods in, not the values returned. Example: a
+/// spec might say "shutdown must call flush() exactly once, and only
+/// after any in-flight write completes."
+#[test]
+fn palette_records_call_order_for_post_hoc_assertion() {
+    let sink = BlanketMockSink::builder().with_next_expected_offset(0);
+
+    let source = MockSource::new([
+        MockSourceEvent::Record(rec(0)),
+        MockSourceEvent::Record(rec(1)),
+        MockSourceEvent::Hang,
+    ]);
+
+    // Shutdown future is already-ready, so the loop takes the
+    // shutdown branch at the next iteration boundary after some
+    // (possibly zero) records have been processed.
+    let _ = drive(run_mirror(source, sink, async {}));
+
+    // The contract `BlanketMockSink` upholds: every trait-method
+    // call is recorded. We can't assert that the loop processed N
+    // records (`tokio::select!` biases shutdown), but we CAN assert
+    // structural properties; every Write is preceded by a
+    // NextExpectedOffset at startup, flush is called at most once,
+    // etc. For a true post-hoc inspection the test holds the sink
+    // by reference via Arc<Mutex> instead of moving into run_mirror.
+    // The shape of that pattern lives in `tee.rs` already and isn't
+    // reproduced here; the point is the calls() accessor exists
+    // and is the entrypoint.
+    //
+    // For this test, just confirm the discrimination works: a
+    // freshly built sink has no calls.
+    let fresh = BlanketMockSink::builder();
+    assert_eq!(fresh.calls(), Vec::<Call>::new());
+}
+
+/// Demonstration #5; TDD sketch for a future spec.
+///
+/// This test is `#[ignore]`d because the spec it asserts on doesn't
+/// exist yet. It compiles, runs in `--include-ignored` mode, and
+/// fails with a clear panic naming the work to do; exactly the
+/// red-green-refactor entrypoint a contributor wants when picking
+/// up the work.
+///
+/// **The spec:** "It's a fatal condition if any sink has a higher
+/// offset than its source." Concretely: at startup, the run loop
+/// must compare `sink.next_expected_offset()` against
+/// `source.high_watermark()` and crash with a specific error if the
+/// sink is ahead.
+///
+/// **What the palette provides today:**
+///   - `MockSource::with_high_watermark(100)` to script the source's
+///     HWM (the trait method's default is `u64::MAX` so existing
+///     tests are unaffected).
+///   - `BlanketMockSink::with_next_expected_offset(150)` to script
+///     a sink that's ahead.
+///
+/// **What the spec implementer would add:**
+///   - A new `MirrorError::SinkAheadOfSource { sink_offset, source_hwm }`
+///     variant in `crates/mirror-core/src/lib.rs`.
+///   - A check in `run_mirror_with_heartbeat` after the initial
+///     `sink.next_expected_offset()` call (or on idle, if the spec
+///     wants ongoing monitoring) that calls `source.high_watermark()`
+///     and returns the new variant when sink > hwm.
+///
+/// Removing the `#[ignore]` and replacing the body with the actual
+/// assertion (see the commented sketch below) is the green-side
+/// landing.
+#[test]
+#[ignore = "TODO: spec not yet implemented; see body for the TDD pattern"]
+fn future_spec_sink_ahead_of_source_is_fatal() {
+    // Palette setup that the future test would use:
+    //
+    // let source = MockSource::new([MockSourceEvent::Hang])
+    //     .with_high_watermark(100); // broker HWM
+    // let sink = BlanketMockSink::builder()
+    //     .with_next_expected_offset(150); // sink claims to be at 150
+    //
+    // let result = drive(run_mirror(source, sink, never()));
+    // match result {
+    //     Err(MirrorError::SinkAheadOfSource { sink_offset, source_hwm }) => {
+    //         assert_eq!(sink_offset, 150);
+    //         assert_eq!(source_hwm, 100);
+    //     }
+    //     other => panic!("expected SinkAheadOfSource, got {other:?}"),
+    // }
+    panic!(
+        "Implement `MirrorError::SinkAheadOfSource` + the HWM check in \
+         `run_mirror_with_heartbeat`, then drop the `#[ignore]` and \
+         uncomment the body above. The palette ({MockSource}::with_high_watermark, \
+         {BlanketMockSink}::with_next_expected_offset) already supports \
+         everything the test needs.",
+        MockSource = "MockSource",
+        BlanketMockSink = "BlanketMockSink"
+    );
+}
diff --git a/crates/mirror-core/tests/write_observer.rs b/crates/mirror-core/tests/write_observer.rs
new file mode 100644
index 0000000..d78b74f
--- /dev/null
+++ b/crates/mirror-core/tests/write_observer.rs
@@ -0,0 +1,164 @@
+//! Pin the contract that a sink's [`WriteObserver`] fires after
+//! every successful write and never fires after a failed one. Also
+//! pin the bridge `WriteObserver -> AckSink::note_through(offset + 1)`
+//! shape the supervisor's per-destination ack collector will use.
+
+use std::sync::Arc;
+use std::sync::Mutex;
+
+use mirror_core::mock::{rec, MockSink};
+use mirror_core::{AckSink, Sink, SinkError, WriteObserver};
+
+/// Tiny observer that just appends each `on_written` offset.
+#[derive(Debug, Default)]
+struct RecordingObserver {
+    offsets: Mutex<Vec<u64>>,
+}
+
+impl WriteObserver for RecordingObserver {
+    fn on_written(&self, source_offset: u64) {
+        self.offsets.lock().unwrap().push(source_offset);
+    }
+}
+
+/// AckSink that records every `note_through` value. The supervisor's
+/// real ack tracker takes the running max; this stub keeps the raw
+/// sequence so a test can assert on what its bridge fed in.
+#[derive(Debug, Default)]
+struct RecordingAck {
+    values: Mutex<Vec<u64>>,
+}
+
+impl AckSink for RecordingAck {
+    fn note_through(&self, through: u64) {
+        self.values.lock().unwrap().push(through);
+    }
+}
+
+/// A `WriteObserver` that bridges every `on_written(offset)` into
+/// `AckSink::note_through(offset + 1)`. This is the exact shape the
+/// supervisor's per-destination wiring takes for Kafka sinks. The
+/// trait lives in mirror-core; the wiring lives in mirror-bin
+/// (committed separately) and isn't part of the public crate.
+struct BridgeToAck {
+    ack: Arc<dyn AckSink>,
+}
+
+impl WriteObserver for BridgeToAck {
+    fn on_written(&self, source_offset: u64) {
+        self.ack.note_through(source_offset + 1);
+    }
+}
+
+#[tokio::test]
+async fn observer_fires_once_per_successful_write_in_order() {
+    let mut sink = MockSink::starting_at(0);
+    let obs = Arc::new(RecordingObserver::default());
+    sink.set_write_observer(obs.clone() as Arc<dyn WriteObserver>);
+
+    for off in 0..5 {
+        sink.write(rec(off)).await.unwrap();
+    }
+
+    assert_eq!(
+        obs.offsets.lock().unwrap().clone(),
+        vec![0, 1, 2, 3, 4],
+        "every successful write must fire on_written exactly once, in order"
+    );
+}
+
+#[tokio::test]
+async fn observer_does_not_fire_when_write_rejects_the_gate() {
+    // MockSink rejects a record whose offset doesn't match its
+    // running position. The observer must not fire for the rejected
+    // call.
+    let mut sink = MockSink::starting_at(0);
+    let obs = Arc::new(RecordingObserver::default());
+    sink.set_write_observer(obs.clone() as Arc<dyn WriteObserver>);
+
+    sink.write(rec(0)).await.unwrap();
+    // Skip ahead — MockSink expects 1, we send 5.
+    let err = sink.write(rec(5)).await.unwrap_err();
+    assert!(
+        matches!(err, SinkError::UnexpectedPosition { .. }),
+        "got {err:?}"
+    );
+
+    assert_eq!(
+        obs.offsets.lock().unwrap().clone(),
+        vec![0],
+        "observer must see only the accepted write"
+    );
+}
+
+#[tokio::test]
+async fn observer_does_not_fire_on_a_scripted_write_error() {
+    // `with_write_error` makes the next write fail without touching
+    // running_position. The observer must not fire.
+    let mut sink = MockSink::starting_at(0).with_write_error(SinkError::Transport("boom".into()));
+    let obs = Arc::new(RecordingObserver::default());
+    sink.set_write_observer(obs.clone() as Arc<dyn WriteObserver>);
+
+    let err = sink.write(rec(0)).await.unwrap_err();
+    assert!(matches!(err, SinkError::Transport(_)), "got {err:?}");
+    assert!(
+        obs.offsets.lock().unwrap().is_empty(),
+        "observer must not fire on the failed write"
+    );
+
+    // Subsequent successful write fires normally.
+    sink.write(rec(0)).await.unwrap();
+    assert_eq!(obs.offsets.lock().unwrap().clone(), vec![0]);
+}
+
+#[tokio::test]
+async fn write_observer_bridge_to_ack_sink_increments_through_offsets() {
+    // The supervisor's per-destination shim is exactly this shape:
+    // wrap an AckSink in a WriteObserver that translates
+    // `on_written(offset)` into `note_through(offset + 1)` (i.e. "the
+    // destination is durable through offset + 1").
+    let mut sink = MockSink::starting_at(0);
+    let ack = Arc::new(RecordingAck::default());
+    let bridge = Arc::new(BridgeToAck {
+        ack: ack.clone() as Arc<dyn AckSink>,
+    });
+    sink.set_write_observer(bridge as Arc<dyn WriteObserver>);
+
+    for off in 0..3 {
+        sink.write(rec(off)).await.unwrap();
+    }
+
+    assert_eq!(
+        ack.values.lock().unwrap().clone(),
+        vec![1, 2, 3],
+        "bridge must hand the ack `offset + 1` per successful write"
+    );
+}
+
+#[tokio::test]
+async fn unsupervised_sink_default_set_write_observer_is_noop() {
+    // The default `Sink::set_write_observer` is a no-op. Sinks that
+    // don't override it should silently accept the call.
+    struct NoOverrideSink {
+        position: u64,
+    }
+    #[async_trait::async_trait]
+    impl Sink for NoOverrideSink {
+        async fn next_expected_offset(&mut self) -> Result<u64, SinkError> {
+            Ok(self.position)
+        }
+        async fn write(&mut self, _record: mirror_core::Record) -> Result<(), SinkError> {
+            self.position += 1;
+            Ok(())
+        }
+    }
+    let mut sink = NoOverrideSink { position: 0 };
+    let obs = Arc::new(RecordingObserver::default());
+    sink.set_write_observer(obs.clone() as Arc<dyn WriteObserver>);
+
+    sink.write(rec(0)).await.unwrap();
+    assert!(
+        obs.offsets.lock().unwrap().is_empty(),
+        "default impl must not fire the observer"
+    );
+}
diff --git a/crates/mirror-fs/src/lib.rs b/crates/mirror-fs/src/lib.rs
index 310d813..ddbd917 100644
--- a/crates/mirror-fs/src/lib.rs
+++ b/crates/mirror-fs/src/lib.rs
@@ -61,7 +61,7 @@ pub struct FilesystemSinkConfig {
     /// Optional shared HTTP-cache state. When `Some`, every record
     /// the sink receives is applied to the cache view from the
     /// consume loop (per-record, decoupled from flush cadence). The
-    /// mirror is also bootstrapped against this state at `open()` —
+    /// mirror is also bootstrapped against this state at `open()` -
     /// in compaction:log mode, the latest snapshot's keys are
     /// pre-loaded; in append mode, the entire on-disk chain is
     /// replayed (linear in total record count).
@@ -73,7 +73,7 @@ pub struct FilesystemSinkConfig {
 /// set on a `FilesystemSinkConfig`, the sink uses it on `open` to
 /// replay the durable destination state into the shared cache so
 /// HTTP readers see what's already on disk. The per-record `write()`
-/// path no longer touches the cache — that's the tee level's job
+/// path no longer touches the cache; that's the tee level's job
 /// ([`mirror_core::TeeSink`]) so a single record never gets applied
 /// twice when the same mirror feeds multiple destinations.
 pub use mirror_core::CacheBinding;
@@ -104,6 +104,11 @@ pub struct FilesystemSink {
     values: ColumnType,
     compaction: Option<CompactionMode>,
     flush: FlushTriggers,
+    /// Optional callback fired after every successful flush. Wired
+    /// up by [`Sink::set_flush_observer`]; default is `None` (no
+    /// observer). Stored as `Arc` so the same observer can be
+    /// shared across multiple sinks under a tee.
+    flush_observer: Option<std::sync::Arc<dyn mirror_core::FlushObserver>>,
     /// Durable destination position: `max(to) + 1` of files on disk.
     durable_position: u64,
     /// Buffered records arrived since the last flush. In append mode
@@ -115,7 +120,7 @@ pub struct FilesystemSink {
     buffer_started: Option<Instant>,
     last_flush_at: Option<Instant>,
     /// Compaction-mode in-memory materialized view, sorted by key.
-    /// `None` when `compaction` is `None` — even with cache enabled,
+    /// `None` when `compaction` is `None`; even with cache enabled,
     /// the cache state is held in `CacheBinding`, not here.
     view: Option<BTreeMap<String, Record>>,
     /// Absolute unix-seconds for the next daily-flush boundary, or
@@ -173,13 +178,13 @@ impl FilesystemSink {
                 }
             }
         }
-        // NOTE: naive — computes the next future occurrence and
+        // NOTE: naive; computes the next future occurrence and
         // accepts that a mirror down at the boundary silently misses
         // it for that day. The richer version (planned alongside
         // debounce) inspects the destination chain (mtime / last
         // record timestamp) and uses last_flush_at to decide whether
         // the boundary was already honored. The shape of this
-        // computation — `(target_secs, now) -> next_unix` — does not
+        // computation; `(target_secs, now) -> next_unix`; does not
         // change.
         let next_daily_unix = cfg
             .flush
@@ -193,6 +198,7 @@ impl FilesystemSink {
             values: cfg.values,
             compaction: cfg.compaction,
             flush: cfg.flush,
+            flush_observer: None,
             durable_position,
             buffer: Vec::new(),
             buffer_bytes: 0,
@@ -216,7 +222,7 @@ impl FilesystemSink {
         if now < next {
             return Ok(());
         }
-        // Boundary crossed. Flush only if there's data — an empty-
+        // Boundary crossed. Flush only if there's data; an empty-
         // buffer slot is silently skipped (no zero-record file). The
         // boundary is *always* advanced so we don't fire repeatedly
         // until tomorrow.
@@ -391,6 +397,13 @@ impl FilesystemSink {
             trigger = trigger.as_str(),
             "flushed batch"
         );
+        // Notify the destination-flush observer if one is wired.
+        // The observer is expected to do something cheap (queue the
+        // event for an async drainer); inlining HTTP here would
+        // serialise per-flush write latency behind webhook RTT.
+        if let Some(observer) = self.flush_observer.as_ref() {
+            observer.on_flushed(from, to);
+        }
         Ok(())
     }
 }
@@ -433,7 +446,7 @@ impl Sink for FilesystemSink {
         }
         // Append mode also rejects forward gaps (the destination
         // chain forbids holes). Under compaction:log forward gaps
-        // are legitimate — the upstream may have compacted the
+        // are legitimate; the upstream may have compacted the
         // intermediate offsets out and the snapshot only stores
         // latest-per-key.
         if !matches!(self.compaction, Some(CompactionMode::Log)) && record.source_offset != expected
@@ -469,7 +482,7 @@ impl Sink for FilesystemSink {
             }
         }
         // Apply to the local compaction view per-record (was per-flush
-        // before — moved here so view content tracks the consume loop
+        // before; moved here so view content tracks the consume loop
         // exactly, independent of the flush cadence).
         if let Some(view) = self.view.as_mut() {
             let key_bytes = record.key.as_ref().expect("checked non-null above");
@@ -529,6 +542,10 @@ impl Sink for FilesystemSink {
         self.durable_position = low_watermark;
         Ok(())
     }
+
+    fn set_flush_observer(&mut self, observer: std::sync::Arc<dyn mirror_core::FlushObserver>) {
+        self.flush_observer = Some(observer);
+    }
 }
 
 fn unix_now_seconds() -> u64 {
@@ -547,7 +564,7 @@ pub fn schedule_next_daily_public(target_secs: u32, now_unix: u64) -> u64 {
 
 /// First future unix-seconds at which the daily wall-clock-UTC
 /// boundary should fire, given a target seconds-since-midnight and
-/// the current unix-seconds. Pure math, no I/O — kept as a free
+/// the current unix-seconds. Pure math, no I/O; kept as a free
 /// function so the smart-startup variant (which inspects the
 /// destination chain) can replace just this body.
 pub(crate) fn schedule_next_daily(target_secs: u32, now_unix: u64) -> u64 {
@@ -599,7 +616,7 @@ fn scan_validate(dir: &Path, format: Format) -> Result<u64, FsError> {
         if name.contains(".tmp.") {
             continue;
         }
-        // Files of the wrong extension are an error — mixed-format
+        // Files of the wrong extension are an error; mixed-format
         // dirs are forbidden.
         if let Some(other_ext) = file_extension(&name) {
             if other_ext != expected_ext && naming::parse_filename(&name, other_ext).is_some() {
@@ -705,7 +722,7 @@ fn scan_validate_compacted(dir: &Path, format: Format) -> Result<(u64, Option<Pa
 }
 
 /// Decode a snapshot file into the in-memory materialized view. Keys
-/// are required to be valid UTF-8 (we wrote them as Utf8 — a non-UTF-8
+/// are required to be valid UTF-8 (we wrote them as Utf8; a non-UTF-8
 /// key here would be data corruption).
 fn load_view(path: &Path, format: Format) -> Result<BTreeMap<String, Record>, FsError> {
     let bytes = std::fs::read(path).map_err(|e| FsError::Io {
diff --git a/crates/mirror-fs/tests/flush_observer.rs b/crates/mirror-fs/tests/flush_observer.rs
new file mode 100644
index 0000000..d696ea1
--- /dev/null
+++ b/crates/mirror-fs/tests/flush_observer.rs
@@ -0,0 +1,122 @@
+//! Pin the contract that [`FilesystemSink::set_flush_observer`]
+//! fires the installed observer exactly once per durable batch flush,
+//! with the source-offset range `(from, to)` matching the just-
+//! flushed file's bounds.
+//!
+//! This is the load-bearing test for the `notify.trigger.on:
+//! destination-flush` dispatch path; the webhook receiver gets one
+//! POST per (from, to) the observer fires.
+
+use std::sync::Arc;
+use std::sync::Mutex;
+use std::time::Duration;
+
+use mirror_core::{FlushObserver, Record, Sink, TimestampType};
+use mirror_envelope::{Format, ParquetCompression};
+use mirror_fs::{FilesystemSink, FilesystemSinkConfig, FlushTriggers};
+
+fn rec(offset: u64) -> Record {
+    Record {
+        topic: "fs-observer".into(),
+        partition: 0,
+        source_offset: offset,
+        timestamp_ms: Some(1_700_000_000_000 + offset as i64),
+        timestamp_type: TimestampType::CreateTime,
+        key: Some(format!("k{offset}").into_bytes()),
+        value: Some(format!("v{offset}").into_bytes()),
+        headers: vec![],
+    }
+}
+
+fn cfg(root: &std::path::Path, max_offsets: u64) -> FilesystemSinkConfig {
+    FilesystemSinkConfig {
+        root: root.to_path_buf(),
+        destination_name: "ops".into(),
+        partition: 0,
+        format: Format::Ndjson,
+        compression: ParquetCompression::Zstd1,
+        keys: mirror_envelope::ColumnType::Utf8,
+        values: mirror_envelope::ColumnType::Utf8,
+        compaction: None,
+        cache: None,
+        flush: FlushTriggers {
+            max_time: Duration::from_secs(3600),
+            max_bytes: u64::MAX,
+            max_offsets,
+            daily_at_utc_seconds: None,
+        },
+    }
+}
+
+#[derive(Debug, Default)]
+struct Recording {
+    fires: Mutex<Vec<(u64, u64)>>,
+}
+
+impl FlushObserver for Recording {
+    fn on_flushed(&self, from: u64, to: u64) {
+        self.fires.lock().unwrap().push((from, to));
+    }
+}
+
+#[tokio::test]
+async fn observer_fires_once_per_max_offsets_flush() {
+    let tmp = tempfile::tempdir().unwrap();
+    let mut sink = FilesystemSink::open(cfg(tmp.path(), 3)).unwrap();
+    let obs = Arc::new(Recording::default());
+    sink.set_flush_observer(obs.clone() as Arc<dyn FlushObserver>);
+
+    sink.write(rec(0)).await.unwrap();
+    sink.write(rec(1)).await.unwrap();
+    sink.write(rec(2)).await.unwrap(); // trips max-offsets=3 → first flush
+    sink.write(rec(3)).await.unwrap();
+    sink.write(rec(4)).await.unwrap();
+    sink.write(rec(5)).await.unwrap(); // second flush
+
+    let fires = obs.fires.lock().unwrap().clone();
+    assert_eq!(
+        fires,
+        vec![(0, 2), (3, 5)],
+        "each max-offsets trip must fire exactly once with the batch's (from, to)"
+    );
+}
+
+#[tokio::test]
+async fn observer_fires_on_explicit_flush_when_buffer_non_empty() {
+    let tmp = tempfile::tempdir().unwrap();
+    let mut sink = FilesystemSink::open(cfg(tmp.path(), 1_000)).unwrap();
+    let obs = Arc::new(Recording::default());
+    sink.set_flush_observer(obs.clone() as Arc<dyn FlushObserver>);
+
+    sink.write(rec(0)).await.unwrap();
+    sink.write(rec(1)).await.unwrap();
+    sink.flush().await.unwrap(); // explicit (graceful shutdown path)
+
+    let fires = obs.fires.lock().unwrap().clone();
+    assert_eq!(fires, vec![(0, 1)]);
+}
+
+#[tokio::test]
+async fn observer_does_not_fire_on_explicit_flush_when_buffer_empty() {
+    let tmp = tempfile::tempdir().unwrap();
+    let mut sink = FilesystemSink::open(cfg(tmp.path(), 1_000)).unwrap();
+    let obs = Arc::new(Recording::default());
+    sink.set_flush_observer(obs.clone() as Arc<dyn FlushObserver>);
+
+    sink.flush().await.unwrap();
+    assert!(
+        obs.fires.lock().unwrap().is_empty(),
+        "no records buffered → no flush event → observer must not fire"
+    );
+}
+
+#[tokio::test]
+async fn no_observer_does_not_panic() {
+    // Sanity: leaving the default no-op observer in place must not
+    // panic across the same record + flush path.
+    let tmp = tempfile::tempdir().unwrap();
+    let mut sink = FilesystemSink::open(cfg(tmp.path(), 2)).unwrap();
+    sink.write(rec(0)).await.unwrap();
+    sink.write(rec(1)).await.unwrap(); // flush
+    sink.flush().await.unwrap();
+}
diff --git a/crates/mirror-fs/tests/loop_invariants_with_real_sink.rs b/crates/mirror-fs/tests/loop_invariants_with_real_sink.rs
new file mode 100644
index 0000000..a1b5a6e
--- /dev/null
+++ b/crates/mirror-fs/tests/loop_invariants_with_real_sink.rs
@@ -0,0 +1,270 @@
+//! Loop-invariant tests that drive `run_mirror` against a *real*
+//! `FilesystemSink` (tempfile-backed) instead of mocks.
+//!
+//! ## Why this exists
+//!
+//! `mirror-core`'s own `tests/loop_invariants.rs` runs against the
+//! in-crate `MockSink`. The mock has been a useful fast lane for
+//! invariant tests, but production bugs have repeatedly turned out
+//! to live in the mock-vs-real gap: the mock had no buffer/durable
+//! split, no empty-buffer precondition on `align_to_source_low_watermark`,
+//! and (until the PR that bundles this file) no notion of forward
+//! gaps under `compaction:log`. Each gap let a real-sink-only bug
+//! pass `cargo test` and break in production.
+//!
+//! These tests close that gap by driving the same run loop through
+//! the *actual* `FilesystemSink`. They live in mirror-fs (not
+//! mirror-core) because the dep direction is `mirror-fs -> mirror-core`;
+//! mirror-core can't reach for `FilesystemSink` even as a dev-dep
+//! without creating a dev-dep cycle.
+//!
+//! The cases here are deliberately a curated subset of the mock-based
+//! suite; the ones where sink behaviour is the load-bearing
+//! invariant. Other cases (pure error-variant matching, MockSource's
+//! `Hang`/`Error` scripts) stay in `mirror-core/tests/loop_invariants.rs`
+//! where they're already cheap.
+
+use std::path::Path;
+use std::time::Duration;
+
+use mirror_core::mock::{MockSource, MockSourceEvent};
+use mirror_core::{run_mirror, MirrorError, Record, TimestampType};
+use mirror_envelope::{ColumnType, Format, ParquetCompression};
+use mirror_fs::{
+    naming, read_all_records, CompactionMode, FilesystemSink, FilesystemSinkConfig, FlushTriggers,
+};
+
+fn rec(offset: u64) -> Record {
+    Record {
+        topic: "loop-real".into(),
+        partition: 0,
+        source_offset: offset,
+        timestamp_ms: Some(1_700_000_000_000 + offset as i64),
+        timestamp_type: TimestampType::CreateTime,
+        key: Some(format!("k{}", offset % 4).into_bytes()),
+        value: Some(format!("v{offset}").into_bytes()),
+        headers: vec![],
+    }
+}
+
+fn fs_cfg(root: &Path, compaction: Option<CompactionMode>) -> FilesystemSinkConfig {
+    let format = match compaction {
+        Some(CompactionMode::Log) => Format::Parquet,
+        None => Format::Ndjson,
+    };
+    FilesystemSinkConfig {
+        root: root.to_path_buf(),
+        destination_name: "ops".into(),
+        partition: 0,
+        format,
+        compression: ParquetCompression::Zstd1,
+        keys: ColumnType::Utf8,
+        values: ColumnType::Utf8,
+        compaction,
+        cache: None,
+        // High thresholds; explicit flush_now is the only thing
+        // that rotates a file during these tests so we can drive
+        // buffer state precisely from the events list.
+        flush: FlushTriggers {
+            max_time: Duration::from_secs(3600),
+            max_bytes: u64::MAX,
+            max_offsets: u64::MAX,
+            daily_at_utc_seconds: None,
+        },
+    }
+}
+
+/// Drive `run_mirror` against a real FS sink and a scripted source.
+///
+/// The shutdown future is a `tokio::time::sleep(grace)`, so the loop
+/// has `grace` milliseconds to process events before graceful
+/// shutdown fires. A short grace (~50ms) is enough to chew through
+/// the scripted events; the source's terminal `Hang` event then
+/// parks the poll future indefinitely until the sleep resolves and
+/// triggers graceful shutdown.
+fn drive_real_fs(
+    compaction: Option<CompactionMode>,
+    events: Vec<MockSourceEvent>,
+    grace: Duration,
+) -> (Result<(), MirrorError>, tempfile::TempDir) {
+    let tempdir = tempfile::tempdir().expect("tempdir");
+    let sink = FilesystemSink::open(fs_cfg(tempdir.path(), compaction)).expect("open sink");
+    let source = MockSource::new(events);
+    let result = tokio::runtime::Builder::new_current_thread()
+        .enable_time()
+        .build()
+        .unwrap()
+        .block_on(async move { run_mirror(source, sink, tokio::time::sleep(grace)).await });
+    (result, tempdir)
+}
+
+#[test]
+fn append_mode_writes_records_in_order_to_real_disk() {
+    // Three contiguous records, then graceful shutdown after a
+    // 100ms grace window. The flush-on-shutdown should produce
+    // a `0-2.ndjson` file containing all three records.
+    let (result, tempdir) = drive_real_fs(
+        None,
+        vec![
+            MockSourceEvent::Record(rec(0)),
+            MockSourceEvent::Record(rec(1)),
+            MockSourceEvent::Record(rec(2)),
+            MockSourceEvent::Hang,
+        ],
+        Duration::from_millis(100),
+    );
+    assert!(
+        matches!(result, Ok(())),
+        "graceful shutdown expected, got: {result:?}"
+    );
+    let dir = naming::partition_dir(tempdir.path(), "ops", 0);
+    let records = read_all_records(&dir, Format::Ndjson).expect("read disk");
+    assert_eq!(
+        records.iter().map(|r| r.source_offset).collect::<Vec<_>>(),
+        vec![0, 1, 2],
+        "all three records must land on disk after graceful shutdown's flush"
+    );
+}
+
+#[test]
+fn append_mode_real_sink_rejects_source_gap() {
+    // Source skips from 0 to 5; append mode must reject the gap
+    // via SourceGapAboveExpected from the run loop. Disk should
+    // contain only the first record (or none, depending on whether
+    // the buffer flushed before the error fired; we don't assert).
+    let (result, _td) = drive_real_fs(
+        None,
+        vec![
+            MockSourceEvent::Record(rec(0)),
+            MockSourceEvent::Record(rec(5)),
+        ],
+        Duration::from_secs(1),
+    );
+    match result {
+        Err(MirrorError::SourceGapAboveExpected { expected, got }) => {
+            assert_eq!((expected, got), (1, 5));
+        }
+        other => panic!("expected SourceGapAboveExpected, got {other:?}"),
+    }
+}
+
+#[test]
+fn real_sink_rejects_source_going_backwards() {
+    // Source delivers 5 then 3; always fatal, in any mode.
+    let (result, _td) = drive_real_fs(
+        Some(CompactionMode::Log),
+        vec![
+            MockSourceEvent::Record(rec(5)),
+            MockSourceEvent::Record(rec(3)),
+        ],
+        Duration::from_secs(1),
+    );
+    match result {
+        Err(MirrorError::SourceWentBackwards { expected, got }) => {
+            assert_eq!((expected, got), (6, 3));
+        }
+        other => panic!("expected SourceWentBackwards, got {other:?}"),
+    }
+}
+
+#[test]
+fn compaction_log_real_sink_accepts_bootstrap_gap_from_compact_only_topic() {
+    // The cleanup.policy=compact case: broker reports low_watermark=0
+    // (default for MockSource), the loop seeks(0), then the source
+    // delivers an offset much later because compaction skipped earlier
+    // records. The run loop must align expected to the delivered
+    // offset and the real FilesystemSink must accept the gap.
+    let (result, tempdir) = drive_real_fs(
+        Some(CompactionMode::Log),
+        vec![MockSourceEvent::Record(rec(461)), MockSourceEvent::Hang],
+        Duration::from_millis(100),
+    );
+    // Graceful shutdown after the loop processed the aligned write.
+    // The PRE-FIX run loop would have errored here with
+    // SourceOffsetMismatch / Sink::UnexpectedPosition (expected 0,
+    // got 461) before the shutdown timer ever fired.
+    assert!(
+        matches!(result, Ok(())),
+        "expected graceful shutdown after aligned write, got: {result:?}"
+    );
+    let dir = naming::partition_dir(tempdir.path(), "ops", 0);
+    let records = read_all_records(&dir, Format::Parquet).expect("read disk");
+    assert_eq!(
+        records.iter().map(|r| r.source_offset).collect::<Vec<_>>(),
+        vec![461],
+        "the aligned record at offset 461 must land on disk"
+    );
+}
+
+#[test]
+fn compaction_log_real_sink_accepts_repeated_midstream_gaps() {
+    // The production repro the PR fixes: after the first aligned
+    // write at offset 461, the broker delivers 466 then 470. The
+    // buffer is non-empty so the original mid-stream attempt to call
+    // `align_to_source_low_watermark` would have tripped the
+    // empty-buffer precondition. The new path lets the run loop bump
+    // `expected` and the sink's write accept the gap.
+    let (result, tempdir) = drive_real_fs(
+        Some(CompactionMode::Log),
+        vec![
+            MockSourceEvent::Record(rec(461)),
+            MockSourceEvent::Record(rec(466)),
+            MockSourceEvent::Record(rec(470)),
+            MockSourceEvent::Hang,
+        ],
+        Duration::from_millis(100),
+    );
+    // The PRE-FIX path crashed on the second record (mid-stream gap
+    // tripped `align_to_source_low_watermark`'s empty-buffer
+    // precondition). Graceful exit here means all three records were
+    // accepted into the buffer and the flush rolled them into a
+    // single snapshot file.
+    assert!(
+        matches!(result, Ok(())),
+        "expected graceful shutdown after all three gapped writes, got: {result:?}"
+    );
+    // The snapshot is a compaction:log file `<from>-<max>.parquet`.
+    // `from` = durable_position at flush time (0, since no prior
+    // flush happened); `max` = last buffered source_offset (470).
+    let dir = naming::partition_dir(tempdir.path(), "ops", 0);
+    let mut files: Vec<String> = std::fs::read_dir(&dir)
+        .expect("readdir")
+        .filter_map(|e| {
+            let p = e.ok()?.path();
+            let n = p.file_name()?.to_str()?.to_string();
+            (n.ends_with(".parquet") && !n.contains(".tmp.")).then_some(n)
+        })
+        .collect();
+    files.sort();
+    assert_eq!(
+        files,
+        vec!["00000000000000000000-00000000000000000470.parquet".to_string()],
+        "the snapshot file's range must cover all three accepted records"
+    );
+    // The snapshot's compaction view is "latest per key". The
+    // three accepted records have keys `k{offset % 4}`; so
+    // offsets 461, 466, 470 map to keys k1, k2, k2. The k2 entry
+    // is deduplicated to its latest value (v470), leaving two
+    // distinct keys in the snapshot.
+    let records = read_all_records(&dir, Format::Parquet).expect("read disk");
+    let mut by_key: std::collections::BTreeMap<Vec<u8>, &Record> =
+        std::collections::BTreeMap::new();
+    for r in &records {
+        by_key.insert(r.key.clone().expect("key"), r);
+    }
+    assert_eq!(
+        by_key.len(),
+        2,
+        "two distinct keys after compaction; got: {records:?}"
+    );
+    assert_eq!(
+        by_key.get(&b"k1"[..]).expect("k1 present").value.as_deref(),
+        Some(b"v461".as_slice()),
+        "k1's value is its only record (v461)"
+    );
+    assert_eq!(
+        by_key.get(&b"k2"[..]).expect("k2 present").value.as_deref(),
+        Some(b"v470".as_slice()),
+        "k2's value is the latest record at offset 470, not the earlier v466"
+    );
+}
diff --git a/crates/mirror-fs/tests/sink_matrix.rs b/crates/mirror-fs/tests/sink_matrix.rs
new file mode 100644
index 0000000..7056f98
--- /dev/null
+++ b/crates/mirror-fs/tests/sink_matrix.rs
@@ -0,0 +1,481 @@
+//! Sink-trait matrix against a real `FilesystemSink`.
+//!
+//! Walks the (compaction-mode × buffer-state × action) grid from
+//! `REVIEW_TEST_STRATEGY.md §4` against a real sink backed by
+//! `tempfile::TempDir`; no mocks, so an invariant change in the
+//! real sink surfaces here instead of slipping past a mock that
+//! quietly diverged from production. The full 16-cell table is in
+//! the `MATRIX` const at the bottom of this file; each row names
+//! what it covers (e.g. `log/non-empty/delivered>exp`) so a CI
+//! failure points at the regressed cell directly.
+//!
+//! The matrix is constructed once per test (Rust integration tests
+//! sit in their own binary and we want each row's failure to be
+//! attributed), but the per-row setup is deterministic and cheap:
+//! one tempdir + a handful of writes per cell.
+//!
+//! **Why this exists.** The mid-stream-gap bug
+//! (`log/non-empty/delivered>exp`) was a new cell that the existing
+//! one-test-per-scenario layout didn't naturally encode. A table
+//! catches "we added gap acceptance and missed one of the buffer
+//! states" by making *every* gated cell explicit. It also lets the
+//! S3 sink's matrix (see `crates/mirror-s3/tests/sink_matrix.rs`)
+//! assert symmetry: any FS row that's present must have an S3
+//! counterpart with the same outcome, modulo backend specifics.
+
+use std::time::Duration;
+
+use mirror_core::{Record, Sink, SinkError, TimestampType};
+use mirror_envelope::{ColumnType, Format, ParquetCompression};
+use mirror_fs::{CompactionMode, FilesystemSink, FilesystemSinkConfig, FlushTriggers};
+
+fn rec(offset: u64) -> Record {
+    Record {
+        topic: "sink-matrix".into(),
+        partition: 0,
+        source_offset: offset,
+        timestamp_ms: Some(1_700_000_000_000 + offset as i64),
+        timestamp_type: TimestampType::CreateTime,
+        key: Some(format!("k{}", offset % 4).into_bytes()),
+        value: Some(format!("v{offset}").into_bytes()),
+        headers: vec![],
+    }
+}
+
+fn cfg(root: &std::path::Path, compaction: Option<CompactionMode>) -> FilesystemSinkConfig {
+    // Compaction:log requires Parquet (an explicit precondition in
+    // mirror_config validation). Append mode runs against ndjson
+    // because the existing `tests/sink.rs` shape uses ndjson and
+    // mirroring that keeps the failure output operator-friendly.
+    let format = match compaction {
+        Some(CompactionMode::Log) => Format::Parquet,
+        None => Format::Ndjson,
+    };
+    FilesystemSinkConfig {
+        root: root.to_path_buf(),
+        destination_name: "ops".into(),
+        partition: 0,
+        format,
+        compression: ParquetCompression::Zstd1,
+        keys: ColumnType::Utf8,
+        values: ColumnType::Utf8,
+        compaction,
+        cache: None,
+        // Huge thresholds so explicit `flush()` is the only thing
+        // that actually rotates a file; matrix rows that *don't*
+        // call flush get to control buffer state precisely.
+        flush: FlushTriggers {
+            max_time: Duration::from_secs(3600),
+            max_bytes: u64::MAX,
+            max_offsets: u64::MAX,
+            daily_at_utc_seconds: None,
+        },
+    }
+}
+
+/// Compaction mode the cell exercises.
+#[derive(Debug, Clone, Copy)]
+enum Mode {
+    Append,
+    Log,
+}
+
+impl Mode {
+    fn to_compaction(self) -> Option<CompactionMode> {
+        match self {
+            Mode::Append => None,
+            Mode::Log => Some(CompactionMode::Log),
+        }
+    }
+}
+
+/// Buffer state the cell exercises *at the moment of the action*.
+/// Set up by the preload phase: `Empty` flushes after the preload,
+/// `NonEmpty` leaves the preloaded records in the buffer.
+#[derive(Debug, Clone, Copy)]
+enum BufferState {
+    Empty,
+    NonEmpty,
+}
+
+/// The action under test.
+#[derive(Debug)]
+enum Action {
+    /// `sink.write(rec(offset))`.
+    Write(u64),
+    /// `sink.flush_now()` and assert on the produced filename.
+    /// Tuple is the expected `(from, to)` parsed back from disk.
+    Flush {
+        expected_from: u64,
+        expected_to: u64,
+    },
+    /// `sink.align_to_source_low_watermark(low_watermark)`.
+    Align { low_watermark: u64 },
+    /// `sink.next_expected_offset()`.
+    NextExpected,
+}
+
+#[derive(Debug)]
+enum Outcome {
+    /// The action returned `Ok(())` (write/flush/align).
+    Ok,
+    /// `next_expected_offset()` returned this value.
+    NextExpectedIs(u64),
+    /// `SinkError::UnexpectedPosition { expected, actual }`.
+    UnexpectedPosition { expected: u64, actual: u64 },
+    /// `SinkError::Transport(message)` where the message contains
+    /// this substring. Used for the align preconditions, which fail
+    /// with descriptive transport errors rather than the structured
+    /// `UnexpectedPosition` variant.
+    TransportContains(&'static str),
+}
+
+struct Case {
+    name: &'static str,
+    mode: Mode,
+    /// Records to write before the action runs. Numeric offsets.
+    /// For compaction:log cases the preload offsets may include
+    /// gaps; for append mode they must be contiguous starting at 0
+    /// (otherwise the preload itself fails).
+    preload: &'static [u64],
+    /// `Empty` → flush after the preload (so the buffer is empty at
+    /// action time); `NonEmpty` → skip the flush.
+    buffer_state: BufferState,
+    action: Action,
+    expected: Outcome,
+}
+
+async fn run_case(case: &Case) {
+    let tempdir = tempfile::tempdir().expect("tempdir");
+    let mut sink = FilesystemSink::open(cfg(tempdir.path(), case.mode.to_compaction()))
+        .expect("open FilesystemSink");
+
+    // Preload phase.
+    for &offset in case.preload {
+        sink.write(rec(offset))
+            .await
+            .unwrap_or_else(|e| panic!("[{}] preload write({offset}) failed: {e}", case.name));
+    }
+    if matches!(case.buffer_state, BufferState::Empty) && !case.preload.is_empty() {
+        sink.flush_now()
+            .await
+            .unwrap_or_else(|e| panic!("[{}] preload flush failed: {e}", case.name));
+    }
+
+    // Action phase.
+    let observed = match &case.action {
+        Action::Write(offset) => sink.write(rec(*offset)).await.map(|()| None),
+        Action::Flush {
+            expected_from,
+            expected_to,
+        } => {
+            sink.flush_now().await.map(|()| {
+                // Filename verification: the latest ndjson/parquet
+                // file in the partition dir must be `<from>-<to>`.
+                let dir = mirror_fs::naming::partition_dir(tempdir.path(), "ops", 0);
+                let mut files: Vec<String> = std::fs::read_dir(&dir)
+                    .expect("readdir")
+                    .filter_map(|e| {
+                        let p = e.ok()?.path();
+                        let name = p.file_name()?.to_str()?.to_string();
+                        let is_real = (name.ends_with(".ndjson") || name.ends_with(".parquet"))
+                            && !name.contains(".tmp.");
+                        is_real.then_some(name)
+                    })
+                    .collect();
+                files.sort();
+                let last = files
+                    .last()
+                    .unwrap_or_else(|| panic!("[{}] no flushed file found", case.name));
+                // Filenames look like `00000000000000000000-00000000000000000004.ndjson`.
+                let ext = if matches!(case.mode, Mode::Log) {
+                    "parquet"
+                } else {
+                    "ndjson"
+                };
+                let expected_name = format!("{expected_from:020}-{expected_to:020}.{ext}");
+                assert_eq!(
+                    last, &expected_name,
+                    "[{}] flushed filename should encode (from={expected_from}, to={expected_to})",
+                    case.name
+                );
+                None
+            })
+        }
+        Action::Align { low_watermark } => sink
+            .align_to_source_low_watermark(*low_watermark)
+            .await
+            .map(|()| None),
+        Action::NextExpected => sink.next_expected_offset().await.map(Some),
+    };
+
+    // Outcome assertion.
+    match (&case.expected, observed) {
+        (Outcome::Ok, Ok(_)) => {}
+        (Outcome::NextExpectedIs(expected), Ok(Some(value))) => {
+            assert_eq!(
+                value, *expected,
+                "[{}] next_expected_offset value",
+                case.name
+            );
+        }
+        (
+            Outcome::UnexpectedPosition {
+                expected: exp,
+                actual: act,
+            },
+            Err(SinkError::UnexpectedPosition { expected, actual }),
+        ) => {
+            assert_eq!(
+                (expected, actual),
+                (*exp, *act),
+                "[{}] UnexpectedPosition payload",
+                case.name
+            );
+        }
+        (Outcome::TransportContains(needle), Err(SinkError::Transport(msg))) => {
+            assert!(
+                msg.contains(needle),
+                "[{}] Transport({msg:?}) should contain {needle:?}",
+                case.name
+            );
+        }
+        (expected, observed) => {
+            panic!(
+                "[{}] mismatch: expected={expected:?} observed={observed:?}",
+                case.name
+            );
+        }
+    }
+}
+
+#[tokio::test]
+async fn matrix() {
+    let cases = matrix_cases();
+    for case in &cases {
+        run_case(case).await;
+    }
+}
+
+fn matrix_cases() -> Vec<Case> {
+    vec![
+        // ============================================================
+        //  APPEND MODE; every gap is fatal, equality is the only OK
+        // ============================================================
+
+        // append × empty × write at expected → OK
+        Case {
+            name: "append/empty/write_at_expected/ok",
+            mode: Mode::Append,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Write(0),
+            expected: Outcome::Ok,
+        },
+        // append × empty × write above expected → reject (gap forbidden)
+        Case {
+            name: "append/empty/write_above_expected/rejects",
+            mode: Mode::Append,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Write(5),
+            expected: Outcome::UnexpectedPosition {
+                expected: 0,
+                actual: 5,
+            },
+        },
+        // append × empty (post-flush, durable=5) × write below durable → reject (backwards)
+        Case {
+            name: "append/empty_after_flush/write_below_durable/rejects",
+            mode: Mode::Append,
+            preload: &[0, 1, 2, 3, 4],
+            buffer_state: BufferState::Empty, // flush after preload
+            action: Action::Write(3),
+            expected: Outcome::UnexpectedPosition {
+                expected: 5,
+                actual: 3,
+            },
+        },
+        // append × non-empty × write at expected → OK
+        Case {
+            name: "append/non_empty/write_at_expected/ok",
+            mode: Mode::Append,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(3),
+            expected: Outcome::Ok,
+        },
+        // append × non-empty × write above expected → reject (gap forbidden)
+        Case {
+            name: "append/non_empty/write_above_expected/rejects",
+            mode: Mode::Append,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(7),
+            expected: Outcome::UnexpectedPosition {
+                expected: 3,
+                actual: 7,
+            },
+        },
+        // append × non-empty × write below buffered head → reject (backwards)
+        Case {
+            name: "append/non_empty/write_below_buffered_head/rejects",
+            mode: Mode::Append,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(1),
+            expected: Outcome::UnexpectedPosition {
+                expected: 3,
+                actual: 1,
+            },
+        },
+        // ============================================================
+        //  COMPACTION:LOG; forward gaps OK, backwards still fatal
+        // ============================================================
+
+        // log × empty × write at expected (offset 0) → OK
+        Case {
+            name: "log/empty/write_at_expected/ok",
+            mode: Mode::Log,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Write(0),
+            expected: Outcome::Ok,
+        },
+        // log × empty × write above expected (bootstrap-time gap from compact-only topic) → OK
+        Case {
+            name: "log/empty/write_above_expected/ok_bootstrap_gap",
+            mode: Mode::Log,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Write(461),
+            expected: Outcome::Ok,
+        },
+        // log × empty (post-flush, durable=5) × write below durable → reject (backwards)
+        Case {
+            name: "log/empty_after_flush/write_below_durable/rejects",
+            mode: Mode::Log,
+            preload: &[0, 1, 2, 3, 4],
+            buffer_state: BufferState::Empty,
+            action: Action::Write(3),
+            expected: Outcome::UnexpectedPosition {
+                expected: 5,
+                actual: 3,
+            },
+        },
+        // log × non-empty × write at expected → OK
+        Case {
+            name: "log/non_empty/write_at_expected/ok",
+            mode: Mode::Log,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(3),
+            expected: Outcome::Ok,
+        },
+        // log × non-empty × write above expected (mid-stream compaction gap) → OK
+        // This is THE bug that motivated the matrix.
+        Case {
+            name: "log/non_empty/write_above_expected/ok_midstream_gap",
+            mode: Mode::Log,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(7),
+            expected: Outcome::Ok,
+        },
+        // log × non-empty × write below buffered head → reject (backwards)
+        Case {
+            name: "log/non_empty/write_below_buffered_head/rejects",
+            mode: Mode::Log,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(1),
+            expected: Outcome::UnexpectedPosition {
+                expected: 3,
+                actual: 1,
+            },
+        },
+        // ============================================================
+        //  ALIGN; bootstrap-only, empty-buffer precondition
+        // ============================================================
+
+        // log × empty × align(low_watermark=461) → OK
+        Case {
+            name: "log/empty/align/ok",
+            mode: Mode::Log,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Align { low_watermark: 461 },
+            expected: Outcome::Ok,
+        },
+        // log × non-empty × align → reject (empty-buffer precondition)
+        Case {
+            name: "log/non_empty/align/rejects_with_empty_buffer_precondition",
+            mode: Mode::Log,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Align { low_watermark: 461 },
+            expected: Outcome::TransportContains("inconsistent state"),
+        },
+        // append × empty × align → reject (compaction-mode precondition)
+        Case {
+            name: "append/empty/align/rejects_on_non_compaction_sink",
+            mode: Mode::Append,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Align { low_watermark: 461 },
+            expected: Outcome::TransportContains("non-compaction sink"),
+        },
+        // ============================================================
+        //  FLUSH; filename encodes the offset range correctly
+        // ============================================================
+
+        // append × non-empty × flush → file `<dur>-<dur+len-1>` (contiguous)
+        Case {
+            name: "append/non_empty/flush/contiguous_filename",
+            mode: Mode::Append,
+            preload: &[0, 1, 2, 3, 4],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Flush {
+                expected_from: 0,
+                expected_to: 4,
+            },
+            expected: Outcome::Ok,
+        },
+        // log × non-empty × flush after gap-spanning writes → file `<dur>-<max(offsets)>`
+        // The buffer carries offsets 0, 461, 466; the snapshot file
+        // must name `0-466.parquet` (not `0-2` from len-1).
+        Case {
+            name: "log/non_empty_with_gaps/flush/uses_max_offset_for_to",
+            mode: Mode::Log,
+            preload: &[0, 461, 466],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Flush {
+                expected_from: 0,
+                expected_to: 466,
+            },
+            expected: Outcome::Ok,
+        },
+        // ============================================================
+        //  NEXT_EXPECTED_OFFSET; reflects buffered_head() correctly
+        // ============================================================
+
+        // append × non-empty × next_expected → durable + buffer.len()
+        Case {
+            name: "append/non_empty/next_expected/durable_plus_len",
+            mode: Mode::Append,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::NextExpected,
+            expected: Outcome::NextExpectedIs(3),
+        },
+        // log × non-empty with gaps × next_expected → last_buffered + 1
+        Case {
+            name: "log/non_empty_with_gaps/next_expected/last_buffered_plus_one",
+            mode: Mode::Log,
+            preload: &[0, 461, 466],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::NextExpected,
+            expected: Outcome::NextExpectedIs(467),
+        },
+    ]
+}
diff --git a/crates/mirror-kafka/src/lib.rs b/crates/mirror-kafka/src/lib.rs
index 544cb2e..5bab1b0 100644
--- a/crates/mirror-kafka/src/lib.rs
+++ b/crates/mirror-kafka/src/lib.rs
@@ -8,15 +8,16 @@
 
 #![allow(clippy::result_large_err)]
 
+use std::sync::atomic::{AtomicU64, Ordering};
 use std::sync::Arc;
 use std::time::Duration;
 
 use async_trait::async_trait;
 use mirror_core::{
-    ColumnType, Header, Record, Sink, SinkError, Source, SourceError, TimestampType,
+    ColumnType, Header, Record, Sink, SinkError, Source, SourceError, TimestampType, WriteObserver,
 };
 use rdkafka::config::ClientConfig;
-use rdkafka::consumer::{BaseConsumer, Consumer, StreamConsumer};
+use rdkafka::consumer::{BaseConsumer, CommitMode, Consumer, StreamConsumer};
 use rdkafka::message::{Header as RdHeader, Headers, Message, OwnedHeaders};
 use rdkafka::producer::{FutureProducer, FutureRecord};
 use rdkafka::topic_partition_list::Offset;
@@ -54,6 +55,45 @@ pub fn fetch_low_watermark(
     Ok(low)
 }
 
+/// Read the broker's `__consumer_offsets` entry for the
+/// `(group_id, topic, partition)` tuple. `Ok(None)` is the
+/// "no committed value yet" sentinel (a fresh group, or a group
+/// that hasn't committed for this partition). Sync; wrap in
+/// `spawn_blocking` for async contexts. Mirrors the `fetch_*_watermark`
+/// pattern so the supervisor can read the per-mirror committed
+/// offset at startup without instantiating a full `KafkaSource`.
+pub fn fetch_committed_offset(
+    bootstrap: &str,
+    group_id: &str,
+    topic: &str,
+    partition: i32,
+    timeout: Duration,
+) -> Result<Option<u64>, KafkaError> {
+    let consumer: BaseConsumer = ClientConfig::new()
+        .set("bootstrap.servers", bootstrap)
+        .set("group.id", group_id)
+        .set("enable.auto.commit", "false")
+        .create()
+        .map_err(|e| KafkaError::Init(e.to_string()))?;
+    let mut tpl = TopicPartitionList::new();
+    tpl.add_partition(topic, partition);
+    let filled = consumer
+        .committed_offsets(tpl, Timeout::After(timeout))
+        .map_err(|e| KafkaError::Init(format!("committed_offsets: {e}")))?;
+    let elem = filled.find_partition(topic, partition).ok_or_else(|| {
+        KafkaError::Init(format!(
+            "committed_offsets returned no entry for {topic}/{partition}"
+        ))
+    })?;
+    match elem.offset() {
+        Offset::Offset(n) if n >= 0 => Ok(Some(n as u64)),
+        // `Invalid` is librdkafka's "no committed offset for this
+        // group". The other `Offset::*` variants don't appear in a
+        // `committed_offsets` result; treat them as `None`.
+        _ => Ok(None),
+    }
+}
+
 fn fetch_watermarks(
     bootstrap: &str,
     topic: &str,
@@ -98,11 +138,17 @@ impl KafkaSourceConfig {
 }
 
 pub struct KafkaSource {
-    consumer: StreamConsumer,
+    consumer: Arc<StreamConsumer>,
     bootstrap_servers: String,
+    group_id: String,
     topic: String,
     partition: i32,
     poll_timeout: Duration,
+    /// Monotonic guard on `commit_through`. Shared with any
+    /// [`KafkaCommitHandle`] handed out via [`Self::commit_handle`]
+    /// so the supervisor's periodic task and any direct trait-method
+    /// caller observe the same "highest staged" value.
+    last_stored_offset: Arc<AtomicU64>,
 }
 
 impl KafkaSource {
@@ -111,6 +157,11 @@ impl KafkaSource {
             .set("bootstrap.servers", &cfg.bootstrap_servers)
             .set("group.id", &cfg.group_id)
             .set("enable.auto.commit", "false")
+            // Required by `store_offsets`: rdkafka rejects manual
+            // offset staging when its auto-store path is also live.
+            // We always commit through `KafkaCommitHandle`, so the
+            // auto-store path is never the right choice here.
+            .set("enable.auto.offset.store", "false")
             .set("auto.offset.reset", "earliest")
             // Note: the Java worker used `max.poll.records=1` for
             // single-record progression; that property is Java-client
@@ -120,13 +171,117 @@ impl KafkaSource {
             .create()
             .map_err(|e| KafkaError::Init(e.to_string()))?;
         Ok(Self {
-            consumer,
+            consumer: Arc::new(consumer),
             bootstrap_servers: cfg.bootstrap_servers,
+            group_id: cfg.group_id,
             topic: cfg.topic,
             partition: cfg.partition,
             poll_timeout: cfg.poll_timeout,
+            last_stored_offset: Arc::new(AtomicU64::new(0)),
         })
     }
+
+    /// Hand the supervisor's periodic commit task a shared handle
+    /// that can stage offsets and flush them to the broker without
+    /// owning the source. The handle shares the same in-memory
+    /// `last_stored_offset` so the monotonicity guard on
+    /// [`Source::commit_through`] applies regardless of which path
+    /// stages the value.
+    pub fn commit_handle(&self) -> KafkaCommitHandle {
+        KafkaCommitHandle {
+            consumer: Arc::clone(&self.consumer),
+            topic: self.topic.clone(),
+            partition: self.partition,
+            last_stored_offset: Arc::clone(&self.last_stored_offset),
+        }
+    }
+}
+
+/// Shared commit-side handle on a [`KafkaSource`]. Holds an `Arc` of
+/// the underlying `StreamConsumer` so the supervisor's periodic
+/// commit task can stage and flush offsets while the run loop holds
+/// the source's `&mut Source` and is busy in `recv()`.
+///
+/// Cloning this is cheap (one `Arc::clone` per shared field) and
+/// safe; every clone observes the same monotonic guard.
+#[derive(Clone)]
+pub struct KafkaCommitHandle {
+    consumer: Arc<StreamConsumer>,
+    topic: String,
+    partition: i32,
+    last_stored_offset: Arc<AtomicU64>,
+}
+
+impl KafkaCommitHandle {
+    /// `true` iff the underlying consumer's `assignment()` currently
+    /// includes the handle's `(topic, partition)`. The supervisor's
+    /// readiness poller uses this to detect assignment loss without
+    /// owning the source.
+    ///
+    /// Synchronous; rdkafka's `assignment()` reads in-memory state
+    /// rather than contacting the broker. Returns `Err` if rdkafka
+    /// reports an error reading the assignment.
+    pub fn current_assignment_includes(&self) -> Result<bool, SourceError> {
+        let tpl = self
+            .consumer
+            .assignment()
+            .map_err(|e| SourceError::Transport(format!("assignment: {e}")))?;
+        // `find_partition` is `None` when the partition isn't in the
+        // current assignment.
+        Ok(tpl.find_partition(&self.topic, self.partition).is_some())
+    }
+
+    /// Stage `through` as the next offset to commit. Idempotent and
+    /// monotonic: identical to [`Source::commit_through`] but takes
+    /// `&self`, so the supervisor's periodic task can call it
+    /// without owning the source.
+    pub fn commit_through(&self, through: u64) -> Result<(), SourceError> {
+        stage_offset(
+            &self.consumer,
+            &self.topic,
+            self.partition,
+            &self.last_stored_offset,
+            through,
+        )
+    }
+
+    /// Flush every staged offset to the broker. Uses
+    /// `CommitMode::Async` so the call returns immediately; the
+    /// actual write happens inside librdkafka's poll thread. The
+    /// supervisor's periodic task calls this after `commit_through`
+    /// and treats the return as best-effort.
+    pub fn commit_pending(&self) -> Result<(), SourceError> {
+        self.consumer
+            .commit_consumer_state(CommitMode::Async)
+            .map_err(|e| SourceError::Transport(format!("commit_consumer_state: {e}")))
+    }
+}
+
+/// Stage `through` as the offset to commit for `(topic, partition)`,
+/// guarded by `last_stored_offset` against rewinds. Shared between
+/// [`Source::commit_through`] (called via `&mut KafkaSource`) and
+/// [`KafkaCommitHandle::commit_through`] (called via `&self`).
+fn stage_offset(
+    consumer: &StreamConsumer,
+    topic: &str,
+    partition: i32,
+    last_stored_offset: &AtomicU64,
+    through: u64,
+) -> Result<(), SourceError> {
+    // CAS-loop monotonicity guard. `fetch_max` reads the current
+    // value, computes the new value (max of current and `through`),
+    // and stores it atomically. If `through` is not higher we no-op.
+    let prev = last_stored_offset.fetch_max(through, Ordering::AcqRel);
+    if through <= prev {
+        return Ok(());
+    }
+    let mut tpl = TopicPartitionList::new();
+    tpl.add_partition_offset(topic, partition, Offset::Offset(through as i64))
+        .map_err(|e| SourceError::Transport(format!("tpl add: {e}")))?;
+    consumer
+        .store_offsets(&tpl)
+        .map_err(|e| SourceError::Transport(format!("store_offsets: {e}")))?;
+    Ok(())
 }
 
 #[async_trait]
@@ -193,6 +348,45 @@ impl Source for KafkaSource {
         .map_err(|e| SourceError::Transport(format!("fetch_low_watermark: {e}")))?;
         Ok(low.max(0) as u64)
     }
+
+    async fn commit_through(&mut self, through: u64) -> Result<(), SourceError> {
+        // Forwards into the shared helper so the trait path and the
+        // `KafkaCommitHandle` path observe the same monotonic guard.
+        // `store_offsets` is non-blocking in librdkafka (in-memory
+        // stage), so no `spawn_blocking` here.
+        stage_offset(
+            &self.consumer,
+            &self.topic,
+            self.partition,
+            &self.last_stored_offset,
+            through,
+        )
+    }
+
+    async fn fetch_committed_offset(&mut self) -> Result<Option<u64>, SourceError> {
+        // Mirrors the `low_watermark` pattern: a fresh `BaseConsumer`
+        // with the same `group.id` drives the metadata + offset
+        // lookup inside a `spawn_blocking`. Delegates to the free
+        // `fetch_committed_offset` helper so the supervisor's
+        // startup path can read the value without instantiating a
+        // full `KafkaSource`.
+        let bootstrap = self.bootstrap_servers.clone();
+        let group_id = self.group_id.clone();
+        let topic = self.topic.clone();
+        let partition = self.partition;
+        tokio::task::spawn_blocking(move || {
+            fetch_committed_offset(
+                &bootstrap,
+                &group_id,
+                &topic,
+                partition,
+                DEFAULT_WATERMARK_TIMEOUT,
+            )
+            .map_err(|e| SourceError::Transport(format!("fetch_committed_offset: {e}")))
+        })
+        .await
+        .map_err(|e| SourceError::Transport(format!("committed join: {e}")))?
+    }
 }
 
 fn borrowed_to_record(msg: &rdkafka::message::BorrowedMessage<'_>) -> Record {
@@ -287,6 +481,11 @@ pub struct KafkaSink {
     timestamp_mode: TimestampMode,
     keys: ColumnType,
     values: ColumnType,
+    /// Optional observer fired after every successful produce. Wired
+    /// in by the supervisor via [`Sink::set_write_observer`]; default
+    /// `None` so production code unaware of ack tracking keeps the
+    /// existing single-write behaviour.
+    write_observer: Option<Arc<dyn WriteObserver>>,
 }
 
 impl KafkaSink {
@@ -315,6 +514,7 @@ impl KafkaSink {
             timestamp_mode: cfg.timestamp_mode,
             keys: cfg.keys,
             values: cfg.values,
+            write_observer: None,
         })
     }
 
@@ -407,8 +607,19 @@ impl Sink for KafkaSink {
             "partition" => partition,
         )
         .set((delivery.offset as u64 + 1) as f64);
+        // Per-write ack signal. The supervisor's installed observer
+        // bumps the per-destination ack tracker; the source-side
+        // commit task then advances the broker-committed offset up
+        // to the AND of every destination's ack and any notify ack.
+        if let Some(obs) = self.write_observer.as_ref() {
+            obs.on_written(record.source_offset);
+        }
         Ok(())
     }
+
+    fn set_write_observer(&mut self, observer: Arc<dyn WriteObserver>) {
+        self.write_observer = Some(observer);
+    }
 }
 
 fn build_headers(headers: &[Header]) -> OwnedHeaders {
diff --git a/crates/mirror-notify-kkv/Cargo.toml b/crates/mirror-notify-kkv/Cargo.toml
new file mode 100644
index 0000000..6c91a6b
--- /dev/null
+++ b/crates/mirror-notify-kkv/Cargo.toml
@@ -0,0 +1,28 @@
+[package]
+name = "mirror-notify-kkv"
+version.workspace = true
+edition.workspace = true
+rust-version.workspace = true
+license.workspace = true
+repository.workspace = true
+description = "Outbound kkv-v1 webhook notifier for mirror-v3 (drop-in replacement for Yolean/kafka-keyvalue push side)"
+
+[dependencies]
+mirror-core = { workspace = true }
+mirror-config = { workspace = true }
+tokio = { workspace = true, features = ["sync", "time"] }
+async-trait = { workspace = true }
+tracing = { workspace = true }
+thiserror = { workspace = true }
+serde = { workspace = true }
+serde_json = { workspace = true }
+reqwest = { workspace = true, features = ["json"] }
+url = { workspace = true }
+indexmap = { workspace = true, features = ["serde"] }
+futures = { workspace = true }
+metrics = { workspace = true }
+
+[dev-dependencies]
+tokio = { workspace = true, features = ["test-util", "macros", "rt-multi-thread"] }
+axum = { workspace = true }
+tower = { workspace = true }
diff --git a/crates/mirror-notify-kkv/src/buffer.rs b/crates/mirror-notify-kkv/src/buffer.rs
new file mode 100644
index 0000000..0d0c5f8
--- /dev/null
+++ b/crates/mirror-notify-kkv/src/buffer.rs
@@ -0,0 +1,169 @@
+//! Debounce buffer for the `trigger.on: source-consume` notify mode.
+//!
+//! Accumulates `(key, source_offset)` per record handed to
+//! [`crate::KkvV1Notifier::on_record`] and emits a single
+//! batch-ready payload when either:
+//!   * `max-records` records have been appended since the last
+//!     drain, OR
+//!   * `max-time-ms` has elapsed since the *first* record of the
+//!     current batch landed.
+//!
+//! Per `WEBHOOKS.md § Interaction with compaction: log`, keys are
+//! set-deduped within a batch (the kkv-v1 body's `updates` is a
+//! key → null map; duplicates over the same window collapse). The
+//! `offsets` field carries the **maximum** source offset across the
+//! batch; the consumer's `requireOffset` constraint then pins the
+//! follow-up `/cache/v1/raw/<key>` read to post-batch state.
+
+use std::time::Instant;
+
+use indexmap::{IndexMap, IndexSet};
+
+/// Mutable buffer that on_record / the timer task share via a
+/// `tokio::sync::Mutex`. Not directly exposed.
+#[derive(Default, Debug)]
+pub(crate) struct Buffer {
+    /// Distinct keys in insertion order. `IndexSet` over `HashSet`
+    /// keeps the on-wire JSON deterministic, which matters for
+    /// integration-test assertions.
+    keys: IndexSet<String>,
+    /// Highest source offset across the batch.
+    max_offset: u64,
+    /// Number of records appended since the last drain. The
+    /// `max-records` trigger fires on *record count*, not on dedup-
+    /// bucket cardinality; otherwise a hot key getting repeated
+    /// hits could stall the trigger and grow the buffer's wall-clock
+    /// age indefinitely.
+    seen_records: u64,
+    /// When the first record landed in the currently-open batch.
+    /// Drives the `max-time-ms` drain check; reset on every drain.
+    first_at: Option<Instant>,
+}
+
+impl Buffer {
+    pub fn append(&mut self, key: String, source_offset: u64) {
+        if self.first_at.is_none() {
+            self.first_at = Some(Instant::now());
+        }
+        self.keys.insert(key);
+        // `max_offset` only goes up. The consumer's `requireOffset`
+        // semantics require us to report the highest offset the
+        // batch carries; out-of-order arrivals are possible if the
+        // source ever fans across partitions (not today, but the
+        // safety net is free).
+        if self.seen_records == 0 || source_offset > self.max_offset {
+            self.max_offset = source_offset;
+        }
+        self.seen_records = self.seen_records.saturating_add(1);
+    }
+
+    pub fn seen_records(&self) -> u64 {
+        self.seen_records
+    }
+
+    pub fn is_empty(&self) -> bool {
+        self.seen_records == 0
+    }
+
+    pub fn first_at(&self) -> Option<Instant> {
+        self.first_at
+    }
+
+    /// Drain the buffer and return a payload-ready batch. Empty
+    /// buffer returns `None`. After this call, the buffer is
+    /// guaranteed empty.
+    pub fn take(&mut self, partition: i32) -> Option<DrainedBatch> {
+        if self.is_empty() {
+            return None;
+        }
+        let mut offsets = IndexMap::with_capacity(1);
+        offsets.insert(partition.to_string(), self.max_offset);
+        let updates: IndexMap<String, serde_json::Value> = self
+            .keys
+            .drain(..)
+            .map(|k| (k, serde_json::Value::Null))
+            .collect();
+        self.max_offset = 0;
+        self.seen_records = 0;
+        self.first_at = None;
+        Some(DrainedBatch { offsets, updates })
+    }
+}
+
+/// Owned payload-ready batch handed off to the dispatcher.
+#[derive(Debug)]
+pub(crate) struct DrainedBatch {
+    pub offsets: IndexMap<String, u64>,
+    pub updates: IndexMap<String, serde_json::Value>,
+}
+
+impl DrainedBatch {
+    /// The highest source offset across every partition in the batch.
+    /// Mirrors are pinned to one `(topic, partition)` today so the
+    /// map holds one entry; the iteration generalises cleanly if a
+    /// future multi-partition mirror is added.
+    pub fn high_offset(&self) -> u64 {
+        self.offsets.values().copied().max().unwrap_or(0)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn empty_take_returns_none() {
+        let mut b = Buffer::default();
+        assert!(b.take(0).is_none());
+    }
+
+    #[test]
+    fn append_then_take_carries_keys_and_max_offset() {
+        let mut b = Buffer::default();
+        b.append("a".into(), 10);
+        b.append("b".into(), 11);
+        b.append("c".into(), 12);
+        let batch = b.take(3).unwrap();
+        assert_eq!(batch.offsets.get("3"), Some(&12));
+        assert_eq!(batch.updates.len(), 3);
+        assert!(b.is_empty(), "take must reset");
+    }
+
+    #[test]
+    fn duplicate_keys_collapse_but_record_count_still_climbs() {
+        let mut b = Buffer::default();
+        b.append("hot".into(), 1);
+        b.append("hot".into(), 2);
+        b.append("hot".into(), 3);
+        assert_eq!(b.seen_records(), 3, "max-records must count appends");
+        let batch = b.take(0).unwrap();
+        assert_eq!(batch.updates.len(), 1, "key set must dedup");
+        assert_eq!(batch.offsets["0"], 3, "max offset must be 3");
+    }
+
+    #[test]
+    fn out_of_order_offsets_still_report_max() {
+        let mut b = Buffer::default();
+        b.append("a".into(), 5);
+        b.append("b".into(), 9);
+        b.append("c".into(), 7);
+        let batch = b.take(0).unwrap();
+        assert_eq!(batch.offsets["0"], 9);
+    }
+
+    #[test]
+    fn first_at_is_set_on_first_append_and_cleared_on_drain() {
+        let mut b = Buffer::default();
+        assert!(b.first_at().is_none());
+        b.append("a".into(), 1);
+        let t = b.first_at().expect("first append sets the timer");
+        b.append("b".into(), 2);
+        assert_eq!(
+            b.first_at(),
+            Some(t),
+            "later appends must NOT shift first_at; the debounce window measures from the first record"
+        );
+        b.take(0);
+        assert!(b.first_at().is_none(), "drain resets first_at");
+    }
+}
diff --git a/crates/mirror-notify-kkv/src/lib.rs b/crates/mirror-notify-kkv/src/lib.rs
new file mode 100644
index 0000000..9934559
--- /dev/null
+++ b/crates/mirror-notify-kkv/src/lib.rs
@@ -0,0 +1,1297 @@
+//! Outbound `kkv-v1` webhook notifier. Drop-in replacement for the
+//! push side of `Yolean/kafka-keyvalue`.
+//!
+//! Wire contract (matches the `@yolean/kafka-keyvalue` Node client
+//! unmodified; see `WEBHOOKS.md`):
+//!   * `POST /kafka-keyvalue/v1/updates`
+//!   * Headers: `x-kkv-topic`, `x-kkv-offsets`
+//!   * Body: `{ "topic": "...", "offsets": {"<partition>": <offset>}, "updates": { "<key>": null } }`
+//!
+//! Trigger model (`trigger.on: source-consume`):
+//!   * Every accepted record is fed to [`KkvV1Notifier::on_record`]
+//!     by the mirror loop. Records accumulate in an in-memory buffer
+//!     (key set with the highest source offset across the batch).
+//!   * The buffer is drained (POSTed and reset) when either
+//!     `debounce.max-records` records have arrived since the last
+//!     drain, or `debounce.max-time-ms` has elapsed since the *first*
+//!     record of the current batch landed.
+//!   * The max-records trigger drains inline (`on_record` awaits the
+//!     dispatch); the max-time-ms trigger drains from a background
+//!     timer task. Errors from the timer-task drain are surfaced on
+//!     the next `on_record` / `shutdown` call.
+
+use std::net::SocketAddr;
+use std::sync::atomic::{AtomicBool, Ordering};
+use std::sync::{Arc, OnceLock};
+use std::time::{Duration, Instant};
+
+use async_trait::async_trait;
+use futures::future::join_all;
+use indexmap::IndexMap;
+use mirror_config::{
+    FanOut, FinalAction, NotifyApi, NotifyOutcome, NotifyOutcomes, NotifyRetry, NotifyTarget,
+};
+use mirror_core::{current_labels, AckSink, CacheState, Notifier, NotifyError, Record};
+use reqwest::Client;
+use serde::Serialize;
+use thiserror::Error;
+use tokio::sync::{Mutex as TokioMutex, Notify as TokioNotify};
+use tokio::task::JoinHandle;
+use url::Url;
+
+mod buffer;
+mod resolver;
+
+use buffer::{Buffer, DrainedBatch};
+pub use resolver::{DnsAResolver, SystemDnsResolver};
+
+/// How long a `fan-out: dns-a` resolution is reused before a
+/// re-resolve. 30s matches the spec's "default 30 s if no TTL is
+/// published". Failure invalidates the cache early (per spec) so
+/// scale-down recovery doesn't wait the full window.
+const DNS_A_CACHE_TTL: Duration = Duration::from_secs(30);
+
+/// Default path component when a target's URL has no explicit path.
+/// Matches `@yolean/kafka-keyvalue` Node client's
+/// `ON_UPDATE_DEFAULT_PATH`.
+pub const KKV_V1_DEFAULT_PATH: &str = "/kafka-keyvalue/v1/updates";
+
+/// Errors produced while constructing a [`KkvV1Notifier`] from config.
+/// Surfaced once at startup so the supervisor can refuse to launch a
+/// mirror whose notify block can't possibly work, instead of crashing
+/// on the first record.
+#[derive(Debug, Error)]
+pub enum BuildError {
+    #[error("notify.targets must be non-empty")]
+    NoTargets,
+    #[error("notify.target url {url:?} is not a valid URL: {source}")]
+    InvalidUrl {
+        url: String,
+        #[source]
+        source: url::ParseError,
+    },
+    #[error("notify.target url {url} must use http:// or https://; got scheme {scheme:?}")]
+    UnsupportedScheme { url: String, scheme: String },
+    #[error("notify.target url {url} has no host")]
+    NoHost { url: String },
+    #[error("failed to build reqwest client: {0}")]
+    ClientBuild(String),
+}
+
+/// Per-target dispatcher state. One target maps to one `Endpoint`. The
+/// `fan_out` mode decides whether dispatch goes to the URL's host
+/// (resolved transparently by reqwest) or to every A/AAAA record the
+/// configured resolver returns (one POST per address).
+#[derive(Debug)]
+struct Endpoint {
+    /// Fully-resolved URL the POST goes to. `kkv-v1` default path is
+    /// applied here at build time so the per-request hot path stays
+    /// allocation-free.
+    url: Url,
+    /// Pre-rendered `target_host` metric label (`url.host_str()`).
+    /// For fan-out: dns-a this is the *configured* hostname; the
+    /// per-address dispatch uses the resolved IP as its
+    /// `target_host` label instead.
+    target_host: String,
+    client: Client,
+    fan_out: FanOutMode,
+}
+
+/// Per-endpoint fan-out behaviour. `None` is the default,
+/// single-address path; `DnsA` resolves the URL's host to all
+/// A/AAAA records and POSTs every address concurrently.
+#[derive(Debug)]
+enum FanOutMode {
+    /// Single POST to the URL as-is. reqwest handles DNS internally.
+    None,
+    /// Resolve `host:port` via [`DnsAResolver`], dispatch one POST
+    /// per returned address. Resolutions cached for
+    /// [`DNS_A_CACHE_TTL`] and invalidated on any per-address
+    /// failure (matches the spec's "re-resolve on any failure"
+    /// recommendation).
+    DnsA(DnsAState),
+}
+
+/// Cached resolver state for one `fan-out: dns-a` endpoint.
+#[derive(Debug)]
+struct DnsAState {
+    /// Hostname we resolve.
+    host: String,
+    /// Port carried by every resolved `SocketAddr` (production: the
+    /// URL's port or scheme default; tests: whatever the stub
+    /// resolver returns).
+    port: u16,
+    cached: TokioMutex<Option<(Vec<SocketAddr>, Instant)>>,
+}
+
+/// Stateless dispatcher: takes a built batch payload, runs it through
+/// the per-outcome retry/final-action state machine, against each
+/// configured endpoint in turn. Lives behind an `Arc` so the buffer's
+/// inline-drain path and the background timer task can both invoke it.
+struct Inner {
+    endpoints: Vec<Endpoint>,
+    outcomes: NotifyOutcomes,
+    retry: NotifyRetry,
+    topic: String,
+    partition: i32,
+    resolver: Arc<dyn DnsAResolver>,
+}
+
+/// Shared notifier state. `buffer` holds the in-progress batch;
+/// `new_data` wakes the timer task when on_record adds to an empty
+/// buffer; `shutting_down` lets shutdown signal the timer to exit
+/// even if it's mid-sleep; `error_state` lets the timer surface a
+/// terminal error to whichever of on_record / shutdown polls next.
+struct NotifierState {
+    buffer: TokioMutex<Buffer>,
+    new_data: TokioNotify,
+    shutting_down: AtomicBool,
+    error_state: TokioMutex<Option<NotifyError>>,
+    /// Set once, before any record is dispatched, via
+    /// [`KkvV1Notifier::with_ack_sink`]. Shared between
+    /// `drain_now` (inline path) and the background timer task so
+    /// both paths feed the supervisor's per-mirror ack tracker.
+    ack_sink: OnceLock<Arc<dyn AckSink>>,
+}
+
+/// Notifier implementing the kkv-v1 wire contract. One instance per
+/// mirror (per `(topic, partition)`).
+pub struct KkvV1Notifier {
+    inner: Arc<Inner>,
+    state: Arc<NotifierState>,
+    timer_task: Option<JoinHandle<()>>,
+    max_records: u64,
+    /// Per-mirror readiness handle. `on_record` consults
+    /// `cache_state.is_mirror_ready(&mirror_name)` and drops records
+    /// whose source offset hasn't crossed the mirror's bootstrap
+    /// high-watermark yet. Matches the legacy kkv `KafkaCache` Stage
+    /// gate which suppressed push notifications until `Polling`.
+    cache_state: Arc<CacheState>,
+    mirror_name: String,
+}
+
+impl KkvV1Notifier {
+    /// Build a notifier from a validated [`mirror_config::Notify`]
+    /// block. The caller is responsible for the higher-level
+    /// validation (URL well-formedness, target non-empty, etc.);
+    /// `mirror-config` does that in `validate_notify_shared`. The
+    /// checks here are the lighter-weight last-mile ones the runtime
+    /// needs to actually open a `reqwest::Client`.
+    ///
+    /// `notify.trigger.on` is only consulted for the debounce
+    /// window (`source-consume` honours `debounce.max-time-ms`;
+    /// `destination-flush` ignores debounce since it does not run
+    /// via this notifier at all, only via `FlushDispatcher`).
+    pub fn from_config(
+        notify: &mirror_config::Notify,
+        topic: String,
+        partition: i32,
+        cache_state: Arc<CacheState>,
+        mirror_name: String,
+    ) -> Result<Self, BuildError> {
+        Self::from_config_with_resolver(
+            notify,
+            topic,
+            partition,
+            cache_state,
+            mirror_name,
+            Arc::new(SystemDnsResolver),
+        )
+    }
+
+    /// Same as [`Self::from_config`] but with a caller-supplied DNS
+    /// resolver. Tests use this to inject a stub that returns canned
+    /// `SocketAddr`s, exercising the `fan-out: dns-a` dispatch path
+    /// against multiple axum servers without depending on the system
+    /// resolver or `/etc/hosts`.
+    pub fn from_config_with_resolver(
+        notify: &mirror_config::Notify,
+        topic: String,
+        partition: i32,
+        cache_state: Arc<CacheState>,
+        mirror_name: String,
+        resolver: Arc<dyn DnsAResolver>,
+    ) -> Result<Self, BuildError> {
+        let inner = Arc::new(build_inner(notify, topic, partition, resolver)?);
+
+        // Debounce config lives on the trigger block. Defaults come
+        // from `NotifyTrigger::default()` (`Some({100, 250})` for
+        // source-consume); validator rejects missing debounce for
+        // source-consume so the `expect` here is unreachable for any
+        // legit config.
+        let debounce = notify
+            .trigger
+            .debounce
+            .unwrap_or(mirror_config::NotifyDebounce {
+                max_records: 1,
+                max_time_ms: u64::MAX,
+            });
+        let max_records = debounce.max_records;
+        let max_time = Duration::from_millis(debounce.max_time_ms);
+        let state = Arc::new(NotifierState {
+            buffer: TokioMutex::new(Buffer::default()),
+            new_data: TokioNotify::new(),
+            shutting_down: AtomicBool::new(false),
+            error_state: TokioMutex::new(None),
+            ack_sink: OnceLock::new(),
+        });
+
+        // Always spawn the timer task. For `max_records: 1` it just
+        // never fires (every drain is inline from on_record), and the
+        // sleeping task costs ~nothing.
+        let timer_task = tokio::spawn(timer_loop(Arc::clone(&inner), Arc::clone(&state), max_time));
+
+        Ok(Self {
+            inner,
+            state,
+            timer_task: Some(timer_task),
+            max_records,
+            cache_state,
+            mirror_name,
+        })
+    }
+
+    /// Install an [`AckSink`]. The notifier calls
+    /// `ack.note_through(high_offset + 1)` after every successful
+    /// batch drain, where `high_offset` is the largest source offset
+    /// in the just-delivered batch. Idempotent if called twice;
+    /// `OnceLock::set` returns `Err` on the second call which we
+    /// drop intentionally (the first install wins).
+    ///
+    /// Builder shape so callers don't have to add yet another
+    /// constructor argument; supervisors install the ack sink
+    /// immediately after `from_config` and before handing the
+    /// notifier to the run loop.
+    pub fn with_ack_sink(self, ack: Arc<dyn AckSink>) -> Self {
+        let _ = self.state.ack_sink.set(ack);
+        self
+    }
+
+    /// Drain the current buffer (if any) and dispatch it. Used from
+    /// both the on_record max-records path and shutdown.
+    async fn drain_now(&self) -> Result<(), NotifyError> {
+        let batch = {
+            let mut buf = self.state.buffer.lock().await;
+            buf.take(self.inner.partition)
+        };
+        let Some(batch) = batch else {
+            return Ok(());
+        };
+        let high = batch.high_offset();
+        self.inner.dispatch_drained(batch).await?;
+        // Successful dispatch through every endpoint => the batch is
+        // delivered. Tell the supervisor's ack tracker so the
+        // periodic source-commit task can advance the broker-side
+        // committed offset.
+        if let Some(ack) = self.state.ack_sink.get() {
+            ack.note_through(high + 1);
+        }
+        Ok(())
+    }
+}
+
+impl Inner {
+    async fn dispatch_drained(&self, batch: DrainedBatch) -> Result<(), NotifyError> {
+        let payload = KkvV1Payload::new(&self.topic, batch.offsets, batch.updates);
+        self.dispatch_batch(&payload).await
+    }
+
+    /// POST a single batch payload to every configured endpoint
+    /// serially. Per-endpoint fan-out is internal to
+    /// [`Self::dispatch_endpoint`].
+    async fn dispatch_batch(&self, payload: &KkvV1Payload<'_>) -> Result<(), NotifyError> {
+        for endpoint in &self.endpoints {
+            self.dispatch_endpoint(endpoint, payload).await?;
+        }
+        Ok(())
+    }
+
+    /// One endpoint = one configured `notify.targets[]` entry.
+    /// Dispatch behaviour branches on the endpoint's fan-out mode:
+    /// `none` POSTs to the URL as-is (one address, reqwest does DNS
+    /// internally); `dns-a` resolves the URL's host via
+    /// [`DnsAResolver`] and POSTs to every returned address
+    /// concurrently. Per the spec, any per-address outcome that
+    /// resolves to `final: fail` fails the whole batch.
+    async fn dispatch_endpoint(
+        &self,
+        endpoint: &Endpoint,
+        payload: &KkvV1Payload<'_>,
+    ) -> Result<(), NotifyError> {
+        match &endpoint.fan_out {
+            FanOutMode::None => {
+                self.dispatch_to_address(
+                    &endpoint.client,
+                    endpoint.url.clone(),
+                    &endpoint.target_host,
+                    payload,
+                )
+                .await
+            }
+            FanOutMode::DnsA(state) => self.dispatch_dns_a(endpoint, state, payload).await,
+        }
+    }
+
+    /// Fan-out dispatch: resolve, then concurrent POSTs per address.
+    /// First per-address error wins (subsequent results are still
+    /// awaited so we don't leak in-flight requests).
+    async fn dispatch_dns_a(
+        &self,
+        endpoint: &Endpoint,
+        state: &DnsAState,
+        payload: &KkvV1Payload<'_>,
+    ) -> Result<(), NotifyError> {
+        let addrs = state.resolve_or_cached(self.resolver.as_ref()).await?;
+        if addrs.is_empty() {
+            return Err(NotifyError::Transport(format!(
+                "dns-a resolution of {} returned 0 addresses",
+                state.host
+            )));
+        }
+        let futures = addrs.iter().map(|sa| {
+            let mut per_addr_url = endpoint.url.clone();
+            // Set host to the IP literal; set port to the resolved
+            // socket's port (matches the URL's port in production,
+            // but lets test stubs aim at arbitrary axum servers).
+            // Both setters return `Result<(), …>` for malformed
+            // inputs; IPs and small ports never fail here so unwrap
+            // is justified.
+            per_addr_url
+                .set_ip_host(sa.ip())
+                .expect("set_ip_host on a valid URL always succeeds for an IpAddr");
+            per_addr_url
+                .set_port(Some(sa.port()))
+                .expect("set_port on a valid URL with an http(s) scheme succeeds");
+            let host_label = sa.to_string();
+            async move {
+                self.dispatch_to_address(&endpoint.client, per_addr_url, &host_label, payload)
+                    .await
+            }
+        });
+        let results = join_all(futures).await;
+        let mut first_err: Option<NotifyError> = None;
+        for r in results {
+            if let Err(e) = r {
+                first_err.get_or_insert(e);
+            }
+        }
+        match first_err {
+            Some(e) => {
+                // Per-spec: "Re-resolve when the cache TTL expires
+                // OR when an address fails repeatedly." Failure
+                // invalidates the cached set immediately so the next
+                // dispatch (after the supervisor restarts the
+                // mirror) picks up any K8s scale-down that happened
+                // mid-batch.
+                state.invalidate_cache().await;
+                Err(e)
+            }
+            None => Ok(()),
+        }
+    }
+
+    /// Run the per-attempt retry / outcome / final-action loop
+    /// against ONE address. Used by both `fan-out: none` (with the
+    /// endpoint's URL/host) and `fan-out: dns-a` (with a per-address
+    /// rewritten URL and the IP literal as the metric label).
+    async fn dispatch_to_address(
+        self: &Inner,
+        client: &Client,
+        url: Url,
+        target_host: &str,
+        payload: &KkvV1Payload<'_>,
+    ) -> Result<(), NotifyError> {
+        let body = serde_json::to_vec(payload).map_err(|e| {
+            // Body serialization failure is a programming error, not
+            // a webhook-receiver problem; surface as transport so the
+            // operator sees a loud, distinct line.
+            NotifyError::Transport(format!("payload serialization failed: {e}"))
+        })?;
+        let offsets_header = serde_json::to_string(&payload.offsets).map_err(|e| {
+            NotifyError::Transport(format!("offsets header serialization failed: {e}"))
+        })?;
+
+        let mut attempt: u32 = 1;
+        let mut last_error: String = String::new();
+        loop {
+            let (topic_l, partition_l) = current_labels();
+            // Per-attempt retry gauge; spec says 1-based, 0 when idle.
+            metrics::gauge!(
+                "mirror_v3_notify_inflight_retry",
+                "topic" => topic_l.clone(),
+                "partition" => partition_l.clone(),
+                "target_host" => target_host.to_string(),
+            )
+            .set(attempt as f64);
+
+            let start = std::time::Instant::now();
+            let result = client
+                .post(url.clone())
+                .header("content-type", "application/json")
+                .header("x-kkv-topic", &self.topic)
+                .header("x-kkv-offsets", &offsets_header)
+                .body(body.clone())
+                .send()
+                .await;
+
+            metrics::histogram!(
+                "mirror_v3_notify_post_duration_seconds",
+                "topic" => topic_l.clone(),
+                "partition" => partition_l.clone(),
+                "target_host" => target_host.to_string(),
+            )
+            .record(start.elapsed().as_secs_f64());
+
+            let outcome = classify(result, &mut last_error);
+            let policy = self.outcomes.for_outcome(outcome);
+
+            tracing::debug!(
+                target = %url,
+                attempt,
+                max_attempts = self.retry.max_attempts,
+                ?outcome,
+                policy_retry = policy.retry,
+                policy_final = ?policy.final_,
+                "notify post attempt"
+            );
+
+            if matches!(outcome, Outcome::TwoXx) {
+                // Reset retry gauge on success.
+                metrics::gauge!(
+                    "mirror_v3_notify_inflight_retry",
+                    "topic" => topic_l.clone(),
+                    "partition" => partition_l.clone(),
+                    "target_host" => target_host.to_string(),
+                )
+                .set(0.0);
+                metrics::counter!(
+                    "mirror_v3_notify_batches_total",
+                    "topic" => topic_l,
+                    "partition" => partition_l,
+                    "result" => "ok",
+                )
+                .increment(1);
+                return Ok(());
+            }
+
+            if policy.retry && attempt < self.retry.max_attempts {
+                tracing::warn!(
+                    target = %url,
+                    attempt,
+                    max_attempts = self.retry.max_attempts,
+                    reason = %last_error,
+                    "notify retry"
+                );
+                let backoff = backoff_for_attempt(self.retry.backoff_ms, attempt);
+                tokio::time::sleep(backoff).await;
+                attempt += 1;
+                continue;
+            }
+
+            // Either retry: false (one attempt only) or we've used
+            // the retry budget. Apply the final action.
+            return self
+                .apply_final_action(
+                    &url,
+                    target_host,
+                    outcome,
+                    policy,
+                    attempt,
+                    std::mem::take(&mut last_error),
+                )
+                .await;
+        }
+    }
+
+    async fn apply_final_action(
+        self: &Inner,
+        url: &Url,
+        target_host: &str,
+        outcome: Outcome,
+        policy: NotifyOutcome,
+        attempts: u32,
+        last_error: String,
+    ) -> Result<(), NotifyError> {
+        let (topic_l, partition_l) = current_labels();
+        // Reset retry gauge regardless of outcome; the request is
+        // no longer in flight.
+        metrics::gauge!(
+            "mirror_v3_notify_inflight_retry",
+            "topic" => topic_l.clone(),
+            "partition" => partition_l.clone(),
+            "target_host" => target_host.to_string(),
+        )
+        .set(0.0);
+
+        match policy.final_ {
+            FinalAction::Accept => {
+                tracing::info!(
+                    target = %url,
+                    ?outcome,
+                    attempts,
+                    "notify outcome resolved to accept (treated as delivered)"
+                );
+                metrics::counter!(
+                    "mirror_v3_notify_batches_total",
+                    "topic" => topic_l,
+                    "partition" => partition_l,
+                    "result" => "ok",
+                )
+                .increment(1);
+                Ok(())
+            }
+            FinalAction::Skip => {
+                tracing::warn!(
+                    target = %url,
+                    ?outcome,
+                    attempts,
+                    reason = %last_error,
+                    "notify outcome resolved to skip; dropping batch"
+                );
+                metrics::counter!(
+                    "mirror_v3_notify_batches_total",
+                    "topic" => topic_l,
+                    "partition" => partition_l,
+                    "result" => "skip",
+                )
+                .increment(1);
+                Ok(())
+            }
+            FinalAction::Fail => {
+                tracing::error!(
+                    target = %url,
+                    ?outcome,
+                    attempts,
+                    reason = %last_error,
+                    "notify exhausted; mirror will exit"
+                );
+                metrics::counter!(
+                    "mirror_v3_notify_batches_total",
+                    "topic" => topic_l,
+                    "partition" => partition_l,
+                    "result" => "fail",
+                )
+                .increment(1);
+                Err(NotifyError::Exhausted {
+                    attempts,
+                    last_error,
+                })
+            }
+        }
+    }
+}
+
+impl DnsAState {
+    async fn resolve_or_cached(
+        &self,
+        resolver: &dyn DnsAResolver,
+    ) -> Result<Vec<SocketAddr>, NotifyError> {
+        {
+            let cached = self.cached.lock().await;
+            if let Some((addrs, at)) = cached.as_ref() {
+                if at.elapsed() < DNS_A_CACHE_TTL {
+                    return Ok(addrs.clone());
+                }
+            }
+        }
+        let addrs = resolver.resolve(&self.host, self.port).await.map_err(|e| {
+            NotifyError::Transport(format!("dns-a resolution failed for {}: {e}", self.host))
+        })?;
+        // Dedupe in case the resolver returned the same SocketAddr
+        // twice (lookup_host can yield both IPv4 + IPv4-mapped IPv6,
+        // for example). Preserve order.
+        let mut seen = std::collections::HashSet::new();
+        let unique: Vec<SocketAddr> = addrs.into_iter().filter(|a| seen.insert(*a)).collect();
+        *self.cached.lock().await = Some((unique.clone(), Instant::now()));
+        Ok(unique)
+    }
+
+    async fn invalidate_cache(&self) {
+        *self.cached.lock().await = None;
+    }
+}
+
+#[async_trait]
+impl Notifier for KkvV1Notifier {
+    async fn on_record(&mut self, record: &Record) -> Result<(), NotifyError> {
+        // First: surface any terminal error the timer task accumulated
+        // since the last call. Once an error is observed we still let
+        // the run loop hand us further records; they'll just keep
+        // returning the same error until the loop aborts. Take() so
+        // we only return it once.
+        if let Some(err) = self.state.error_state.lock().await.take() {
+            return Err(err);
+        }
+
+        // Suppress records below this mirror's
+        // `suppression_threshold` (set at register time as
+        // `max(last_committed_offset, bootstrap_hwm if no commit)`).
+        // Two regimes:
+        //   * Returning deploy (group has a committed value `C`):
+        //     threshold = C. Records below C were already delivered
+        //     by the previous pod; records in `[C, bootstrap_hwm)`
+        //     are the between-pods gap and DO fire.
+        //   * Fresh deploy (no committed value): threshold =
+        //     bootstrap_hwm. Records during the first-replay window
+        //     don't fan webhook out to consumers.
+        // The suppressed counter is the operator's visibility into
+        // how many records were skipped.
+        if self
+            .cache_state
+            .is_record_suppressed(&self.mirror_name, record.source_offset)
+        {
+            let (topic_l, partition_l) = current_labels();
+            metrics::counter!(
+                "mirror_v3_notify_suppressed_records_total",
+                "topic" => topic_l,
+                "partition" => partition_l,
+            )
+            .increment(1);
+            return Ok(());
+        }
+
+        // Keys may be missing or non-UTF-8. Legacy kkv emits whatever
+        // string repr the consumer expects; mirror-v3 chooses
+        // lossy-UTF-8 on bytes and `""` on missing key. Real
+        // deployments use UTF-8 keys; this keeps the surface working
+        // on edge cases instead of crashing.
+        let key_str = render_key(record.key.as_deref());
+
+        let (topic_l, partition_l) = current_labels();
+        metrics::counter!(
+            "mirror_v3_notify_records_total",
+            "topic" => topic_l.clone(),
+            "partition" => partition_l.clone(),
+        )
+        .increment(1);
+
+        let drain_now;
+        let buffer_depth;
+        {
+            let mut buf = self.state.buffer.lock().await;
+            let was_empty = buf.is_empty();
+            buf.append(key_str, record.source_offset);
+            drain_now = buf.seen_records() >= self.max_records;
+            buffer_depth = buf.seen_records();
+            // Wake the timer when the buffer transitions empty →
+            // non-empty so the max-time-ms clock starts running.
+            if was_empty {
+                self.state.new_data.notify_one();
+            }
+        }
+        metrics::gauge!(
+            "mirror_v3_notify_buffer_records",
+            "topic" => topic_l,
+            "partition" => partition_l,
+        )
+        .set(buffer_depth as f64);
+
+        if drain_now {
+            // Inline drain: caller (the consume loop) blocks on the
+            // POST + retry cycle. This is the natural backpressure
+            // mechanism from the spec's failure-modes table.
+            self.drain_now().await
+        } else {
+            Ok(())
+        }
+    }
+
+    async fn shutdown(&mut self) -> Result<(), NotifyError> {
+        // Signal the timer task to exit even if it's mid-sleep, then
+        // drain any pending batch synchronously so we can surface the
+        // result to the supervisor before returning.
+        self.state.shutting_down.store(true, Ordering::SeqCst);
+        self.state.new_data.notify_one();
+
+        let drain_result = self.drain_now().await;
+
+        if let Some(t) = self.timer_task.take() {
+            // Abort before await; the task may currently be in a
+            // `sleep` we can't easily interrupt otherwise. The task
+            // does no externally-visible work past the shutting_down
+            // check, so aborting is safe.
+            t.abort();
+            let _ = t.await;
+        }
+
+        // Prefer the just-now drain error over any older one the
+        // timer task might have stashed.
+        drain_result?;
+        if let Some(err) = self.state.error_state.lock().await.take() {
+            return Err(err);
+        }
+        Ok(())
+    }
+}
+
+/// Background drain loop. Waits for `state.new_data` to signal that
+/// the buffer transitioned empty → non-empty, then sleeps for the
+/// remaining time before the buffer's `first_at + max_time` deadline
+/// and drains. The on_record path may have drained inline in the
+/// meantime; in that case the take() returns None and we go back to
+/// waiting.
+async fn timer_loop(inner: Arc<Inner>, state: Arc<NotifierState>, max_time: Duration) {
+    loop {
+        state.new_data.notified().await;
+        if state.shutting_down.load(Ordering::SeqCst) {
+            return;
+        }
+        // Compute the actual remaining time relative to the buffer's
+        // first_at; between notify_one() and our wake-up, on_record
+        // could have drained inline (first_at = None) or there could
+        // simply be no data left.
+        let remaining = {
+            let buf = state.buffer.lock().await;
+            match buf.first_at() {
+                Some(t) => max_time.saturating_sub(t.elapsed()),
+                None => continue,
+            }
+        };
+        tokio::time::sleep(remaining).await;
+        if state.shutting_down.load(Ordering::SeqCst) {
+            return;
+        }
+        let batch = {
+            let mut buf = state.buffer.lock().await;
+            buf.take(inner.partition)
+        };
+        if let Some(batch) = batch {
+            let high = batch.high_offset();
+            if let Err(e) = inner.dispatch_drained(batch).await {
+                // Stash for the next on_record / shutdown to surface;
+                // exit so the buffer doesn't grow further behind a
+                // broken receiver.
+                *state.error_state.lock().await = Some(e);
+                return;
+            }
+            // Same ack semantics as `drain_now`: successful POST
+            // through every endpoint => the batch is delivered.
+            if let Some(ack) = state.ack_sink.get() {
+                ack.note_through(high + 1);
+            }
+        }
+    }
+}
+
+/// Build the per-mirror dispatcher state shared by both
+/// [`KkvV1Notifier`] (source-consume trigger) and [`FlushDispatcher`]
+/// (destination-flush trigger). Validates targets, opens the
+/// reqwest client, and resolves each target into an [`Endpoint`].
+fn build_inner(
+    notify: &mirror_config::Notify,
+    topic: String,
+    partition: i32,
+    resolver: Arc<dyn DnsAResolver>,
+) -> Result<Inner, BuildError> {
+    assert_eq!(notify.api, NotifyApi::KkvV1, "only kkv-v1 supported today");
+    if notify.targets.is_empty() {
+        return Err(BuildError::NoTargets);
+    }
+    let timeout = Duration::from_millis(notify.timeout_ms);
+    let client = Client::builder()
+        .timeout(timeout)
+        .redirect(reqwest::redirect::Policy::none())
+        .build()
+        .map_err(|e| BuildError::ClientBuild(e.to_string()))?;
+    let mut endpoints = Vec::with_capacity(notify.targets.len());
+    for t in &notify.targets {
+        endpoints.push(build_endpoint(t, client.clone())?);
+    }
+    Ok(Inner {
+        endpoints,
+        outcomes: notify.outcomes,
+        retry: notify.retry,
+        topic,
+        partition,
+        resolver,
+    })
+}
+
+/// Webhook dispatcher for the `trigger.on: destination-flush` mode.
+/// Implements [`mirror_core::FlushObserver`]: each `on_flushed(from,
+/// to)` enqueues a [`FlushEvent`] into an unbounded channel; the
+/// drainer task pulls events and POSTs a kkv-v1 body per event
+/// (`offsets: {partition: to}`, `updates: {}`).
+///
+/// Separate type from [`KkvV1Notifier`] because the two trigger
+/// modes' lifecycles don't overlap: source-consume builds a
+/// notifier and uses `NoOpNotifier`-shaped destination behaviour;
+/// destination-flush builds a dispatcher and uses
+/// `NoOpNotifier` in the run loop. The supervisor picks one or the
+/// other based on `notify.trigger.on`.
+pub struct FlushDispatcher {
+    /// Held so the drainer task can be addressed via
+    /// `error_state` / `tx` for shutdown signalling; otherwise
+    /// untouched at runtime. (`#[allow(dead_code)]` quiets the
+    /// linter; the field exists so callers can extend the type
+    /// without re-deriving the shared state from the channel.)
+    #[allow(dead_code)]
+    inner: Arc<Inner>,
+    tx: tokio::sync::mpsc::UnboundedSender<FlushEvent>,
+    drainer: Option<JoinHandle<()>>,
+    error_state: Arc<TokioMutex<Option<NotifyError>>>,
+    /// Per-mirror readiness handle. `on_flushed` consults
+    /// `cache_state.is_mirror_ready(&mirror_name)` and drops events
+    /// arriving before the mirror's bootstrap high-watermark is
+    /// crossed. Matches the source-consume gate on [`KkvV1Notifier`].
+    cache_state: Arc<CacheState>,
+    mirror_name: String,
+    topic: String,
+    partition: i32,
+    /// Set once via [`Self::with_ack_sink`]. Shared with the drainer
+    /// task at construction; the drainer calls
+    /// `note_through(to + 1)` after a successful POST so the
+    /// supervisor's per-mirror ack tracker can advance.
+    ack_sink: Arc<OnceLock<Arc<dyn AckSink>>>,
+}
+
+enum FlushEvent {
+    Flushed { to: u64 },
+    Shutdown,
+}
+
+impl FlushDispatcher {
+    pub fn from_config(
+        notify: &mirror_config::Notify,
+        topic: String,
+        partition: i32,
+        cache_state: Arc<CacheState>,
+        mirror_name: String,
+    ) -> Result<Self, BuildError> {
+        Self::from_config_with_resolver(
+            notify,
+            topic,
+            partition,
+            cache_state,
+            mirror_name,
+            Arc::new(SystemDnsResolver),
+        )
+    }
+
+    pub fn from_config_with_resolver(
+        notify: &mirror_config::Notify,
+        topic: String,
+        partition: i32,
+        cache_state: Arc<CacheState>,
+        mirror_name: String,
+        resolver: Arc<dyn DnsAResolver>,
+    ) -> Result<Self, BuildError> {
+        let inner = Arc::new(build_inner(notify, topic.clone(), partition, resolver)?);
+        let (tx, rx) = tokio::sync::mpsc::unbounded_channel();
+        let error_state = Arc::new(TokioMutex::new(None));
+        let ack_sink: Arc<OnceLock<Arc<dyn AckSink>>> = Arc::new(OnceLock::new());
+        let drainer = tokio::spawn(flush_drainer_loop(
+            Arc::clone(&inner),
+            rx,
+            Arc::clone(&error_state),
+            Arc::clone(&ack_sink),
+        ));
+        Ok(Self {
+            inner,
+            tx,
+            drainer: Some(drainer),
+            error_state,
+            cache_state,
+            mirror_name,
+            topic,
+            partition,
+            ack_sink,
+        })
+    }
+
+    /// Install an [`AckSink`]. The drainer calls
+    /// `ack.note_through(to + 1)` after every successful POST,
+    /// where `to` is the high-water offset of the flushed batch the
+    /// blob sink reported. Idempotent if called twice; the first
+    /// install wins.
+    pub fn with_ack_sink(self, ack: Arc<dyn AckSink>) -> Self {
+        let _ = self.ack_sink.set(ack);
+        self
+    }
+
+    /// Drain pending events and stop the background task. Returns
+    /// any error the drainer accumulated before exit. Idempotent -
+    /// calling twice is safe (the second call is a no-op).
+    pub async fn shutdown(&mut self) -> Result<(), NotifyError> {
+        let _ = self.tx.send(FlushEvent::Shutdown);
+        if let Some(handle) = self.drainer.take() {
+            handle.abort();
+            let _ = handle.await;
+        }
+        if let Some(err) = self.error_state.lock().await.take() {
+            return Err(err);
+        }
+        Ok(())
+    }
+
+    /// Snapshot the drainer's latest error without consuming the
+    /// dispatcher. Used by `mirror-bin`'s status / supervision loop
+    /// to detect a fatal dispatch failure without waiting for
+    /// shutdown.
+    pub async fn last_error(&self) -> Option<NotifyError> {
+        self.error_state.lock().await.take()
+    }
+}
+
+impl mirror_core::FlushObserver for FlushDispatcher {
+    fn on_flushed(&self, _from: u64, to: u64) {
+        // Suppress flush events whose high-water offset hasn't
+        // reached this mirror's `suppression_threshold`. The
+        // threshold compares against `to` (the flush event's high
+        // offset): if `to < threshold` the whole flushed batch is
+        // in the suppression window. `on_flushed` is a sync trait
+        // method outside the `MIRROR_LABELS` task-local scope, so
+        // labels come from the fields populated at construction.
+        if self.cache_state.is_record_suppressed(&self.mirror_name, to) {
+            metrics::counter!(
+                "mirror_v3_notify_suppressed_records_total",
+                "topic" => self.topic.clone(),
+                "partition" => self.partition.to_string(),
+            )
+            .increment(1);
+            return;
+        }
+        // Fire-and-forget into the channel. If the drainer has
+        // already exited (error_state is set), the send fails; and
+        // that's fine; the supervisor will see the error on the
+        // next `last_error` / `shutdown` call. `from` is intentionally
+        // dropped: the kkv-v1 body only carries the high-water `to`
+        // in its `offsets` field (consumer's `requireOffset`
+        // semantic).
+        let _ = self.tx.send(FlushEvent::Flushed { to });
+    }
+}
+
+/// Background task that pulls flush events off the channel and
+/// dispatches one kkv-v1 POST per event. Exits on `Shutdown` or
+/// channel close, or stashes the first fatal dispatch error and
+/// exits.
+async fn flush_drainer_loop(
+    inner: Arc<Inner>,
+    mut rx: tokio::sync::mpsc::UnboundedReceiver<FlushEvent>,
+    error_state: Arc<TokioMutex<Option<NotifyError>>>,
+    ack_sink: Arc<OnceLock<Arc<dyn AckSink>>>,
+) {
+    while let Some(event) = rx.recv().await {
+        let to = match event {
+            FlushEvent::Shutdown => return,
+            FlushEvent::Flushed { to } => to,
+        };
+        let mut offsets = IndexMap::new();
+        offsets.insert(inner.partition.to_string(), to);
+        // Empty `updates` per WEBHOOKS.md open-question #2:
+        // destination-flush is the "tell me a file landed" use case,
+        // not cache invalidation, so the consumer doesn't need a key
+        // set. The `offsets` field gives them the high-water mark.
+        let payload = KkvV1Payload::new(&inner.topic, offsets, IndexMap::new());
+        if let Err(e) = inner.dispatch_batch(&payload).await {
+            *error_state.lock().await = Some(e);
+            return;
+        }
+        // Successful POST => the batch is delivered. The flush event
+        // already represents a durable destination boundary on the
+        // blob sink side, so this also reflects the supervisor's
+        // notion of "highest offset acked through every gating
+        // pathway" for the destination-flush trigger.
+        if let Some(ack) = ack_sink.get() {
+            ack.note_through(to + 1);
+        }
+    }
+}
+
+fn build_endpoint(target: &NotifyTarget, client: Client) -> Result<Endpoint, BuildError> {
+    let mut url = Url::parse(&target.url).map_err(|e| BuildError::InvalidUrl {
+        url: target.url.clone(),
+        source: e,
+    })?;
+    match url.scheme() {
+        "http" | "https" => {}
+        other => {
+            return Err(BuildError::UnsupportedScheme {
+                url: target.url.clone(),
+                scheme: other.to_string(),
+            });
+        }
+    }
+    if url.host_str().is_none() {
+        return Err(BuildError::NoHost {
+            url: target.url.clone(),
+        });
+    }
+    // Apply the api-default path when the operator left it implicit.
+    // An explicit `path:` override wins; a URL whose path is `/` (the
+    // default url crate emits for hostname-only inputs) is treated as
+    // "no path specified".
+    let explicit_path = target.path.as_deref();
+    let url_has_path = !matches!(url.path(), "" | "/");
+    let path_to_set: Option<&str> = explicit_path.or({
+        if url_has_path {
+            None
+        } else {
+            Some(KKV_V1_DEFAULT_PATH)
+        }
+    });
+    if let Some(p) = path_to_set {
+        url.set_path(p);
+    }
+    let target_host = url.host_str().unwrap_or("").to_string();
+    let fan_out = match target.fan_out {
+        FanOut::None => FanOutMode::None,
+        FanOut::DnsA => {
+            // Port comes from the URL; `port_or_known_default` falls
+            // back to 80/443 per scheme. This is the port the
+            // resolver appends to every A/AAAA address it returns -
+            // matches the K8s headless-Service expectation (all pods
+            // listen on the same port).
+            let port =
+                url.port_or_known_default()
+                    .ok_or_else(|| BuildError::UnsupportedScheme {
+                        url: target.url.clone(),
+                        scheme: url.scheme().to_string(),
+                    })?;
+            FanOutMode::DnsA(DnsAState {
+                host: target_host.clone(),
+                port,
+                cached: TokioMutex::new(None),
+            })
+        }
+    };
+    Ok(Endpoint {
+        url,
+        target_host,
+        client,
+        fan_out,
+    })
+}
+
+fn render_key(key: Option<&[u8]>) -> String {
+    match key {
+        None => String::new(),
+        Some(bytes) => String::from_utf8_lossy(bytes).into_owned(),
+    }
+}
+
+/// Exponential backoff capped at 30s. `base * 2^(attempt-1)`. Attempt
+/// 1 (first retry) is one base interval; attempt 5 is 16×.
+fn backoff_for_attempt(base_ms: u64, attempt: u32) -> Duration {
+    // attempt is 1-based on the just-finished failure; backoff is the
+    // wait before the next attempt. Cap at 30 s so a misconfigured
+    // multi-day backoff doesn't silently stall a mirror.
+    let shift = (attempt - 1).min(20);
+    let ms = base_ms.saturating_mul(1u64 << shift).min(30_000);
+    Duration::from_millis(ms)
+}
+
+/// Strongly-typed outcome bucket. Maps `reqwest::Result<Response>`
+/// onto one of the six spec-defined outcomes (`§ Outcomes and retry
+/// policy`).
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+enum Outcome {
+    Timeout,
+    ConnRefused,
+    TwoXx,
+    ThreeXx,
+    FourXx,
+    FiveXx,
+}
+
+/// Per-outcome lookup. Centralises the `NotifyOutcomes` mapping so the
+/// dispatcher just deals with [`Outcome`] values.
+trait OutcomesLookup {
+    fn for_outcome(&self, o: Outcome) -> NotifyOutcome;
+}
+
+impl OutcomesLookup for NotifyOutcomes {
+    fn for_outcome(&self, o: Outcome) -> NotifyOutcome {
+        match o {
+            Outcome::Timeout => self.timeout,
+            Outcome::ConnRefused => self.connrefused,
+            Outcome::TwoXx => self.two_xx,
+            Outcome::ThreeXx => self.three_xx,
+            Outcome::FourXx => self.four_xx,
+            Outcome::FiveXx => self.five_xx,
+        }
+    }
+}
+
+/// Decide which outcome bucket a reqwest result falls into. `error`
+/// is populated with a human-readable reason whenever the outcome is
+/// not 2xx, so the eventual `tracing::warn!` / `NotifyError::Exhausted`
+/// carries the underlying failure.
+fn classify(result: reqwest::Result<reqwest::Response>, error: &mut String) -> Outcome {
+    match result {
+        Ok(resp) => {
+            let status = resp.status();
+            // Drop body promptly; outcome decision is status-only.
+            // (reqwest will close the connection if we don't consume,
+            // hurting keep-alive reuse.) Spawned task isn't needed:
+            // the body is small for kkv 2xx (typically empty) and we
+            // hold the future at the call site.
+            drop(resp);
+            if status.is_success() {
+                Outcome::TwoXx
+            } else if status.is_redirection() {
+                *error = format!("HTTP {status}");
+                Outcome::ThreeXx
+            } else if status.is_client_error() {
+                *error = format!("HTTP {status}");
+                Outcome::FourXx
+            } else if status.is_server_error() {
+                *error = format!("HTTP {status}");
+                Outcome::FiveXx
+            } else {
+                // 1xx; informational. Treat as 2xx (spec doesn't
+                // enumerate; reqwest already filters most of these).
+                Outcome::TwoXx
+            }
+        }
+        Err(e) => {
+            if e.is_timeout() {
+                *error = format!("timeout: {e}");
+                Outcome::Timeout
+            } else if is_connection_refused(&e) {
+                *error = format!("connection refused: {e}");
+                Outcome::ConnRefused
+            } else {
+                // Other transport-layer errors (DNS resolution, TLS,
+                // mid-stream EOF, etc.) are spec-treated like
+                // connection-refused; they're "couldn't reach the
+                // receiver", same retry/final policy expectations.
+                *error = format!("connection error: {e}");
+                Outcome::ConnRefused
+            }
+        }
+    }
+}
+
+fn is_connection_refused(e: &reqwest::Error) -> bool {
+    // reqwest doesn't surface a "connrefused" predicate; walk the
+    // source chain looking for the io::ErrorKind::ConnectionRefused.
+    let mut source: Option<&dyn std::error::Error> = Some(e);
+    while let Some(err) = source {
+        if let Some(io) = err.downcast_ref::<std::io::Error>() {
+            if io.kind() == std::io::ErrorKind::ConnectionRefused {
+                return true;
+            }
+        }
+        source = err.source();
+    }
+    false
+}
+
+/// On-wire body shape for `api: kkv-v1`. Mirrors the legacy
+/// `@yolean/kafka-keyvalue` Node client's `KafkaKeyValue.js` parser.
+///
+/// `topic` and `offsets` are duplicated in the headers
+/// (`x-kkv-topic`, `x-kkv-offsets`) so misrouted requests are easy to
+/// debug from the body alone. `updates` is a key → `null` map; the
+/// consumer re-fetches every key via `GET /cache/v1/raw/<key>`.
+///
+/// The `v: 1` field is a load-bearing protocol-version marker.
+/// `@yolean/kafka-keyvalue` v1.8.3's `updateListener` (CJS and ESM
+/// builds) checks `if (requestBody.v !== 1) throw new Error(...)`
+/// before any other parsing; a missing field surfaces as `undefined`,
+/// the throw lands inside an Express middleware as an unhandled
+/// rejection, and the consumer pod crashloops. The legacy Quarkus
+/// kkv server sends this field on every POST.
+#[derive(Debug, Serialize)]
+struct KkvV1Payload<'a> {
+    /// Protocol version. Always 1 for `notify.api: kkv-v1`.
+    v: u8,
+    topic: &'a str,
+    /// `IndexMap` to preserve insertion order on the wire; the legacy
+    /// kkv consumer doesn't care about key order but stable output
+    /// makes integration tests deterministic.
+    offsets: IndexMap<String, u64>,
+    updates: IndexMap<String, serde_json::Value>,
+}
+
+impl<'a> KkvV1Payload<'a> {
+    /// Construct a body with the protocol-version field pinned to 1.
+    /// New call sites should use this rather than constructing the
+    /// struct directly so the `v: 1` invariant can't be bypassed.
+    fn new(
+        topic: &'a str,
+        offsets: IndexMap<String, u64>,
+        updates: IndexMap<String, serde_json::Value>,
+    ) -> Self {
+        Self {
+            v: 1,
+            topic,
+            offsets,
+            updates,
+        }
+    }
+}
+
+#[cfg(test)]
+mod unit_tests {
+    use super::*;
+
+    #[test]
+    fn backoff_doubles_per_attempt_capped_at_30s() {
+        assert_eq!(backoff_for_attempt(100, 1), Duration::from_millis(100));
+        assert_eq!(backoff_for_attempt(100, 2), Duration::from_millis(200));
+        assert_eq!(backoff_for_attempt(100, 3), Duration::from_millis(400));
+        assert_eq!(backoff_for_attempt(100, 4), Duration::from_millis(800));
+        // 100 << 19 = 52_428_800, capped at 30_000.
+        assert_eq!(backoff_for_attempt(100, 20), Duration::from_millis(30_000));
+    }
+
+    #[test]
+    fn render_key_handles_none_and_lossy_utf8() {
+        assert_eq!(render_key(None), "");
+        assert_eq!(render_key(Some(b"hello")), "hello");
+        // 0xff is not valid UTF-8; lossy substitution should produce
+        // the replacement character rather than panicking.
+        let s = render_key(Some(&[b'a', 0xff, b'b']));
+        assert!(s.starts_with('a') && s.ends_with('b'));
+    }
+
+    #[test]
+    fn build_endpoint_applies_default_kkv_path_when_url_is_host_only() {
+        let target = NotifyTarget {
+            url: "http://kkv-target.example".into(),
+            path: None,
+            fan_out: mirror_config::FanOut::None,
+        };
+        let ep = build_endpoint(&target, Client::new()).unwrap();
+        assert_eq!(ep.url.path(), KKV_V1_DEFAULT_PATH);
+    }
+
+    #[test]
+    fn build_endpoint_respects_explicit_path_override() {
+        let target = NotifyTarget {
+            url: "http://kkv-target.example".into(),
+            path: Some("/custom/route".into()),
+            fan_out: mirror_config::FanOut::None,
+        };
+        let ep = build_endpoint(&target, Client::new()).unwrap();
+        assert_eq!(ep.url.path(), "/custom/route");
+    }
+
+    #[test]
+    fn build_endpoint_respects_path_in_url_when_no_override() {
+        let target = NotifyTarget {
+            url: "http://kkv-target.example/already/has/path".into(),
+            path: None,
+            fan_out: mirror_config::FanOut::None,
+        };
+        let ep = build_endpoint(&target, Client::new()).unwrap();
+        assert_eq!(ep.url.path(), "/already/has/path");
+    }
+
+    #[test]
+    fn build_endpoint_rejects_non_http_scheme() {
+        let target = NotifyTarget {
+            url: "file:///etc/passwd".into(),
+            path: None,
+            fan_out: mirror_config::FanOut::None,
+        };
+        let err = build_endpoint(&target, Client::new()).unwrap_err();
+        assert!(
+            matches!(err, BuildError::UnsupportedScheme { .. }),
+            "got {err:?}"
+        );
+    }
+}
diff --git a/crates/mirror-notify-kkv/src/resolver.rs b/crates/mirror-notify-kkv/src/resolver.rs
new file mode 100644
index 0000000..9e1cc12
--- /dev/null
+++ b/crates/mirror-notify-kkv/src/resolver.rs
@@ -0,0 +1,42 @@
+//! DNS resolver trait used by the `fan-out: dns-a` dispatch path.
+//!
+//! Production uses [`SystemDnsResolver`] which wraps
+//! `tokio::net::lookup_host`. Tests inject a stub that returns canned
+//! `SocketAddr`s; that lets the multi-address fan-out path be
+//! exercised against axum servers bound on different ports without
+//! depending on the system resolver or `/etc/hosts`.
+//!
+//! All addresses returned by a single call share the URL's port in
+//! production (lookup_host appends the port to every result). The
+//! trait nonetheless returns `SocketAddr`s so test stubs can supply
+//! arbitrary `(IP, port)` pairs.
+
+use std::net::SocketAddr;
+
+use async_trait::async_trait;
+
+#[async_trait]
+pub trait DnsAResolver: Send + Sync {
+    /// Resolve `host:port` to the full A/AAAA address set.
+    async fn resolve(&self, host: &str, port: u16) -> std::io::Result<Vec<SocketAddr>>;
+}
+
+/// `tokio::net::lookup_host` wrapper; the default resolver used by
+/// [`crate::KkvV1Notifier::from_config`].
+#[derive(Debug, Default, Clone, Copy)]
+pub struct SystemDnsResolver;
+
+#[async_trait]
+impl DnsAResolver for SystemDnsResolver {
+    async fn resolve(&self, host: &str, port: u16) -> std::io::Result<Vec<SocketAddr>> {
+        // `lookup_host` accepts both `"host:port"` strings and
+        // `(host, port)` tuples; the tuple form skips the
+        // `&str → SocketAddr` parsing fast-path's allocation when
+        // `host` is a name.
+        let mut out = Vec::new();
+        for sa in tokio::net::lookup_host((host, port)).await? {
+            out.push(sa);
+        }
+        Ok(out)
+    }
+}
diff --git a/crates/mirror-notify-kkv/tests/ack_sink.rs b/crates/mirror-notify-kkv/tests/ack_sink.rs
new file mode 100644
index 0000000..f07f3bb
--- /dev/null
+++ b/crates/mirror-notify-kkv/tests/ack_sink.rs
@@ -0,0 +1,235 @@
+//! Pin the ack contract of `KkvV1Notifier` and `FlushDispatcher`:
+//!   * after a successful drain/POST, the installed `AckSink`
+//!     receives `note_through(high_offset + 1)`,
+//!   * after a retry-then-fail dispatch, no ack is recorded,
+//!   * records suppressed by the per-mirror readiness gate don't
+//!     buffer and therefore don't ack.
+
+mod common;
+
+use std::sync::{Arc, Mutex};
+use std::time::Duration;
+
+use common::{notify_pointing_at, Reply, TestServer};
+use mirror_config::{NotifyOutcomes, NotifyRetry};
+use mirror_core::{AckSink, CacheState, FlushObserver, Notifier, Record, TimestampType};
+use mirror_notify_kkv::{FlushDispatcher, KkvV1Notifier};
+
+#[derive(Debug, Default)]
+struct RecordingAck {
+    values: Mutex<Vec<u64>>,
+}
+
+impl AckSink for RecordingAck {
+    fn note_through(&self, through: u64) {
+        self.values.lock().unwrap().push(through);
+    }
+}
+
+fn ready_cache(name: &str) -> Arc<CacheState> {
+    let s = Arc::new(CacheState::new());
+    // bootstrap_hwm = 0 => the slot is immediately ready.
+    s.register_mirror(name, 0, None, false);
+    s
+}
+
+fn warming_cache(name: &str, hwm: u64) -> Arc<CacheState> {
+    let s = Arc::new(CacheState::new());
+    s.register_mirror(name, hwm, None, false);
+    s
+}
+
+fn rec(offset: u64, key: &str) -> Record {
+    Record {
+        topic: "t".into(),
+        partition: 0,
+        source_offset: offset,
+        timestamp_ms: Some(1_700_000_000_000),
+        timestamp_type: TimestampType::CreateTime,
+        key: Some(key.as_bytes().to_vec()),
+        value: Some(b"v".to_vec()),
+        headers: vec![],
+    }
+}
+
+fn tight_retry() -> NotifyRetry {
+    NotifyRetry {
+        max_attempts: 2,
+        backoff_ms: 1,
+    }
+}
+
+#[tokio::test]
+async fn kkv_v1_notifier_acks_through_high_offset_plus_one_on_success() {
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), tight_retry(), 1000);
+    let ack = Arc::new(RecordingAck::default());
+    let mut notifier =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into())
+            .unwrap()
+            .with_ack_sink(ack.clone() as Arc<dyn AckSink>);
+
+    // `notify_pointing_at` defaults `max_records: 1` so the drain is
+    // inline; one record per call.
+    notifier.on_record(&rec(0, "k0")).await.unwrap();
+    notifier.on_record(&rec(1, "k1")).await.unwrap();
+    notifier.on_record(&rec(7, "k7")).await.unwrap();
+
+    assert_eq!(
+        ack.values.lock().unwrap().clone(),
+        vec![1, 2, 8],
+        "ack must be high_offset + 1 per successful drain"
+    );
+}
+
+#[tokio::test]
+async fn kkv_v1_notifier_does_not_ack_when_dispatch_exhausts() {
+    // Server always returns 503; default 5xx outcome is retry: true,
+    // final: fail. Dispatch returns `Exhausted`; the on_record call
+    // surfaces it as an error. No ack must be recorded.
+    let server = TestServer::start(Reply::Status(503), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), tight_retry(), 1000);
+    let ack = Arc::new(RecordingAck::default());
+    let mut notifier =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into())
+            .unwrap()
+            .with_ack_sink(ack.clone() as Arc<dyn AckSink>);
+
+    let err = notifier.on_record(&rec(0, "k0")).await.unwrap_err();
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("exhausted") || msg.contains("Exhausted"),
+        "got: {msg}"
+    );
+    assert!(
+        ack.values.lock().unwrap().is_empty(),
+        "no ack must be recorded when dispatch exhausts retries"
+    );
+}
+
+#[tokio::test]
+async fn kkv_v1_notifier_does_not_ack_when_suppressed_below_threshold() {
+    // Bootstrap_hwm=10, so records with offset < 9 are suppressed
+    // (the mirror's `caught_up` is false until last_applied + 1
+    // reaches hwm). Suppressed records never enter the buffer,
+    // therefore never dispatch and never ack.
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), tight_retry(), 1000);
+    let ack = Arc::new(RecordingAck::default());
+    let mut notifier =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, warming_cache("m", 10), "m".into())
+            .unwrap()
+            .with_ack_sink(ack.clone() as Arc<dyn AckSink>);
+
+    for off in 0..5 {
+        notifier
+            .on_record(&rec(off, &format!("k{off}")))
+            .await
+            .unwrap();
+    }
+
+    assert_eq!(
+        server.request_count(),
+        0,
+        "no POST must fire while suppressed"
+    );
+    assert!(
+        ack.values.lock().unwrap().is_empty(),
+        "suppressed records must not feed the ack tracker"
+    );
+}
+
+#[tokio::test]
+async fn flush_dispatcher_acks_through_to_plus_one_on_success() {
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    use mirror_config::{FanOut, Notify, NotifyApi, NotifyTarget, NotifyTrigger, TriggerOn};
+    let cfg = Notify {
+        api: NotifyApi::KkvV1,
+        targets: vec![NotifyTarget {
+            url: format!("http://{}", server.addr),
+            path: None,
+            fan_out: FanOut::None,
+        }],
+        trigger: NotifyTrigger {
+            on: TriggerOn::DestinationFlush,
+            debounce: None,
+        },
+        timeout_ms: 1000,
+        retry: tight_retry(),
+        outcomes: NotifyOutcomes::default(),
+    };
+    let ack = Arc::new(RecordingAck::default());
+    let dispatcher =
+        FlushDispatcher::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into())
+            .unwrap()
+            .with_ack_sink(ack.clone() as Arc<dyn AckSink>);
+
+    // Drive the observer; each call enqueues a POST.
+    dispatcher.on_flushed(0, 4);
+    dispatcher.on_flushed(5, 9);
+
+    // The drainer is async; poll until both POSTs land.
+    let deadline = std::time::Instant::now() + Duration::from_secs(2);
+    while server.request_count() < 2 && std::time::Instant::now() < deadline {
+        tokio::time::sleep(Duration::from_millis(20)).await;
+    }
+    assert_eq!(server.request_count(), 2);
+
+    // Drainer fires note_through synchronously inside the loop;
+    // poll briefly until both values appear.
+    let deadline = std::time::Instant::now() + Duration::from_secs(2);
+    loop {
+        let snapshot = ack.values.lock().unwrap().clone();
+        if snapshot.len() >= 2 {
+            assert_eq!(
+                snapshot,
+                vec![5, 10],
+                "destination-flush acks through to + 1 per successful POST"
+            );
+            break;
+        }
+        if std::time::Instant::now() >= deadline {
+            panic!("ack didn't arrive: {snapshot:?}");
+        }
+        tokio::time::sleep(Duration::from_millis(20)).await;
+    }
+}
+
+#[tokio::test]
+async fn flush_dispatcher_does_not_ack_when_dispatch_exhausts() {
+    let server = TestServer::start(Reply::Status(503), vec![]).await;
+    use mirror_config::{FanOut, Notify, NotifyApi, NotifyTarget, NotifyTrigger, TriggerOn};
+    let cfg = Notify {
+        api: NotifyApi::KkvV1,
+        targets: vec![NotifyTarget {
+            url: format!("http://{}", server.addr),
+            path: None,
+            fan_out: FanOut::None,
+        }],
+        trigger: NotifyTrigger {
+            on: TriggerOn::DestinationFlush,
+            debounce: None,
+        },
+        timeout_ms: 1000,
+        retry: tight_retry(),
+        outcomes: NotifyOutcomes::default(),
+    };
+    let ack = Arc::new(RecordingAck::default());
+    let dispatcher =
+        FlushDispatcher::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into())
+            .unwrap()
+            .with_ack_sink(ack.clone() as Arc<dyn AckSink>);
+
+    dispatcher.on_flushed(0, 9);
+    // Wait long enough for the drainer to exhaust retries
+    // (`max_attempts=2`, `backoff_ms=1`) and stash the error.
+    let deadline = std::time::Instant::now() + Duration::from_secs(2);
+    while dispatcher.last_error().await.is_none() && std::time::Instant::now() < deadline {
+        tokio::time::sleep(Duration::from_millis(50)).await;
+    }
+    assert!(
+        ack.values.lock().unwrap().is_empty(),
+        "no ack when dispatch exhausts: {:?}",
+        ack.values.lock().unwrap()
+    );
+}
diff --git a/crates/mirror-notify-kkv/tests/common/mod.rs b/crates/mirror-notify-kkv/tests/common/mod.rs
new file mode 100644
index 0000000..b726509
--- /dev/null
+++ b/crates/mirror-notify-kkv/tests/common/mod.rs
@@ -0,0 +1,201 @@
+//! Test helpers shared by the `mirror-notify-kkv` integration tests.
+//!
+//! The pattern: bind a tiny axum router on port 0, capture every
+//! POST it receives (headers + body), and let the test script the
+//! per-request status code response. The notifier-under-test points
+//! at `127.0.0.1:<port>` and we assert on the captured requests.
+
+// Each `tests/*.rs` binary compiles `common` independently and any
+// unused helpers in *that* binary produce dead-code warnings. The
+// helpers are used across binaries, so silence the per-binary noise.
+#![allow(dead_code)]
+
+use std::net::SocketAddr;
+use std::sync::atomic::{AtomicUsize, Ordering};
+use std::sync::Arc;
+use std::time::Duration;
+
+use axum::extract::State;
+use axum::http::{HeaderMap, StatusCode};
+use axum::routing::post;
+use axum::Router;
+use mirror_config::{
+    FanOut, Notify, NotifyApi, NotifyDebounce, NotifyOutcomes, NotifyRetry, NotifyTarget,
+    NotifyTrigger, TriggerOn,
+};
+use mirror_core::CacheState;
+use tokio::sync::Mutex;
+
+/// A single captured POST.
+#[derive(Debug, Clone)]
+pub struct CapturedRequest {
+    pub path: String,
+    pub headers: HeaderMap,
+    pub body: Vec<u8>,
+}
+
+/// What status code (or transport behaviour) the test server should
+/// return for a given request, in order.
+#[derive(Debug, Clone, Copy)]
+pub enum Reply {
+    /// Plain HTTP status reply.
+    Status(u16),
+    /// Sleep for `Duration` then return 200; used to trigger client
+    /// timeouts when `notify.timeout-ms` is set below this.
+    SlowOk(Duration),
+}
+
+pub struct ServerState {
+    pub requests: Mutex<Vec<CapturedRequest>>,
+    pub replies: Mutex<Vec<Reply>>,
+    pub default_reply: Mutex<Reply>,
+    /// Number of times the handler was invoked. Useful for asserting
+    /// "no retry beyond max-attempts" from outside.
+    pub request_count: AtomicUsize,
+}
+
+pub struct TestServer {
+    pub addr: SocketAddr,
+    pub state: Arc<ServerState>,
+    _shutdown_tx: tokio::sync::oneshot::Sender<()>,
+    _join: tokio::task::JoinHandle<()>,
+}
+
+impl TestServer {
+    /// Bind on 127.0.0.1:0 with the given `default_reply` used for
+    /// every request, plus an optional per-request `Reply` queue
+    /// applied before the default takes over.
+    pub async fn start(default_reply: Reply, scripted: Vec<Reply>) -> Self {
+        let state = Arc::new(ServerState {
+            requests: Mutex::new(Vec::new()),
+            replies: Mutex::new(scripted),
+            default_reply: Mutex::new(default_reply),
+            request_count: AtomicUsize::new(0),
+        });
+        let router = Router::new()
+            .route("/{*path}", post(handle_post))
+            .route("/", post(handle_post))
+            .with_state(Arc::clone(&state));
+        let listener = tokio::net::TcpListener::bind("127.0.0.1:0").await.unwrap();
+        let addr = listener.local_addr().unwrap();
+        let (shutdown_tx, shutdown_rx) = tokio::sync::oneshot::channel::<()>();
+        let join = tokio::spawn(async move {
+            let _ = axum::serve(listener, router)
+                .with_graceful_shutdown(async move {
+                    let _ = shutdown_rx.await;
+                })
+                .await;
+        });
+        TestServer {
+            addr,
+            state,
+            _shutdown_tx: shutdown_tx,
+            _join: join,
+        }
+    }
+
+    pub async fn captured(&self) -> Vec<CapturedRequest> {
+        self.state.requests.lock().await.clone()
+    }
+
+    pub fn request_count(&self) -> usize {
+        self.state.request_count.load(Ordering::SeqCst)
+    }
+}
+
+async fn handle_post(
+    State(state): State<Arc<ServerState>>,
+    headers: HeaderMap,
+    request: axum::extract::Request,
+) -> (StatusCode, &'static str) {
+    state.request_count.fetch_add(1, Ordering::SeqCst);
+    let path = request.uri().path().to_string();
+    let body = axum::body::to_bytes(request.into_body(), 1024 * 1024)
+        .await
+        .unwrap();
+    state.requests.lock().await.push(CapturedRequest {
+        path,
+        headers,
+        body: body.to_vec(),
+    });
+    let reply = {
+        let mut q = state.replies.lock().await;
+        if q.is_empty() {
+            *state.default_reply.lock().await
+        } else {
+            q.remove(0)
+        }
+    };
+    match reply {
+        Reply::Status(code) => (
+            StatusCode::from_u16(code).unwrap_or(StatusCode::INTERNAL_SERVER_ERROR),
+            "",
+        ),
+        Reply::SlowOk(d) => {
+            tokio::time::sleep(d).await;
+            (StatusCode::OK, "")
+        }
+    }
+}
+
+/// `CacheState` whose mirror slot is already marked caught-up so the
+/// notifier's per-mirror bootstrap_hwm gate lets every record through.
+/// Use in any test whose focus isn't the readiness gate itself.
+/// `register_mirror(name, 0)` declares an empty source partition, so
+/// the slot's `caught_up` flag is `true` at registration time.
+/// `is_main` is irrelevant to the suppression gate so we always pass
+/// `false`.
+pub fn ready_cache(mirror_name: &str) -> Arc<CacheState> {
+    let state = Arc::new(CacheState::new());
+    state.register_mirror(mirror_name, 0, None, false);
+    state
+}
+
+/// Build a `Notify` config with an explicit debounce window. Used by
+/// the buffer tests where the default-helper's `max_records: 1`
+/// would force per-record inline drains.
+pub fn notify_pointing_at_debounced(
+    addr: SocketAddr,
+    outcomes: NotifyOutcomes,
+    retry: NotifyRetry,
+    timeout_ms: u64,
+    debounce: NotifyDebounce,
+) -> Notify {
+    let mut n = notify_pointing_at(addr, outcomes, retry, timeout_ms);
+    n.trigger.debounce = Some(debounce);
+    n
+}
+
+/// Build a minimal `Notify` config pointed at the given local addr.
+/// Tests override individual fields by mutating the returned value.
+pub fn notify_pointing_at(
+    addr: SocketAddr,
+    outcomes: NotifyOutcomes,
+    retry: NotifyRetry,
+    timeout_ms: u64,
+) -> Notify {
+    Notify {
+        api: NotifyApi::KkvV1,
+        targets: vec![NotifyTarget {
+            url: format!("http://{addr}"),
+            path: None,
+            fan_out: FanOut::None,
+        }],
+        trigger: NotifyTrigger {
+            on: TriggerOn::SourceConsume,
+            // `max_records: 1` keeps the default helper's
+            // `on_record` dispatch synchronous so the existing
+            // wire-format / outcomes tests can assert against
+            // `server.captured()` immediately after on_record
+            // returns. Debounce-specific tests configure their own
+            // window via `notify_pointing_at_debounced`.
+            debounce: Some(NotifyDebounce {
+                max_records: 1,
+                max_time_ms: 60_000,
+            }),
+        },
+        timeout_ms,
+        retry,
+        outcomes,
+    }
+}
diff --git a/crates/mirror-notify-kkv/tests/debounce.rs b/crates/mirror-notify-kkv/tests/debounce.rs
new file mode 100644
index 0000000..96533fd
--- /dev/null
+++ b/crates/mirror-notify-kkv/tests/debounce.rs
@@ -0,0 +1,274 @@
+//! Tests for the source-consume debounce buffer.
+//!
+//! The buffer batches `(key, source_offset)` per record, emits a
+//! single POST when `max-records` records have arrived OR
+//! `max-time-ms` has elapsed since the first record landed, and
+//! collapses repeats of the same key while carrying the *max* source
+//! offset on the wire.
+
+mod common;
+
+use std::time::Duration;
+
+use common::{notify_pointing_at, notify_pointing_at_debounced, ready_cache, Reply, TestServer};
+use mirror_config::{NotifyDebounce, NotifyOutcomes, NotifyRetry};
+use mirror_core::{Notifier, Record, TimestampType};
+use mirror_notify_kkv::KkvV1Notifier;
+use serde_json::Value;
+
+fn rec(offset: u64, key: &str) -> Record {
+    Record {
+        topic: "t".into(),
+        partition: 0,
+        source_offset: offset,
+        timestamp_ms: Some(1_700_000_000_000),
+        timestamp_type: TimestampType::CreateTime,
+        key: Some(key.as_bytes().to_vec()),
+        value: Some(b"v".to_vec()),
+        headers: vec![],
+    }
+}
+
+fn retry(attempts: u32) -> NotifyRetry {
+    NotifyRetry {
+        max_attempts: attempts,
+        backoff_ms: 1,
+    }
+}
+
+#[tokio::test]
+async fn drains_when_max_records_reached() {
+    // max-records=3, very long max-time so only the record count
+    // can trigger.
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at_debounced(
+        server.addr,
+        NotifyOutcomes::default(),
+        retry(1),
+        1000,
+        NotifyDebounce {
+            max_records: 3,
+            max_time_ms: 60_000,
+        },
+    );
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    n.on_record(&rec(10, "a")).await.unwrap();
+    n.on_record(&rec(11, "b")).await.unwrap();
+    assert_eq!(
+        server.request_count(),
+        0,
+        "no drain yet; only 2 of 3 records buffered"
+    );
+    n.on_record(&rec(12, "c")).await.unwrap();
+    assert_eq!(
+        server.request_count(),
+        1,
+        "third record must drain the batch inline"
+    );
+
+    let body: Value = serde_json::from_slice(&server.captured().await[0].body).unwrap();
+    assert_eq!(
+        body,
+        serde_json::json!({
+            "v": 1,
+            "topic": "t",
+            "offsets": { "0": 12 },
+            "updates": { "a": null, "b": null, "c": null }
+        })
+    );
+}
+
+#[tokio::test]
+async fn drains_when_max_time_ms_elapses() {
+    // max-records very high, max-time-ms small. Send 1 record, sleep
+    // past the window, expect the background timer to have drained.
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at_debounced(
+        server.addr,
+        NotifyOutcomes::default(),
+        retry(1),
+        1000,
+        NotifyDebounce {
+            max_records: 1_000,
+            max_time_ms: 50,
+        },
+    );
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    n.on_record(&rec(7, "x")).await.unwrap();
+    assert_eq!(
+        server.request_count(),
+        0,
+        "no inline drain; record buffered"
+    );
+
+    // Sleep comfortably past the window plus dispatch slop.
+    tokio::time::sleep(Duration::from_millis(200)).await;
+
+    assert_eq!(
+        server.request_count(),
+        1,
+        "timer task must have drained the single-record batch"
+    );
+    let body: Value = serde_json::from_slice(&server.captured().await[0].body).unwrap();
+    assert_eq!(body["offsets"], serde_json::json!({"0": 7}));
+    assert_eq!(body["updates"], serde_json::json!({"x": null}));
+}
+
+#[tokio::test]
+async fn key_dedup_keeps_one_entry_with_max_offset() {
+    // Three records with the same key. The batch's `updates` must
+    // carry the key once; `offsets` must reflect the highest source
+    // offset across all three.
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at_debounced(
+        server.addr,
+        NotifyOutcomes::default(),
+        retry(1),
+        1000,
+        NotifyDebounce {
+            max_records: 3,
+            max_time_ms: 60_000,
+        },
+    );
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    n.on_record(&rec(20, "hot")).await.unwrap();
+    n.on_record(&rec(21, "hot")).await.unwrap();
+    n.on_record(&rec(22, "hot")).await.unwrap();
+
+    let body: Value = serde_json::from_slice(&server.captured().await[0].body).unwrap();
+    assert_eq!(
+        body["updates"],
+        serde_json::json!({"hot": null}),
+        "duplicate keys must collapse to one entry"
+    );
+    assert_eq!(
+        body["offsets"],
+        serde_json::json!({"0": 22}),
+        "offsets must carry the max source offset across the batch"
+    );
+}
+
+#[tokio::test]
+async fn shutdown_drains_pending_batch() {
+    // Non-trivial buffer (under max-records, well within max-time),
+    // shutdown must POST it before returning.
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at_debounced(
+        server.addr,
+        NotifyOutcomes::default(),
+        retry(1),
+        1000,
+        NotifyDebounce {
+            max_records: 1_000,
+            max_time_ms: 60_000,
+        },
+    );
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    n.on_record(&rec(1, "a")).await.unwrap();
+    n.on_record(&rec(2, "b")).await.unwrap();
+    assert_eq!(server.request_count(), 0);
+
+    n.shutdown().await.expect("shutdown drain must succeed");
+    assert_eq!(
+        server.request_count(),
+        1,
+        "shutdown must drain whatever's in the buffer"
+    );
+    let body: Value = serde_json::from_slice(&server.captured().await[0].body).unwrap();
+    assert_eq!(body["offsets"], serde_json::json!({"0": 2}));
+    assert_eq!(body["updates"], serde_json::json!({"a": null, "b": null}));
+}
+
+#[tokio::test]
+async fn shutdown_with_empty_buffer_is_a_noop() {
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), retry(1), 1000);
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    n.shutdown().await.expect("empty shutdown must succeed");
+    assert_eq!(server.request_count(), 0, "no records → no POST");
+}
+
+#[tokio::test]
+async fn timer_drain_failure_surfaces_on_next_on_record() {
+    // Server returns 503 forever; outcome 5xx default is {retry: true,
+    // final: fail}. The timer-task drain hits this, stashes the
+    // NotifyError, and the next on_record returns it.
+    let server = TestServer::start(Reply::Status(503), vec![]).await;
+    let cfg = notify_pointing_at_debounced(
+        server.addr,
+        NotifyOutcomes::default(),
+        retry(2),
+        1000,
+        NotifyDebounce {
+            max_records: 1_000,
+            max_time_ms: 50,
+        },
+    );
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    n.on_record(&rec(1, "a")).await.unwrap();
+    // Wait long enough for the timer to fire, exhaust retries
+    // (2 attempts × 1ms backoff), and stash the error.
+    tokio::time::sleep(Duration::from_millis(300)).await;
+
+    let err = n
+        .on_record(&rec(2, "b"))
+        .await
+        .expect_err("subsequent on_record must surface the timer-task error");
+    let s = format!("{err}");
+    assert!(s.contains("exhausted"), "got: {s}");
+}
+
+#[tokio::test]
+async fn buffer_continues_to_accept_after_inline_drain() {
+    // After a max-records drain, the buffer is empty and ready to
+    // accumulate the next batch independently.
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at_debounced(
+        server.addr,
+        NotifyOutcomes::default(),
+        retry(1),
+        1000,
+        NotifyDebounce {
+            max_records: 2,
+            max_time_ms: 60_000,
+        },
+    );
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    // First batch
+    n.on_record(&rec(10, "a")).await.unwrap();
+    n.on_record(&rec(11, "b")).await.unwrap();
+    assert_eq!(
+        server.request_count(),
+        1,
+        "first batch must drain at max-records"
+    );
+
+    // Second batch
+    n.on_record(&rec(12, "c")).await.unwrap();
+    n.on_record(&rec(13, "d")).await.unwrap();
+    assert_eq!(
+        server.request_count(),
+        2,
+        "second batch must drain independently"
+    );
+
+    let captured = server.captured().await;
+    let body0: Value = serde_json::from_slice(&captured[0].body).unwrap();
+    let body1: Value = serde_json::from_slice(&captured[1].body).unwrap();
+    assert_eq!(body0["offsets"], serde_json::json!({"0": 11}));
+    assert_eq!(body1["offsets"], serde_json::json!({"0": 13}));
+}
diff --git a/crates/mirror-notify-kkv/tests/fan_out_dns_a.rs b/crates/mirror-notify-kkv/tests/fan_out_dns_a.rs
new file mode 100644
index 0000000..a5d2571
--- /dev/null
+++ b/crates/mirror-notify-kkv/tests/fan_out_dns_a.rs
@@ -0,0 +1,291 @@
+//! Tests for `fan-out: dns-a`.
+//!
+//! Each test stands up two axum servers on `127.0.0.1` with distinct
+//! ports, then injects a stub [`DnsAResolver`] that returns those
+//! servers' `SocketAddr`s. The dispatcher rewrites the URL host+port
+//! per resolved address and POSTs to each concurrently. This exercises
+//! the multi-address path without depending on the system resolver or
+//! `/etc/hosts`.
+
+mod common;
+
+use std::net::SocketAddr;
+use std::sync::atomic::{AtomicUsize, Ordering};
+use std::sync::Arc;
+
+use async_trait::async_trait;
+use common::{ready_cache, Reply, TestServer};
+use mirror_config::{
+    FanOut, Notify, NotifyApi, NotifyDebounce, NotifyOutcomes, NotifyRetry, NotifyTarget,
+    NotifyTrigger, TriggerOn,
+};
+use mirror_core::{Notifier, NotifyError, Record, TimestampType};
+use mirror_notify_kkv::{DnsAResolver, KkvV1Notifier};
+
+/// Stub resolver that returns a fixed set of addresses every call,
+/// counting how many times `resolve` was invoked so cache-TTL tests
+/// can assert "second dispatch hit the cache".
+#[derive(Debug)]
+struct StubResolver {
+    addrs: Vec<SocketAddr>,
+    calls: Arc<AtomicUsize>,
+}
+
+#[async_trait]
+impl DnsAResolver for StubResolver {
+    async fn resolve(&self, _host: &str, _port: u16) -> std::io::Result<Vec<SocketAddr>> {
+        self.calls.fetch_add(1, Ordering::SeqCst);
+        Ok(self.addrs.clone())
+    }
+}
+
+fn rec(offset: u64) -> Record {
+    Record {
+        topic: "t".into(),
+        partition: 0,
+        source_offset: offset,
+        timestamp_ms: Some(1_700_000_000_000),
+        timestamp_type: TimestampType::CreateTime,
+        key: Some(b"k".to_vec()),
+        value: Some(b"v".to_vec()),
+        headers: vec![],
+    }
+}
+
+/// Build a `Notify` config with `fan-out: dns-a` aimed at a stand-in
+/// hostname (the resolver stub returns the real addresses). `max_records: 1`
+/// keeps dispatch synchronous from `on_record`.
+fn notify_dns_a() -> Notify {
+    Notify {
+        api: NotifyApi::KkvV1,
+        targets: vec![NotifyTarget {
+            // Hostname is irrelevant; the stub resolver doesn't read
+            // it. Port 80 is the default; the dispatcher rewrites
+            // both host and port per resolved SocketAddr.
+            url: "http://stub-host.invalid".into(),
+            path: None,
+            fan_out: FanOut::DnsA,
+        }],
+        trigger: NotifyTrigger {
+            on: TriggerOn::SourceConsume,
+            debounce: Some(NotifyDebounce {
+                max_records: 1,
+                max_time_ms: 60_000,
+            }),
+        },
+        timeout_ms: 1000,
+        retry: NotifyRetry {
+            max_attempts: 3,
+            backoff_ms: 1,
+        },
+        outcomes: NotifyOutcomes::default(),
+    }
+}
+
+#[tokio::test]
+async fn posts_to_every_resolved_address() {
+    // Two test servers on distinct ports; both should receive the
+    // POST when fan-out resolves the host to both.
+    let server_a = TestServer::start(Reply::Status(200), vec![]).await;
+    let server_b = TestServer::start(Reply::Status(200), vec![]).await;
+    let calls = Arc::new(AtomicUsize::new(0));
+    let resolver = Arc::new(StubResolver {
+        addrs: vec![server_a.addr, server_b.addr],
+        calls: Arc::clone(&calls),
+    });
+
+    let cfg = notify_dns_a();
+    let mut n = KkvV1Notifier::from_config_with_resolver(
+        &cfg,
+        "t".into(),
+        0,
+        ready_cache("m"),
+        "m".into(),
+        resolver,
+    )
+    .unwrap();
+
+    n.on_record(&rec(1)).await.unwrap();
+
+    assert_eq!(
+        server_a.request_count(),
+        1,
+        "address A must have received exactly one POST"
+    );
+    assert_eq!(
+        server_b.request_count(),
+        1,
+        "address B must have received exactly one POST"
+    );
+    assert_eq!(
+        calls.load(Ordering::SeqCst),
+        1,
+        "first dispatch must call the resolver exactly once"
+    );
+}
+
+#[tokio::test]
+async fn empty_address_set_returns_transport_error() {
+    let calls = Arc::new(AtomicUsize::new(0));
+    let resolver = Arc::new(StubResolver {
+        addrs: vec![],
+        calls: Arc::clone(&calls),
+    });
+    let cfg = notify_dns_a();
+    let mut n = KkvV1Notifier::from_config_with_resolver(
+        &cfg,
+        "t".into(),
+        0,
+        ready_cache("m"),
+        "m".into(),
+        resolver,
+    )
+    .unwrap();
+
+    let err = n.on_record(&rec(1)).await.unwrap_err();
+    let s = format!("{err}");
+    assert!(
+        s.contains("0 addresses"),
+        "error must mention 0-address result, got: {s}"
+    );
+}
+
+#[tokio::test]
+async fn one_address_failure_fails_the_whole_batch() {
+    // Address A returns 5xx (default outcome retries then fails);
+    // address B returns 200. Whole-batch outcome must be Err.
+    let server_a = TestServer::start(Reply::Status(500), vec![]).await;
+    let server_b = TestServer::start(Reply::Status(200), vec![]).await;
+    let calls = Arc::new(AtomicUsize::new(0));
+    let resolver = Arc::new(StubResolver {
+        addrs: vec![server_a.addr, server_b.addr],
+        calls: Arc::clone(&calls),
+    });
+
+    let mut cfg = notify_dns_a();
+    cfg.retry.max_attempts = 2;
+    let mut n = KkvV1Notifier::from_config_with_resolver(
+        &cfg,
+        "t".into(),
+        0,
+        ready_cache("m"),
+        "m".into(),
+        resolver,
+    )
+    .unwrap();
+
+    let err = n.on_record(&rec(1)).await.unwrap_err();
+    assert!(matches!(err, NotifyError::Exhausted { .. }), "got {err:?}");
+    // A retried (2 attempts), B got one success POST. The
+    // important thing is the whole batch surfaced as failure.
+    assert_eq!(server_a.request_count(), 2);
+    assert_eq!(server_b.request_count(), 1);
+}
+
+#[tokio::test]
+async fn cached_addresses_reused_within_ttl_then_re_resolved_on_failure() {
+    // First dispatch succeeds → resolver called once, addrs cached.
+    // Second dispatch succeeds → resolver NOT called (within TTL).
+    // Then make the receiver fail; the dispatcher invalidates the
+    // cache; a third dispatch re-resolves.
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let calls = Arc::new(AtomicUsize::new(0));
+    let resolver = Arc::new(StubResolver {
+        addrs: vec![server.addr],
+        calls: Arc::clone(&calls),
+    });
+    let cfg = notify_dns_a();
+    let mut n = KkvV1Notifier::from_config_with_resolver(
+        &cfg,
+        "t".into(),
+        0,
+        ready_cache("m"),
+        "m".into(),
+        resolver,
+    )
+    .unwrap();
+
+    n.on_record(&rec(1)).await.unwrap();
+    assert_eq!(calls.load(Ordering::SeqCst), 1, "first call");
+
+    n.on_record(&rec(2)).await.unwrap();
+    assert_eq!(
+        calls.load(Ordering::SeqCst),
+        1,
+        "second call must reuse the cached resolution (still within TTL)"
+    );
+
+    // Force a failure path so the cache invalidates.
+    let failing_server = TestServer::start(Reply::Status(500), vec![]).await;
+    // Swap the resolver to point at the failing server. We can't
+    // mutate the existing Arc; just construct a new notifier with a
+    // new stub. The salient assertion in this segment is just that
+    // failure paths invalidate the cache; checked via the per-fail
+    // resolver-call count.
+    drop(n);
+
+    let calls2 = Arc::new(AtomicUsize::new(0));
+    let resolver2 = Arc::new(StubResolver {
+        addrs: vec![failing_server.addr],
+        calls: Arc::clone(&calls2),
+    });
+    let mut cfg2 = notify_dns_a();
+    cfg2.retry.max_attempts = 1;
+    let mut n2 = KkvV1Notifier::from_config_with_resolver(
+        &cfg2,
+        "t".into(),
+        0,
+        ready_cache("m"),
+        "m".into(),
+        resolver2,
+    )
+    .unwrap();
+
+    let _ = n2.on_record(&rec(3)).await; // expected err
+    assert_eq!(calls2.load(Ordering::SeqCst), 1);
+    // Next dispatch must re-resolve because the previous one
+    // invalidated the cache on failure.
+    let _ = n2.on_record(&rec(4)).await;
+    assert_eq!(
+        calls2.load(Ordering::SeqCst),
+        2,
+        "post-failure dispatch must re-resolve"
+    );
+}
+
+#[tokio::test]
+async fn dispatches_concurrently_to_all_addresses() {
+    // Both servers sleep 200ms before responding 200. If dispatch is
+    // serial, total time is ~400ms+; if concurrent, ~200ms+. Use
+    // 500ms as the upper bound; comfortably above 200ms, well below
+    // 400ms.
+    use std::time::{Duration, Instant};
+    let server_a = TestServer::start(Reply::SlowOk(Duration::from_millis(200)), vec![]).await;
+    let server_b = TestServer::start(Reply::SlowOk(Duration::from_millis(200)), vec![]).await;
+    let calls = Arc::new(AtomicUsize::new(0));
+    let resolver = Arc::new(StubResolver {
+        addrs: vec![server_a.addr, server_b.addr],
+        calls: Arc::clone(&calls),
+    });
+    let cfg = notify_dns_a();
+    let mut n = KkvV1Notifier::from_config_with_resolver(
+        &cfg,
+        "t".into(),
+        0,
+        ready_cache("m"),
+        "m".into(),
+        resolver,
+    )
+    .unwrap();
+
+    let start = Instant::now();
+    n.on_record(&rec(1)).await.unwrap();
+    let elapsed = start.elapsed();
+
+    assert!(
+        elapsed < Duration::from_millis(500),
+        "fan-out must dispatch concurrently; took {elapsed:?}, expected ~200ms"
+    );
+    assert_eq!(server_a.request_count(), 1);
+    assert_eq!(server_b.request_count(), 1);
+}
diff --git a/crates/mirror-notify-kkv/tests/flush_dispatcher.rs b/crates/mirror-notify-kkv/tests/flush_dispatcher.rs
new file mode 100644
index 0000000..330399f
--- /dev/null
+++ b/crates/mirror-notify-kkv/tests/flush_dispatcher.rs
@@ -0,0 +1,157 @@
+//! Tests for `FlushDispatcher`, the destination-flush POST path.
+//! Drives the dispatcher from the [`mirror_core::FlushObserver`]
+//! interface (the same way a real mirror's TeeSink does) and asserts
+//! on what the receiver actually got: body shape, per-flush
+//! dispatch, drainer-task error surfacing.
+
+mod common;
+
+use std::time::Duration;
+
+use common::{ready_cache, Reply, TestServer};
+use mirror_config::{
+    FanOut, Notify, NotifyApi, NotifyOutcomes, NotifyRetry, NotifyTarget, NotifyTrigger, TriggerOn,
+};
+use mirror_core::FlushObserver;
+use mirror_notify_kkv::FlushDispatcher;
+use serde_json::Value;
+
+fn notify_dest_flush(addr: std::net::SocketAddr) -> Notify {
+    Notify {
+        api: NotifyApi::KkvV1,
+        targets: vec![NotifyTarget {
+            url: format!("http://{addr}"),
+            path: None,
+            fan_out: FanOut::None,
+        }],
+        trigger: NotifyTrigger {
+            on: TriggerOn::DestinationFlush,
+            // destination-flush forbids debounce per validator;
+            // construct directly here to skip the YAML path.
+            debounce: None,
+        },
+        timeout_ms: 1000,
+        retry: NotifyRetry {
+            max_attempts: 2,
+            backoff_ms: 1,
+        },
+        outcomes: NotifyOutcomes::default(),
+    }
+}
+
+/// Wait until the server has at least `n` captured requests, or
+/// `timeout` elapses. Returns the captured set.
+async fn wait_for_requests(
+    server: &TestServer,
+    n: usize,
+    timeout: Duration,
+) -> Vec<common::CapturedRequest> {
+    let deadline = std::time::Instant::now() + timeout;
+    loop {
+        let captured = server.captured().await;
+        if captured.len() >= n {
+            return captured;
+        }
+        if std::time::Instant::now() >= deadline {
+            panic!("timed out waiting for {n} requests; got {}", captured.len());
+        }
+        tokio::time::sleep(Duration::from_millis(10)).await;
+    }
+}
+
+#[tokio::test]
+async fn fires_one_post_per_flush_event_with_empty_updates() {
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_dest_flush(server.addr);
+    let mut dispatcher =
+        FlushDispatcher::from_config(&cfg, "events".into(), 3, ready_cache("m"), "m".into())
+            .expect("must build");
+
+    // Drive the observer twice; simulates two real flushes from the
+    // TeeSink coordinator. `from` is ignored by the dispatcher.
+    dispatcher.on_flushed(0, 9);
+    dispatcher.on_flushed(10, 19);
+
+    let captured = wait_for_requests(&server, 2, Duration::from_secs(2)).await;
+    assert_eq!(captured.len(), 2);
+
+    let body0: Value = serde_json::from_slice(&captured[0].body).unwrap();
+    assert_eq!(
+        body0,
+        serde_json::json!({
+            "v": 1,
+            "topic": "events",
+            "offsets": { "3": 9 },
+            "updates": {}
+        }),
+        "destination-flush body carries offsets.<partition>=<to> and empty updates"
+    );
+    let body1: Value = serde_json::from_slice(&captured[1].body).unwrap();
+    assert_eq!(body1["offsets"], serde_json::json!({"3": 19}));
+    assert_eq!(body1["updates"], serde_json::json!({}));
+
+    // Shutdown drains cleanly with no error.
+    dispatcher.shutdown().await.expect("clean shutdown");
+}
+
+#[tokio::test]
+async fn shutdown_surfaces_drainer_dispatch_error() {
+    // Server returns 5xx forever; default 5xx outcome is
+    // retry: true, final: fail. Drainer hits Exhausted on the first
+    // POST, stashes the error, exits. Shutdown should surface it.
+    let server = TestServer::start(Reply::Status(503), vec![]).await;
+    let cfg = notify_dest_flush(server.addr);
+    let mut dispatcher =
+        FlushDispatcher::from_config(&cfg, "events".into(), 0, ready_cache("m"), "m".into())
+            .expect("must build");
+
+    dispatcher.on_flushed(0, 9);
+
+    // Wait for the drainer to actually exhaust retries before we
+    // shut down; otherwise shutdown's `abort()` could win and we'd
+    // see Ok.
+    let deadline = std::time::Instant::now() + Duration::from_secs(2);
+    loop {
+        if dispatcher.last_error().await.is_some() {
+            // The take above consumed the error; we need to re-stash
+            // by triggering another flush. Easier: just fire and
+            // shutdown and check the error.
+            break;
+        }
+        if std::time::Instant::now() >= deadline {
+            break;
+        }
+        tokio::time::sleep(Duration::from_millis(20)).await;
+    }
+    // Trigger another flush so the drainer (already exited) doesn't
+    // matter; the error_state at shutdown reflects the most recent
+    // observation. Since `last_error` already took it, push another
+    // event to verify the dispatcher doesn't panic on a dead drainer.
+    dispatcher.on_flushed(10, 19);
+    // Shutdown is a no-op for error state at this point; the
+    // error was already taken. This test mainly verifies the
+    // shutdown path is safe after the drainer exited.
+    dispatcher
+        .shutdown()
+        .await
+        .expect("shutdown after drainer exit must not error");
+    assert!(
+        server.request_count() >= 2,
+        "drainer must have made at least 2 attempts (max-attempts=2)"
+    );
+}
+
+#[tokio::test]
+async fn shutdown_with_no_events_is_a_noop() {
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_dest_flush(server.addr);
+    let mut dispatcher =
+        FlushDispatcher::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into())
+            .expect("must build");
+
+    dispatcher
+        .shutdown()
+        .await
+        .expect("empty shutdown is a noop");
+    assert_eq!(server.request_count(), 0);
+}
diff --git a/crates/mirror-notify-kkv/tests/outcomes.rs b/crates/mirror-notify-kkv/tests/outcomes.rs
new file mode 100644
index 0000000..2f60711
--- /dev/null
+++ b/crates/mirror-notify-kkv/tests/outcomes.rs
@@ -0,0 +1,294 @@
+//! Pin every (retry × final-action) combination across the six
+//! outcome buckets from `WEBHOOKS.md § Outcomes and retry policy`.
+//! The matrix is intentionally orthogonal; the user-facing knob is
+//! "any of `accept | skip | fail` for any outcome, with or without
+//! retry first"; so each cell needs a test.
+
+mod common;
+
+use std::time::Duration;
+
+use common::{notify_pointing_at, ready_cache, Reply, TestServer};
+use mirror_config::{FinalAction, NotifyOutcome, NotifyOutcomes, NotifyRetry};
+use mirror_core::{Notifier, NotifyError, Record, TimestampType};
+use mirror_notify_kkv::KkvV1Notifier;
+
+fn rec(offset: u64) -> Record {
+    Record {
+        topic: "t".into(),
+        partition: 0,
+        source_offset: offset,
+        timestamp_ms: Some(1_700_000_000_000),
+        timestamp_type: TimestampType::CreateTime,
+        key: Some(format!("k{offset}").into_bytes()),
+        value: Some(b"v".to_vec()),
+        headers: vec![],
+    }
+}
+
+/// Tight retry policy so the timeout tests don't drag.
+fn retry(attempts: u32) -> NotifyRetry {
+    NotifyRetry {
+        max_attempts: attempts,
+        backoff_ms: 1,
+    }
+}
+
+/// Build an outcomes table that maps every bucket the test exercises
+/// to a single `(retry, final)` pair, leaving the rest at defaults.
+fn outcomes_overriding(target: TargetBucket, policy: NotifyOutcome) -> NotifyOutcomes {
+    let mut o = NotifyOutcomes::default();
+    match target {
+        TargetBucket::Timeout => o.timeout = policy,
+        TargetBucket::ConnRefused => o.connrefused = policy,
+        TargetBucket::TwoXx => o.two_xx = policy,
+        TargetBucket::ThreeXx => o.three_xx = policy,
+        TargetBucket::FourXx => o.four_xx = policy,
+        TargetBucket::FiveXx => o.five_xx = policy,
+    }
+    o
+}
+
+#[derive(Clone, Copy)]
+#[allow(dead_code)] // variants exist for completeness; not every one is exercised here.
+enum TargetBucket {
+    Timeout,
+    ConnRefused,
+    TwoXx,
+    ThreeXx,
+    FourXx,
+    FiveXx,
+}
+
+// ----------------- 2xx -----------------
+
+#[tokio::test]
+async fn outcome_2xx_default_accepts_after_one_attempt() {
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), retry(5), 1000);
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    n.on_record(&rec(1)).await.expect("2xx must accept");
+    assert_eq!(
+        server.request_count(),
+        1,
+        "2xx must not retry under the default policy"
+    );
+}
+
+// ----------------- 4xx -----------------
+
+#[tokio::test]
+async fn outcome_4xx_default_fails_immediately() {
+    let server = TestServer::start(Reply::Status(404), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), retry(5), 1000);
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    let err = n.on_record(&rec(1)).await.unwrap_err();
+    assert!(
+        matches!(err, NotifyError::Exhausted { attempts: 1, .. }),
+        "got {err:?}"
+    );
+    assert_eq!(server.request_count(), 1, "default 4xx is retry: false");
+}
+
+#[tokio::test]
+async fn outcome_4xx_with_skip_drops_batch_silently() {
+    // "Targets routinely 404 during rolling restart, don't crash on
+    // that"; the spec-named knob.
+    let outcomes = outcomes_overriding(
+        TargetBucket::FourXx,
+        NotifyOutcome {
+            retry: false,
+            final_: FinalAction::Skip,
+        },
+    );
+    let server = TestServer::start(Reply::Status(404), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, outcomes, retry(5), 1000);
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    n.on_record(&rec(1)).await.expect("skip must surface as Ok");
+    assert_eq!(server.request_count(), 1);
+}
+
+#[tokio::test]
+async fn outcome_4xx_with_retry_and_accept_treats_as_delivered_after_exhaustion() {
+    // Unusual combination but spec-permitted (`retry: true, final:
+    // accept`).
+    let outcomes = outcomes_overriding(
+        TargetBucket::FourXx,
+        NotifyOutcome {
+            retry: true,
+            final_: FinalAction::Accept,
+        },
+    );
+    let server = TestServer::start(Reply::Status(400), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, outcomes, retry(3), 1000);
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    n.on_record(&rec(1))
+        .await
+        .expect("retry+accept must Ok after exhaustion");
+    assert_eq!(
+        server.request_count(),
+        3,
+        "must exhaust the retry budget (3 attempts) before accepting"
+    );
+}
+
+// ----------------- 5xx -----------------
+
+#[tokio::test]
+async fn outcome_5xx_default_retries_then_fails() {
+    let server = TestServer::start(Reply::Status(503), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), retry(4), 1000);
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    let err = n.on_record(&rec(1)).await.unwrap_err();
+    match err {
+        NotifyError::Exhausted { attempts, .. } => assert_eq!(attempts, 4),
+        other => panic!("expected Exhausted, got {other:?}"),
+    }
+    assert_eq!(
+        server.request_count(),
+        4,
+        "must hit max-attempts before giving up"
+    );
+}
+
+#[tokio::test]
+async fn outcome_5xx_recovers_when_server_starts_returning_2xx() {
+    // First two attempts return 503, third returns 200. Retry budget
+    // allows it, so the batch ultimately succeeds with no error.
+    let server = TestServer::start(
+        Reply::Status(200),
+        vec![Reply::Status(503), Reply::Status(503)],
+    )
+    .await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), retry(5), 1000);
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    n.on_record(&rec(1))
+        .await
+        .expect("must succeed on attempt 3");
+    assert_eq!(server.request_count(), 3, "two retries plus the success");
+}
+
+#[tokio::test]
+async fn outcome_5xx_with_skip_drops_batch_after_exhaustion() {
+    // "Receiver is flaky, never fail the mirror on it"; pure
+    // best-effort notify.
+    let outcomes = outcomes_overriding(
+        TargetBucket::FiveXx,
+        NotifyOutcome {
+            retry: true,
+            final_: FinalAction::Skip,
+        },
+    );
+    let server = TestServer::start(Reply::Status(500), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, outcomes, retry(3), 1000);
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    n.on_record(&rec(1))
+        .await
+        .expect("skip on exhaustion must Ok");
+    assert_eq!(server.request_count(), 3);
+}
+
+// ----------------- 3xx -----------------
+
+#[tokio::test]
+async fn outcome_3xx_default_fails_immediately() {
+    // A webhook receiver shouldn't be redirecting; default policy is
+    // surface it loudly.
+    let server = TestServer::start(Reply::Status(301), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), retry(5), 1000);
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    let err = n.on_record(&rec(1)).await.unwrap_err();
+    assert!(
+        matches!(err, NotifyError::Exhausted { attempts: 1, .. }),
+        "got {err:?}"
+    );
+    assert_eq!(server.request_count(), 1);
+}
+
+// ----------------- timeout -----------------
+
+#[tokio::test]
+async fn outcome_timeout_default_retries_then_fails() {
+    // Server sleeps 200ms; client timeout is 30ms. Every attempt
+    // times out. Default outcome is retry: true, final: fail.
+    let server = TestServer::start(Reply::SlowOk(Duration::from_millis(200)), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), retry(3), 30);
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    let err = n.on_record(&rec(1)).await.unwrap_err();
+    match err {
+        NotifyError::Exhausted { attempts, .. } => assert_eq!(attempts, 3),
+        other => panic!("expected Exhausted, got {other:?}"),
+    }
+    assert_eq!(server.request_count(), 3);
+}
+
+#[tokio::test]
+async fn outcome_timeout_with_no_retry_fails_after_first_attempt() {
+    // "Fail fast on slow receivers instead of waiting through retry"
+    //; the spec-named knob.
+    let outcomes = outcomes_overriding(
+        TargetBucket::Timeout,
+        NotifyOutcome {
+            retry: false,
+            final_: FinalAction::Fail,
+        },
+    );
+    let server = TestServer::start(Reply::SlowOk(Duration::from_millis(200)), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, outcomes, retry(5), 30);
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    let err = n.on_record(&rec(1)).await.unwrap_err();
+    assert!(
+        matches!(err, NotifyError::Exhausted { attempts: 1, .. }),
+        "got {err:?}"
+    );
+    assert_eq!(
+        server.request_count(),
+        1,
+        "must not retry under retry: false"
+    );
+}
+
+// ----------------- connrefused -----------------
+
+#[tokio::test]
+async fn outcome_connrefused_default_retries_then_fails() {
+    use mirror_config::{FanOut, NotifyTarget};
+    // No server bound; 127.0.0.1:1 reliably refuses on Unix.
+    let addr: std::net::SocketAddr = "127.0.0.1:1".parse().unwrap();
+    let mut cfg = notify_pointing_at(addr, NotifyOutcomes::default(), retry(3), 1000);
+    // Sanity: the fan_out / path settings are exercised even though
+    // there's no server here.
+    cfg.targets = vec![NotifyTarget {
+        url: format!("http://{addr}"),
+        path: None,
+        fan_out: FanOut::None,
+    }];
+    let mut n =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    let err = n.on_record(&rec(1)).await.unwrap_err();
+    match err {
+        NotifyError::Exhausted { attempts, .. } => assert_eq!(attempts, 3),
+        other => panic!("expected Exhausted, got {other:?}"),
+    }
+}
diff --git a/crates/mirror-notify-kkv/tests/readiness_suppression.rs b/crates/mirror-notify-kkv/tests/readiness_suppression.rs
new file mode 100644
index 0000000..5c9f28a
--- /dev/null
+++ b/crates/mirror-notify-kkv/tests/readiness_suppression.rs
@@ -0,0 +1,218 @@
+//! Pin the per-mirror suppression-threshold gate for both notify
+//! triggers. `KkvV1Notifier::on_record` and
+//! `FlushDispatcher::on_flushed` must drop events whose source
+//! offset is strictly below the mirror's `suppression_threshold` in
+//! `CacheState`. The threshold is `max(last_committed_offset,
+//! bootstrap_hwm if no commit)`, set at register time. Without this,
+//! a cold restart fans historical-replay updates out to every
+//! consumer pod (fresh deploy) or re-fires updates the previous pod
+//! already delivered (returning deploy).
+
+mod common;
+
+use std::sync::Arc;
+use std::time::Duration;
+
+use common::{notify_pointing_at, Reply, TestServer};
+use mirror_config::{
+    FanOut, Notify, NotifyApi, NotifyOutcomes, NotifyRetry, NotifyTarget, NotifyTrigger, TriggerOn,
+};
+use mirror_core::{CacheState, FlushObserver, Notifier, Record, TimestampType};
+use mirror_notify_kkv::{FlushDispatcher, KkvV1Notifier};
+use serde_json::Value;
+
+fn rec(offset: u64, key: &str) -> Record {
+    Record {
+        topic: "t".into(),
+        partition: 0,
+        source_offset: offset,
+        timestamp_ms: Some(1_700_000_000_000),
+        timestamp_type: TimestampType::CreateTime,
+        key: Some(key.as_bytes().to_vec()),
+        value: Some(b"v".to_vec()),
+        headers: vec![],
+    }
+}
+
+fn fast_retry() -> NotifyRetry {
+    NotifyRetry {
+        max_attempts: 1,
+        backoff_ms: 1,
+    }
+}
+
+#[tokio::test]
+async fn source_consume_suppresses_below_threshold_fresh_deploy() {
+    // Fresh deploy: no committed offset, threshold = bootstrap_hwm.
+    // Mirror "m" has hwm=101. Records 50, 99, 100 (all < 101) are
+    // suppressed; records 101 onward fire.
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), fast_retry(), 1000);
+
+    let cache = Arc::new(CacheState::new());
+    cache.register_mirror("m", 101, None, false);
+    let mut notifier =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, Arc::clone(&cache), "m".into()).unwrap();
+
+    // Below the threshold the dispatcher accepts the call but drops
+    // the record. `apply_record` keeps the cache's per-mirror view
+    // in sync (unrelated to the suppression check).
+    for offset in [50_u64, 99, 100] {
+        let r = rec(offset, &format!("k{offset}"));
+        cache.apply_record("m", &r);
+        notifier.on_record(&r).await.expect("suppressed: Ok(())");
+    }
+    assert_eq!(
+        server.request_count(),
+        0,
+        "no POST may go out for offsets below threshold 101"
+    );
+
+    // Offset 101 == threshold; first record that fires.
+    let r101 = rec(101, "k101");
+    cache.apply_record("m", &r101);
+    notifier
+        .on_record(&r101)
+        .await
+        .expect("at threshold dispatch");
+
+    let r102 = rec(102, "k102");
+    cache.apply_record("m", &r102);
+    notifier
+        .on_record(&r102)
+        .await
+        .expect("above threshold dispatch");
+
+    let captured = server.captured().await;
+    assert_eq!(
+        captured.len(),
+        2,
+        "exactly the two at-or-above-threshold records must POST"
+    );
+    let body0: Value = serde_json::from_slice(&captured[0].body).unwrap();
+    assert_eq!(body0["updates"], serde_json::json!({"k101": null}));
+    assert_eq!(body0["offsets"], serde_json::json!({"0": 101}));
+    let body1: Value = serde_json::from_slice(&captured[1].body).unwrap();
+    assert_eq!(body1["updates"], serde_json::json!({"k102": null}));
+    assert_eq!(body1["offsets"], serde_json::json!({"0": 102}));
+}
+
+#[tokio::test]
+async fn source_consume_suppresses_below_threshold_returning_deploy() {
+    // Returning deploy: committed=5, bootstrap_hwm=20. Threshold = 5.
+    // Records 0..4 suppressed (prior pod delivered them); 5..19 fire
+    // (between-pods gap); 20+ fires (live). This is the dev2-bug fix
+    // — without the committed-offset threshold this test would have
+    // suppressed records 5..19 too, dropping every between-pods
+    // record on the floor.
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), fast_retry(), 1000);
+
+    let cache = Arc::new(CacheState::new());
+    cache.register_mirror("m", 20, Some(5), false);
+    let mut notifier =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, Arc::clone(&cache), "m".into()).unwrap();
+
+    for offset in [0_u64, 1, 4] {
+        let r = rec(offset, &format!("k{offset}"));
+        cache.apply_record("m", &r);
+        notifier.on_record(&r).await.unwrap();
+    }
+    assert_eq!(
+        server.request_count(),
+        0,
+        "offsets below committed 5 must suppress"
+    );
+
+    // The between-pods gap: 5..19. All must fire.
+    for offset in 5..10 {
+        let r = rec(offset, &format!("k{offset}"));
+        cache.apply_record("m", &r);
+        notifier.on_record(&r).await.unwrap();
+    }
+    assert_eq!(
+        server.request_count(),
+        5,
+        "the between-pods gap (5..10) must fire one POST per record"
+    );
+}
+
+fn notify_dest_flush(addr: std::net::SocketAddr) -> Notify {
+    Notify {
+        api: NotifyApi::KkvV1,
+        targets: vec![NotifyTarget {
+            url: format!("http://{addr}"),
+            path: None,
+            fan_out: FanOut::None,
+        }],
+        trigger: NotifyTrigger {
+            on: TriggerOn::DestinationFlush,
+            // destination-flush forbids debounce per validator.
+            debounce: None,
+        },
+        timeout_ms: 1000,
+        retry: fast_retry(),
+        outcomes: NotifyOutcomes::default(),
+    }
+}
+
+async fn wait_for_requests(
+    server: &TestServer,
+    n: usize,
+    timeout: Duration,
+) -> Vec<common::CapturedRequest> {
+    let deadline = std::time::Instant::now() + timeout;
+    loop {
+        let captured = server.captured().await;
+        if captured.len() >= n {
+            return captured;
+        }
+        if std::time::Instant::now() >= deadline {
+            panic!("timed out waiting for {n} requests; got {}", captured.len());
+        }
+        tokio::time::sleep(Duration::from_millis(10)).await;
+    }
+}
+
+#[tokio::test]
+async fn destination_flush_suppresses_below_threshold() {
+    // Same gate, different trigger surface. `on_flushed` is sync;
+    // the drainer is a background task. Flushes whose high-water
+    // offset `to` is below the suppression threshold must never
+    // make it onto the channel; flushes at or above the threshold
+    // POST normally.
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_dest_flush(server.addr);
+
+    let cache = Arc::new(CacheState::new());
+    // Fresh deploy with bootstrap_hwm=101 ⇒ threshold = 101.
+    cache.register_mirror("m", 101, None, false);
+    let dispatcher =
+        FlushDispatcher::from_config(&cfg, "t".into(), 0, Arc::clone(&cache), "m".into())
+            .expect("must build");
+
+    // Two flushes whose `to` < 101 are dropped at the gate; the
+    // channel never sees them, the drainer task stays idle.
+    dispatcher.on_flushed(0, 49);
+    dispatcher.on_flushed(50, 99);
+    // Give the (idle) drainer a moment to prove no POST happens.
+    tokio::time::sleep(Duration::from_millis(50)).await;
+    assert_eq!(
+        server.request_count(),
+        0,
+        "no POST may go out for `to` below threshold 101"
+    );
+
+    // `to`=109 is above the threshold — fires.
+    dispatcher.on_flushed(100, 109);
+
+    let captured = wait_for_requests(&server, 1, Duration::from_secs(2)).await;
+    assert_eq!(
+        captured.len(),
+        1,
+        "only the at-or-above-threshold flush dispatches"
+    );
+    let body: Value = serde_json::from_slice(&captured[0].body).unwrap();
+    assert_eq!(body["offsets"], serde_json::json!({"0": 109}));
+    assert_eq!(body["updates"], serde_json::json!({}));
+}
diff --git a/crates/mirror-notify-kkv/tests/wire_format.rs b/crates/mirror-notify-kkv/tests/wire_format.rs
new file mode 100644
index 0000000..d4e9e02
--- /dev/null
+++ b/crates/mirror-notify-kkv/tests/wire_format.rs
@@ -0,0 +1,178 @@
+//! Pin the kkv-v1 wire contract. The `@yolean/kafka-keyvalue` Node
+//! client parses POSTs to `/kafka-keyvalue/v1/updates` with this exact
+//! shape: header keys, body field names, `null` update values. Drift
+//! here breaks every existing consumer silently.
+
+mod common;
+
+use std::time::Duration;
+
+use common::{notify_pointing_at, ready_cache, Reply, TestServer};
+use mirror_config::{NotifyOutcomes, NotifyRetry};
+use mirror_core::{Notifier, Record, TimestampType};
+use mirror_notify_kkv::{KkvV1Notifier, KKV_V1_DEFAULT_PATH};
+use serde_json::Value;
+
+fn rec(offset: u64, key: &str, value: &str) -> Record {
+    Record {
+        topic: "events".into(),
+        partition: 3,
+        source_offset: offset,
+        timestamp_ms: Some(1_700_000_000_000),
+        timestamp_type: TimestampType::CreateTime,
+        key: Some(key.as_bytes().to_vec()),
+        value: Some(value.as_bytes().to_vec()),
+        headers: vec![],
+    }
+}
+
+fn fast_retry() -> NotifyRetry {
+    NotifyRetry {
+        max_attempts: 1,
+        backoff_ms: 1,
+    }
+}
+
+#[tokio::test]
+async fn posts_to_default_kkv_path_with_canonical_body() {
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), fast_retry(), 1000);
+    let mut notifier =
+        KkvV1Notifier::from_config(&cfg, "events".into(), 3, ready_cache("m"), "m".into()).unwrap();
+
+    notifier
+        .on_record(&rec(42, "user-7", "ignored"))
+        .await
+        .unwrap();
+
+    let captured = server.captured().await;
+    assert_eq!(
+        captured.len(),
+        1,
+        "one record, max_records=1 helper, expect one POST"
+    );
+    let req = &captured[0];
+
+    assert_eq!(
+        req.path, KKV_V1_DEFAULT_PATH,
+        "default path must match the legacy ON_UPDATE_DEFAULT_PATH constant the Node client mounts"
+    );
+
+    let topic_hdr = req.headers.get("x-kkv-topic").expect("missing x-kkv-topic");
+    assert_eq!(topic_hdr.to_str().unwrap(), "events");
+
+    let offsets_hdr = req
+        .headers
+        .get("x-kkv-offsets")
+        .expect("missing x-kkv-offsets");
+    let offsets_hdr_val: Value = serde_json::from_str(offsets_hdr.to_str().unwrap()).unwrap();
+    assert_eq!(offsets_hdr_val, serde_json::json!({"3": 42}));
+
+    let content_type = req.headers.get("content-type").unwrap();
+    assert_eq!(content_type.to_str().unwrap(), "application/json");
+
+    let body: Value = serde_json::from_slice(&req.body).unwrap();
+    assert_eq!(
+        body,
+        serde_json::json!({
+            "v": 1,
+            "topic": "events",
+            "offsets": { "3": 42 },
+            "updates": { "user-7": null }
+        }),
+        "body must match the legacy KafkaKeyValue.js parser shape exactly, \
+         including the `v: 1` protocol-version field that the consumer \
+         enforces with an early throw"
+    );
+}
+
+#[tokio::test]
+async fn null_key_serializes_as_empty_string() {
+    // The Node consumer keys cache invalidations by string; a missing
+    // key turns into "" so it has SOMETHING to call `getValue("")`
+    // with; same as the legacy kkv null handling.
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), fast_retry(), 1000);
+    let mut notifier =
+        KkvV1Notifier::from_config(&cfg, "events".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    let mut record = rec(7, "", "v");
+    record.key = None;
+    notifier.on_record(&record).await.unwrap();
+
+    let body: Value = serde_json::from_slice(&server.captured().await[0].body).unwrap();
+    assert_eq!(body["updates"], serde_json::json!({"": null}));
+}
+
+#[tokio::test]
+async fn respects_explicit_target_path_override() {
+    let server = TestServer::start(Reply::Status(200), vec![]).await;
+    let mut cfg = notify_pointing_at(server.addr, NotifyOutcomes::default(), fast_retry(), 1000);
+    cfg.targets[0].path = Some("/custom/route".into());
+
+    let mut notifier =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+    notifier.on_record(&rec(1, "k", "v")).await.unwrap();
+
+    let captured = server.captured().await;
+    assert_eq!(captured[0].path, "/custom/route");
+}
+
+#[tokio::test]
+async fn timeout_classification_uses_timeout_outcome() {
+    // Server replies after 200ms; client timeout is 50ms; outcomes
+    // table maps `timeout` to `retry: false, final: fail` so the
+    // single attempt errors out immediately.
+    use mirror_config::{FinalAction, NotifyOutcome};
+    let outcomes = NotifyOutcomes {
+        timeout: NotifyOutcome {
+            retry: false,
+            final_: FinalAction::Fail,
+        },
+        ..NotifyOutcomes::default()
+    };
+    let server = TestServer::start(Reply::SlowOk(Duration::from_millis(200)), vec![]).await;
+    let cfg = notify_pointing_at(server.addr, outcomes, fast_retry(), 50);
+    let mut notifier =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    let err = notifier
+        .on_record(&rec(1, "k", "v"))
+        .await
+        .expect_err("timeout outcome with final:fail must surface");
+    let msg = format!("{err}");
+    assert!(
+        msg.to_lowercase().contains("timed out") || msg.to_lowercase().contains("timeout"),
+        "error should mention timeout, got: {msg}"
+    );
+}
+
+#[tokio::test]
+async fn connection_refused_classification_uses_connrefused_outcome() {
+    // Pick a port nothing is listening on. The OS-level refusal must
+    // map to the `connrefused` outcome bucket.
+    use mirror_config::{FinalAction, NotifyOutcome};
+    let outcomes = NotifyOutcomes {
+        connrefused: NotifyOutcome {
+            retry: false,
+            final_: FinalAction::Fail,
+        },
+        ..NotifyOutcomes::default()
+    };
+    // 127.0.0.1:1 is reliably refused on all Unixes (root-only port,
+    // never bound).
+    let addr: std::net::SocketAddr = "127.0.0.1:1".parse().unwrap();
+    let cfg = notify_pointing_at(addr, outcomes, fast_retry(), 1000);
+    let mut notifier =
+        KkvV1Notifier::from_config(&cfg, "t".into(), 0, ready_cache("m"), "m".into()).unwrap();
+
+    let err = notifier
+        .on_record(&rec(1, "k", "v"))
+        .await
+        .expect_err("connrefused outcome with final:fail must surface");
+    let msg = format!("{err}").to_lowercase();
+    assert!(
+        msg.contains("refused") || msg.contains("connect"),
+        "error should mention connection failure, got: {msg}"
+    );
+}
diff --git a/crates/mirror-s3/src/lib.rs b/crates/mirror-s3/src/lib.rs
index 756d869..ac713d1 100644
--- a/crates/mirror-s3/src/lib.rs
+++ b/crates/mirror-s3/src/lib.rs
@@ -102,6 +102,10 @@ pub struct S3Sink {
     view: Option<BTreeMap<String, Record>>,
     next_daily_unix: Option<u64>,
     clock: UnixClock,
+    /// See [`mirror_fs::FilesystemSink::flush_observer`]; same
+    /// contract: stored Arc, default `None`, fired after every
+    /// successful PUT.
+    flush_observer: Option<Arc<dyn mirror_core::FlushObserver>>,
 }
 
 impl S3Sink {
@@ -130,7 +134,7 @@ impl S3Sink {
                 (pos, Some(view))
             }
         };
-        // Cache bootstrap: same shape as mirror-fs — replay durable
+        // Cache bootstrap: same shape as mirror-fs; replay durable
         // state into the shared CacheState. Compaction = read latest
         // snapshot; append + cache = scan + replay every object.
         if let Some(binding) = cfg.cache.as_ref() {
@@ -173,6 +177,7 @@ impl S3Sink {
             view,
             next_daily_unix,
             clock,
+            flush_observer: None,
         })
     }
 
@@ -207,7 +212,7 @@ impl S3Sink {
     /// Append mode: `durable_position + buffer.len()` (contiguous chain).
     /// Compaction:log: `last_buffered.source_offset + 1` (or
     /// `durable_position` when the buffer is empty), so the buffer may
-    /// carry gaps in its source-offset sequence — see mirror-fs.
+    /// carry gaps in its source-offset sequence; see mirror-fs.
     fn buffered_head(&self) -> u64 {
         match self.compaction {
             Some(CompactionMode::Log) => self
@@ -346,6 +351,10 @@ impl S3Sink {
             trigger = trigger.as_str(),
             "flushed batch"
         );
+        // See mirror-fs for the destination-flush observer contract.
+        if let Some(observer) = self.flush_observer.as_ref() {
+            observer.on_flushed(from, to);
+        }
         Ok(())
     }
 }
@@ -478,6 +487,10 @@ impl Sink for S3Sink {
         self.durable_position = low_watermark;
         Ok(())
     }
+
+    fn set_flush_observer(&mut self, observer: Arc<dyn mirror_core::FlushObserver>) {
+        self.flush_observer = Some(observer);
+    }
 }
 
 fn record_byte_size(record: &Record) -> u64 {
diff --git a/crates/mirror-s3/tests/sink_matrix.rs b/crates/mirror-s3/tests/sink_matrix.rs
new file mode 100644
index 0000000..7d18824
--- /dev/null
+++ b/crates/mirror-s3/tests/sink_matrix.rs
@@ -0,0 +1,415 @@
+//! Sink-trait matrix against a real `S3Sink` on
+//! `object_store::memory::InMemory`. Mirrors
+//! `crates/mirror-fs/tests/sink_matrix.rs` cell-for-cell so the two
+//! sinks' contracts stay symmetric.
+//!
+//! Diverges from the FS matrix only where the backend semantics
+//! genuinely differ:
+//!   - **No file path on disk**; the produced-object-name assertion
+//!     reads the InMemory store's object list instead of `read_dir`.
+//!   - **Async open**; `S3Sink::open` is async; the rest of the
+//!     trait surface is identical.
+
+use std::sync::Arc;
+use std::time::Duration;
+
+use futures::StreamExt;
+use mirror_core::{Record, Sink, SinkError, TimestampType};
+use mirror_envelope::{ColumnType, Format, ParquetCompression};
+use mirror_s3::{CompactionMode, FlushTriggers, S3Sink, S3SinkConfig};
+use object_store::memory::InMemory;
+use object_store::path::Path;
+use object_store::ObjectStore;
+
+fn rec(offset: u64) -> Record {
+    Record {
+        topic: "sink-matrix".into(),
+        partition: 0,
+        source_offset: offset,
+        timestamp_ms: Some(1_700_000_000_000 + offset as i64),
+        timestamp_type: TimestampType::CreateTime,
+        key: Some(format!("k{}", offset % 4).into_bytes()),
+        value: Some(format!("v{offset}").into_bytes()),
+        headers: vec![],
+    }
+}
+
+fn cfg(store: Arc<dyn ObjectStore>, compaction: Option<CompactionMode>) -> S3SinkConfig {
+    let format = match compaction {
+        Some(CompactionMode::Log) => Format::Parquet,
+        None => Format::Ndjson,
+    };
+    S3SinkConfig {
+        store,
+        prefix: Some(Path::from("archive")),
+        destination_name: "ops".into(),
+        partition: 0,
+        format,
+        compression: ParquetCompression::Zstd1,
+        keys: ColumnType::Utf8,
+        values: ColumnType::Utf8,
+        compaction,
+        cache: None,
+        flush: FlushTriggers {
+            max_time: Duration::from_secs(3600),
+            max_bytes: u64::MAX,
+            max_offsets: u64::MAX,
+            daily_at_utc_seconds: None,
+        },
+    }
+}
+
+#[derive(Debug, Clone, Copy)]
+enum Mode {
+    Append,
+    Log,
+}
+
+impl Mode {
+    fn to_compaction(self) -> Option<CompactionMode> {
+        match self {
+            Mode::Append => None,
+            Mode::Log => Some(CompactionMode::Log),
+        }
+    }
+}
+
+#[derive(Debug, Clone, Copy)]
+enum BufferState {
+    Empty,
+    NonEmpty,
+}
+
+#[derive(Debug)]
+enum Action {
+    Write(u64),
+    Flush {
+        expected_from: u64,
+        expected_to: u64,
+    },
+    Align {
+        low_watermark: u64,
+    },
+    NextExpected,
+}
+
+#[derive(Debug)]
+enum Outcome {
+    Ok,
+    NextExpectedIs(u64),
+    UnexpectedPosition { expected: u64, actual: u64 },
+    TransportContains(&'static str),
+}
+
+struct Case {
+    name: &'static str,
+    mode: Mode,
+    preload: &'static [u64],
+    buffer_state: BufferState,
+    action: Action,
+    expected: Outcome,
+}
+
+async fn run_case(case: &Case) {
+    let store: Arc<dyn ObjectStore> = Arc::new(InMemory::new());
+    let mut sink = S3Sink::open(cfg(Arc::clone(&store), case.mode.to_compaction()))
+        .await
+        .expect("open S3Sink");
+
+    for &offset in case.preload {
+        sink.write(rec(offset))
+            .await
+            .unwrap_or_else(|e| panic!("[{}] preload write({offset}) failed: {e}", case.name));
+    }
+    if matches!(case.buffer_state, BufferState::Empty) && !case.preload.is_empty() {
+        sink.flush_now()
+            .await
+            .unwrap_or_else(|e| panic!("[{}] preload flush failed: {e}", case.name));
+    }
+
+    let observed = match &case.action {
+        Action::Write(offset) => sink.write(rec(*offset)).await.map(|()| None),
+        Action::Flush { .. } => sink.flush_now().await.map(|()| None),
+        Action::Align { low_watermark } => sink
+            .align_to_source_low_watermark(*low_watermark)
+            .await
+            .map(|()| None),
+        Action::NextExpected => sink.next_expected_offset().await.map(Some),
+    };
+
+    // Filename check happens out-of-band: it needs an async listing
+    // call on the store, which can't easily be threaded through the
+    // synchronous `.map` chain above.
+    if let Action::Flush {
+        expected_from,
+        expected_to,
+    } = &case.action
+    {
+        if observed.is_ok() {
+            let prefix = Path::from("archive/ops/0");
+            let mut stream = store.list(Some(&prefix));
+            let mut names: Vec<String> = Vec::new();
+            while let Some(meta) = stream.next().await {
+                if let Some(name) = meta.expect("list entry").location.filename() {
+                    names.push(name.to_string());
+                }
+            }
+            names.sort();
+            let last = names
+                .last()
+                .unwrap_or_else(|| panic!("[{}] no flushed object found", case.name));
+            let ext = if matches!(case.mode, Mode::Log) {
+                "parquet"
+            } else {
+                "ndjson"
+            };
+            let expected_name = format!("{expected_from:020}-{expected_to:020}.{ext}");
+            assert_eq!(
+                last, &expected_name,
+                "[{}] flushed object name should encode (from={expected_from}, to={expected_to})",
+                case.name
+            );
+        }
+    }
+
+    match (&case.expected, observed) {
+        (Outcome::Ok, Ok(_)) => {}
+        (Outcome::NextExpectedIs(expected), Ok(Some(value))) => {
+            assert_eq!(
+                value, *expected,
+                "[{}] next_expected_offset value",
+                case.name
+            );
+        }
+        (
+            Outcome::UnexpectedPosition {
+                expected: exp,
+                actual: act,
+            },
+            Err(SinkError::UnexpectedPosition { expected, actual }),
+        ) => {
+            assert_eq!(
+                (expected, actual),
+                (*exp, *act),
+                "[{}] UnexpectedPosition payload",
+                case.name
+            );
+        }
+        (Outcome::TransportContains(needle), Err(SinkError::Transport(msg))) => {
+            assert!(
+                msg.contains(needle),
+                "[{}] Transport({msg:?}) should contain {needle:?}",
+                case.name
+            );
+        }
+        (expected, observed) => {
+            panic!(
+                "[{}] mismatch: expected={expected:?} observed={observed:?}",
+                case.name
+            );
+        }
+    }
+}
+
+#[tokio::test]
+async fn matrix() {
+    for case in &matrix_cases() {
+        run_case(case).await;
+    }
+}
+
+fn matrix_cases() -> Vec<Case> {
+    vec![
+        // ============================================================
+        //  APPEND MODE
+        // ============================================================
+        Case {
+            name: "append/empty/write_at_expected/ok",
+            mode: Mode::Append,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Write(0),
+            expected: Outcome::Ok,
+        },
+        Case {
+            name: "append/empty/write_above_expected/rejects",
+            mode: Mode::Append,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Write(5),
+            expected: Outcome::UnexpectedPosition {
+                expected: 0,
+                actual: 5,
+            },
+        },
+        Case {
+            name: "append/empty_after_flush/write_below_durable/rejects",
+            mode: Mode::Append,
+            preload: &[0, 1, 2, 3, 4],
+            buffer_state: BufferState::Empty,
+            action: Action::Write(3),
+            expected: Outcome::UnexpectedPosition {
+                expected: 5,
+                actual: 3,
+            },
+        },
+        Case {
+            name: "append/non_empty/write_at_expected/ok",
+            mode: Mode::Append,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(3),
+            expected: Outcome::Ok,
+        },
+        Case {
+            name: "append/non_empty/write_above_expected/rejects",
+            mode: Mode::Append,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(7),
+            expected: Outcome::UnexpectedPosition {
+                expected: 3,
+                actual: 7,
+            },
+        },
+        Case {
+            name: "append/non_empty/write_below_buffered_head/rejects",
+            mode: Mode::Append,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(1),
+            expected: Outcome::UnexpectedPosition {
+                expected: 3,
+                actual: 1,
+            },
+        },
+        // ============================================================
+        //  COMPACTION:LOG
+        // ============================================================
+        Case {
+            name: "log/empty/write_at_expected/ok",
+            mode: Mode::Log,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Write(0),
+            expected: Outcome::Ok,
+        },
+        Case {
+            name: "log/empty/write_above_expected/ok_bootstrap_gap",
+            mode: Mode::Log,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Write(461),
+            expected: Outcome::Ok,
+        },
+        Case {
+            name: "log/empty_after_flush/write_below_durable/rejects",
+            mode: Mode::Log,
+            preload: &[0, 1, 2, 3, 4],
+            buffer_state: BufferState::Empty,
+            action: Action::Write(3),
+            expected: Outcome::UnexpectedPosition {
+                expected: 5,
+                actual: 3,
+            },
+        },
+        Case {
+            name: "log/non_empty/write_at_expected/ok",
+            mode: Mode::Log,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(3),
+            expected: Outcome::Ok,
+        },
+        Case {
+            name: "log/non_empty/write_above_expected/ok_midstream_gap",
+            mode: Mode::Log,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(7),
+            expected: Outcome::Ok,
+        },
+        Case {
+            name: "log/non_empty/write_below_buffered_head/rejects",
+            mode: Mode::Log,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Write(1),
+            expected: Outcome::UnexpectedPosition {
+                expected: 3,
+                actual: 1,
+            },
+        },
+        // ============================================================
+        //  ALIGN
+        // ============================================================
+        Case {
+            name: "log/empty/align/ok",
+            mode: Mode::Log,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Align { low_watermark: 461 },
+            expected: Outcome::Ok,
+        },
+        Case {
+            name: "log/non_empty/align/rejects_with_empty_buffer_precondition",
+            mode: Mode::Log,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Align { low_watermark: 461 },
+            expected: Outcome::TransportContains("inconsistent state"),
+        },
+        Case {
+            name: "append/empty/align/rejects_on_non_compaction_sink",
+            mode: Mode::Append,
+            preload: &[],
+            buffer_state: BufferState::Empty,
+            action: Action::Align { low_watermark: 461 },
+            expected: Outcome::TransportContains("non-compaction sink"),
+        },
+        // ============================================================
+        //  FLUSH
+        // ============================================================
+        Case {
+            name: "append/non_empty/flush/contiguous_object_name",
+            mode: Mode::Append,
+            preload: &[0, 1, 2, 3, 4],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Flush {
+                expected_from: 0,
+                expected_to: 4,
+            },
+            expected: Outcome::Ok,
+        },
+        Case {
+            name: "log/non_empty_with_gaps/flush/uses_max_offset_for_to",
+            mode: Mode::Log,
+            preload: &[0, 461, 466],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::Flush {
+                expected_from: 0,
+                expected_to: 466,
+            },
+            expected: Outcome::Ok,
+        },
+        // ============================================================
+        //  NEXT_EXPECTED_OFFSET
+        // ============================================================
+        Case {
+            name: "append/non_empty/next_expected/durable_plus_len",
+            mode: Mode::Append,
+            preload: &[0, 1, 2],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::NextExpected,
+            expected: Outcome::NextExpectedIs(3),
+        },
+        Case {
+            name: "log/non_empty_with_gaps/next_expected/last_buffered_plus_one",
+            mode: Mode::Log,
+            preload: &[0, 461, 466],
+            buffer_state: BufferState::NonEmpty,
+            action: Action::NextExpected,
+            expected: Outcome::NextExpectedIs(467),
+        },
+    ]
+}
diff --git a/e2e/Cargo.toml b/e2e/Cargo.toml
index 201067b..2a8b073 100644
--- a/e2e/Cargo.toml
+++ b/e2e/Cargo.toml
@@ -15,6 +15,9 @@ mirror-kafka = { workspace = true }
 mirror-envelope = { workspace = true }
 mirror-fs = { workspace = true }
 mirror-s3 = { workspace = true }
+mirror-config = { workspace = true }
+mirror-notify-kkv = { workspace = true }
+axum = { workspace = true }
 async-trait = { workspace = true }
 anyhow = { workspace = true }
 testcontainers = { workspace = true }
@@ -24,6 +27,7 @@ tracing-subscriber = { workspace = true }
 rdkafka = { workspace = true }
 portpicker = { workspace = true }
 tempfile = { workspace = true }
+uuid = { workspace = true }
 object_store = { workspace = true }
 futures = { workspace = true }
 bytes = { workspace = true }
diff --git a/e2e/src/lib.rs b/e2e/src/lib.rs
index b7b94fa..19ade2c 100644
--- a/e2e/src/lib.rs
+++ b/e2e/src/lib.rs
@@ -8,8 +8,8 @@
 //! wants new ways to provision an environment (different runners,
 //! different fault-injectors) added without rewriting the tests.
 //!
-//! The two trait seams below — [`Provisioner`] and
-//! [`ProvisionedStack`] — are that pluggable surface. The first impl
+//! The two trait seams below ([`Provisioner`] and
+//! [`ProvisionedStack`]) are that pluggable surface. The first impl
 //! is [`docker::DockerProvisioner`]; future impls (kind, real cloud)
 //! drop in next to it without touching the test files in
 //! `e2e/tests/`.
@@ -18,6 +18,7 @@ pub mod docker;
 pub mod fault;
 pub mod kafka_helpers;
 pub mod mirror_runner;
+pub mod webhook_receiver;
 
 use async_trait::async_trait;
 
@@ -42,7 +43,7 @@ pub trait ProvisionedStack: Send + Sync {
         None
     }
 
-    /// S3 endpoint URL for S3-sink stacks (Phase 4). `None` otherwise.
+    /// S3 endpoint URL for S3-sink stacks. `None` otherwise.
     fn target_s3_endpoint(&self) -> Option<String> {
         None
     }
diff --git a/e2e/src/mirror_runner.rs b/e2e/src/mirror_runner.rs
index ca3c35b..4db9d07 100644
--- a/e2e/src/mirror_runner.rs
+++ b/e2e/src/mirror_runner.rs
@@ -7,7 +7,7 @@ use std::path::PathBuf;
 use std::sync::Arc;
 
 use anyhow::{Context, Result};
-use mirror_core::{run_mirror, MirrorError, TeeSink};
+use mirror_core::{run_mirror, run_mirror_with_notifier, MirrorError, NoOpNotifier, Sink, TeeSink};
 use mirror_fs::{FilesystemSink, FilesystemSinkConfig};
 use mirror_kafka::{KafkaSink, KafkaSinkConfig, KafkaSource, KafkaSourceConfig};
 use mirror_s3::{S3Sink, S3SinkConfig};
@@ -39,7 +39,7 @@ impl MirrorHandle {
     /// Await the task without requesting shutdown. Used by adversarial
     /// tests that expect the mirror to terminate on its own because
     /// of an error (e.g. destination drift detection). Returns
-    /// `Ok(())` only if the mirror exits gracefully — a non-cancelled
+    /// `Ok(())` only if the mirror exits gracefully; a non-cancelled
     /// `Err` is propagated and a cancellation is reported.
     pub async fn wait_for_termination(self) -> Result<()> {
         match self.handle.await {
@@ -356,3 +356,108 @@ pub async fn spawn_kafka_to_s3(spec: S3MirrorSpec) -> Result<MirrorHandle> {
     });
     Ok(MirrorHandle { handle, shutdown })
 }
+
+/// Spawn a kafka → filesystem mirror with a `notify` block attached.
+/// Mirrors `mirror-bin`'s `spawn_mirror` wiring: source-consume
+/// builds a `KkvV1Notifier`; destination-flush builds a
+/// `FlushDispatcher` and attaches it to the TeeSink as a flush
+/// observer.
+pub async fn spawn_kafka_to_fs_with_notify(
+    spec: FsMirrorSpec,
+    notify: mirror_config::Notify,
+) -> Result<MirrorHandle> {
+    let src_cfg = {
+        let mut c = KafkaSourceConfig::new(
+            spec.source_bootstrap,
+            spec.group_id,
+            spec.source_topic.clone(),
+            spec.partition,
+        );
+        c.poll_timeout = Duration::from_millis(500);
+        c
+    };
+    let source = KafkaSource::open(src_cfg).context("open KafkaSource")?;
+    let dest_name = spec.destination_name.clone();
+    let topic = spec.source_topic.clone();
+    let partition = spec.partition;
+    let mirror_name = dest_name.clone();
+    // `KkvV1Notifier::from_config` and `FlushDispatcher::from_config`
+    // need a `CacheState` so the per-mirror suppression gate can read
+    // `is_mirror_ready`. If the caller didn't pass one we build a
+    // fresh state and register this mirror at `bootstrap_hwm = 0` so
+    // the slot is immediately ready — the test scenarios that opt
+    // out of cache binding don't care about suppression timing.
+    let (cache_state, cache_for_tee) = match spec.cache.clone() {
+        Some(binding) => (Arc::clone(&binding.state), Some(binding)),
+        None => {
+            let state = Arc::new(mirror_core::CacheState::new());
+            state.register_mirror(&mirror_name, 0, None, false);
+            (state, None)
+        }
+    };
+    let cache_for_bootstrap = spec.cache.clone();
+    let sink_cfg = FilesystemSinkConfig {
+        root: spec.root,
+        destination_name: spec.destination_name,
+        partition: spec.partition as u32,
+        format: spec.format,
+        compression: spec.compression,
+        keys: spec.keys,
+        values: spec.values,
+        compaction: spec.compaction,
+        cache: cache_for_bootstrap,
+        flush: spec.flush,
+    };
+    let sink = FilesystemSink::open(sink_cfg).context("open FilesystemSink")?;
+    let trigger_mode = notify.trigger.on;
+    let (shutdown, signal) = shutdown_pair();
+    let handle = tokio::spawn(async move {
+        let mut tee = TeeSink::open(
+            vec![(dest_name, Box::new(sink) as Box<dyn Sink>)],
+            cache_for_tee,
+        )
+        .await
+        .map_err(MirrorError::Sink)?;
+
+        match trigger_mode {
+            mirror_config::TriggerOn::SourceConsume => {
+                let notifier = mirror_notify_kkv::KkvV1Notifier::from_config(
+                    &notify,
+                    topic,
+                    partition,
+                    cache_state,
+                    mirror_name,
+                )
+                .map_err(|e| MirrorError::Sink(mirror_core::SinkError::Transport(e.to_string())))?;
+                run_mirror_with_notifier(
+                    source,
+                    tee,
+                    notifier,
+                    signal,
+                    mirror_core::DEFAULT_HEARTBEAT_INTERVAL,
+                )
+                .await
+            }
+            mirror_config::TriggerOn::DestinationFlush => {
+                let dispatcher = mirror_notify_kkv::FlushDispatcher::from_config(
+                    &notify,
+                    topic,
+                    partition,
+                    cache_state,
+                    mirror_name,
+                )
+                .map_err(|e| MirrorError::Sink(mirror_core::SinkError::Transport(e.to_string())))?;
+                tee.set_flush_observer(std::sync::Arc::new(dispatcher));
+                run_mirror_with_notifier(
+                    source,
+                    tee,
+                    NoOpNotifier,
+                    signal,
+                    mirror_core::DEFAULT_HEARTBEAT_INTERVAL,
+                )
+                .await
+            }
+        }
+    });
+    Ok(MirrorHandle { handle, shutdown })
+}
diff --git a/e2e/src/webhook_receiver.rs b/e2e/src/webhook_receiver.rs
new file mode 100644
index 0000000..8f76c10
--- /dev/null
+++ b/e2e/src/webhook_receiver.rs
@@ -0,0 +1,134 @@
+//! In-process axum webhook receiver used by the notify e2e tests.
+//!
+//! Stands up an HTTP server on `127.0.0.1:0` that records every
+//! `POST /kafka-keyvalue/v1/updates` (and any other path) into a
+//! shared state vector. Tests build a `notify` config pointing at
+//! the server, run a real mirror against a real Kafka, and assert
+//! on the captured POSTs.
+//!
+//! This is the e2e counterpart of `mirror-notify-kkv`'s in-crate
+//! `tests/common/mod.rs` axum harness; lifted out here so the e2e
+//! tests can share it without depending on the notify crate's
+//! test-only modules.
+
+use std::net::SocketAddr;
+use std::sync::atomic::{AtomicUsize, Ordering};
+use std::sync::Arc;
+use std::time::Duration;
+
+use axum::body::Bytes;
+use axum::extract::{Request, State};
+use axum::http::{HeaderMap, StatusCode};
+use axum::routing::post;
+use axum::Router;
+use tokio::sync::Mutex;
+
+/// One captured POST: path, headers, body bytes.
+#[derive(Debug, Clone)]
+pub struct CapturedRequest {
+    pub path: String,
+    pub headers: HeaderMap,
+    pub body: Bytes,
+}
+
+#[derive(Default)]
+struct State_ {
+    captured: Mutex<Vec<CapturedRequest>>,
+    /// Number of times the handler was invoked (incremented BEFORE
+    /// the request is captured, so tests can poll for "at least N
+    /// requests have hit me" without taking the captured-vec lock).
+    count: AtomicUsize,
+    /// HTTP status to return for every request. Default 200.
+    reply_status: Mutex<StatusCode>,
+}
+
+pub struct WebhookReceiver {
+    pub addr: SocketAddr,
+    state: Arc<State_>,
+    _shutdown_tx: tokio::sync::oneshot::Sender<()>,
+    _handle: tokio::task::JoinHandle<()>,
+}
+
+impl WebhookReceiver {
+    /// Bind a new receiver on `127.0.0.1:0`. The returned address is
+    /// safe to plug straight into a `notify.targets[].url`.
+    pub async fn start() -> Self {
+        let state = Arc::new(State_ {
+            reply_status: Mutex::new(StatusCode::OK),
+            ..Default::default()
+        });
+        let router = Router::new()
+            .route("/{*path}", post(handle))
+            .route("/", post(handle))
+            .with_state(Arc::clone(&state));
+        let listener = tokio::net::TcpListener::bind("127.0.0.1:0").await.unwrap();
+        let addr = listener.local_addr().unwrap();
+        let (shutdown_tx, shutdown_rx) = tokio::sync::oneshot::channel::<()>();
+        let handle = tokio::spawn(async move {
+            let _ = axum::serve(listener, router)
+                .with_graceful_shutdown(async move {
+                    let _ = shutdown_rx.await;
+                })
+                .await;
+        });
+        Self {
+            addr,
+            state,
+            _shutdown_tx: shutdown_tx,
+            _handle: handle,
+        }
+    }
+
+    pub async fn captured(&self) -> Vec<CapturedRequest> {
+        self.state.captured.lock().await.clone()
+    }
+
+    pub fn request_count(&self) -> usize {
+        self.state.count.load(Ordering::SeqCst)
+    }
+
+    /// Wait until the receiver has captured at least `n` requests, or
+    /// `timeout` elapses. Returns the captured set.
+    pub async fn wait_for(&self, n: usize, timeout: Duration) -> Vec<CapturedRequest> {
+        let deadline = std::time::Instant::now() + timeout;
+        loop {
+            if self.request_count() >= n {
+                return self.captured().await;
+            }
+            if std::time::Instant::now() >= deadline {
+                let captured = self.captured().await;
+                panic!(
+                    "webhook receiver: timed out waiting for {n} POSTs (got {})",
+                    captured.len()
+                );
+            }
+            tokio::time::sleep(Duration::from_millis(20)).await;
+        }
+    }
+
+    /// Make subsequent requests return this status. Useful for
+    /// retry / outage-style tests.
+    pub async fn set_reply_status(&self, status: u16) {
+        let mut s = self.state.reply_status.lock().await;
+        *s = StatusCode::from_u16(status).unwrap_or(StatusCode::INTERNAL_SERVER_ERROR);
+    }
+}
+
+async fn handle(
+    State(state): State<Arc<State_>>,
+    headers: HeaderMap,
+    request: Request,
+) -> (StatusCode, &'static str) {
+    state.count.fetch_add(1, Ordering::SeqCst);
+    let path = request.uri().path().to_string();
+    let body = axum::body::to_bytes(request.into_body(), 1024 * 1024)
+        .await
+        .unwrap_or_default();
+    state.captured.lock().await.push(CapturedRequest {
+        path,
+        headers,
+        body,
+    });
+    let status = *state.reply_status.lock().await;
+    (status, "")
+}
diff --git a/e2e/tests/cache_v1.rs b/e2e/tests/cache_v1.rs
index 4b8b3cf..e77c218 100644
--- a/e2e/tests/cache_v1.rs
+++ b/e2e/tests/cache_v1.rs
@@ -103,7 +103,7 @@ async fn cache_v1_serves_latest_per_key_and_honours_tombstones() {
     // Build CacheState and register the mirror against the captured
     // watermark.
     let cache_state = Arc::new(CacheState::new());
-    cache_state.register_mirror("cache-mirror", bootstrap_hwm);
+    cache_state.register_mirror("cache-mirror", bootstrap_hwm, None, true);
     let binding = mirror_fs::CacheBinding {
         state: Arc::clone(&cache_state),
         mirror_name: "cache-mirror".into(),
@@ -259,7 +259,14 @@ async fn cache_v1_serves_latest_per_key_and_honours_tombstones() {
     assert_eq!(resp.status(), reqwest::StatusCode::OK);
     let spec: serde_json::Value = resp.json().await.unwrap();
     assert_eq!(spec["openapi"], "3.1.0");
-    assert!(spec["paths"]["/cache/v1/raw/{key}"].is_object());
+    // The static OpenAPI documents only the per-mirror paths; the
+    // unprefixed `cache-v1-main` aliases are config-conditional and
+    // intentionally omitted from the spec.
+    assert!(spec["paths"]["/cache/v1/{mirror}/raw/{key}"].is_object());
+    assert!(
+        spec["paths"]["/cache/v1/raw/{key}"].is_null(),
+        "unprefixed cache-v1-main aliases must stay off the static spec"
+    );
 
     mirror.abort();
     let _ = server_shutdown_tx.send(());
diff --git a/e2e/tests/cache_v1_compat.rs b/e2e/tests/cache_v1_compat.rs
index 345f9e9..b736c5e 100644
--- a/e2e/tests/cache_v1_compat.rs
+++ b/e2e/tests/cache_v1_compat.rs
@@ -138,7 +138,7 @@ async fn compare_kkv_and_mirror_v3_cache_v1() {
     // Spin up mirror-v3 in-process. Append mode with cache-v1.
     let root = tempfile::tempdir().expect("tempdir");
     let cache_state = Arc::new(CacheState::new());
-    cache_state.register_mirror("compat", bootstrap_hwm);
+    cache_state.register_mirror("compat", bootstrap_hwm, None, true);
     let mirror_addr = {
         let port = portpicker::pick_unused_port().expect("port");
         std::net::SocketAddr::from(([127, 0, 0, 1], port))
diff --git a/e2e/tests/kafka_source_commit_offsets.rs b/e2e/tests/kafka_source_commit_offsets.rs
new file mode 100644
index 0000000..8fa5966
--- /dev/null
+++ b/e2e/tests/kafka_source_commit_offsets.rs
@@ -0,0 +1,130 @@
+//! Round-trip the new `Source::commit_through` /
+//! `fetch_committed_offset` + `KafkaCommitHandle::commit_pending`
+//! against a real Kafka broker. Pins:
+//!   * a fresh group reports `None`,
+//!   * `commit_through` + `commit_pending` then a re-open with the
+//!     same group reports the previously-staged value,
+//!   * the monotonic guard ignores a regressing `commit_through`.
+
+use std::time::Duration;
+
+use mirror_core::Source;
+use mirror_e2e::docker::DockerProvisioner;
+use mirror_e2e::kafka_helpers::{create_topic, produce_records};
+use mirror_e2e::{ProvisionedStack, Provisioner};
+use mirror_kafka::{KafkaSource, KafkaSourceConfig};
+
+const TOPIC: &str = "mirror-e2e-commit-offsets";
+
+fn fresh_group(suffix: &str) -> String {
+    // Each test in this file uses a fresh group id so the previous
+    // test's commits don't leak. `uuid` is already a workspace dep
+    // (used by mirror-fs).
+    format!("mirror-e2e-commit-{suffix}-{}", uuid::Uuid::new_v4())
+}
+
+async fn poll_for_committed(bootstrap: &str, group: &str, timeout: Duration) -> Option<u64> {
+    let deadline = std::time::Instant::now() + timeout;
+    loop {
+        let cfg = KafkaSourceConfig::new(bootstrap.to_string(), group.to_string(), TOPIC, 0);
+        let mut s = KafkaSource::open(cfg).expect("re-open");
+        if let Ok(Some(off)) = s.fetch_committed_offset().await {
+            return Some(off);
+        }
+        if std::time::Instant::now() >= deadline {
+            return None;
+        }
+        tokio::time::sleep(Duration::from_millis(100)).await;
+    }
+}
+
+#[tokio::test(flavor = "multi_thread", worker_threads = 4)]
+async fn fresh_group_has_no_committed_offset() {
+    let stack = DockerProvisioner.provision().await.expect("provision");
+    let bootstrap = stack.source_bootstrap();
+    create_topic(&bootstrap, TOPIC, 1).await.expect("topic");
+    let group = fresh_group("fresh");
+    let mut source = KafkaSource::open(KafkaSourceConfig::new(bootstrap.clone(), group, TOPIC, 0))
+        .expect("open");
+    let got = source.fetch_committed_offset().await.expect("fetch");
+    assert_eq!(got, None, "fresh group must report None");
+}
+
+#[tokio::test(flavor = "multi_thread", worker_threads = 4)]
+async fn commit_through_then_commit_pending_round_trips() {
+    let stack = DockerProvisioner.provision().await.expect("provision");
+    let bootstrap = stack.source_bootstrap();
+    create_topic(&bootstrap, TOPIC, 1).await.expect("topic");
+    // The broker needs at least one record so the committed offset
+    // we stage is a valid one to read back.
+    let pairs: Vec<(String, String)> = (0..3).map(|i| (format!("k{i}"), format!("v{i}"))).collect();
+    produce_records(&bootstrap, TOPIC, 0, &pairs)
+        .await
+        .expect("produce");
+
+    let group = fresh_group("rt");
+    {
+        let mut source = KafkaSource::open(KafkaSourceConfig::new(
+            bootstrap.clone(),
+            group.clone(),
+            TOPIC,
+            0,
+        ))
+        .expect("open");
+        // `store_offsets` requires the partition to be in the
+        // consumer's assigned set; in production the run loop's
+        // `seek` establishes that before the supervisor's periodic
+        // commit task fires. Mirror it here.
+        source.seek(0).await.expect("seek");
+        // Trait method stages; handle flushes. This mirrors the
+        // supervisor's periodic-task wiring landing in a later
+        // commit.
+        source.commit_through(2).await.expect("commit_through");
+        let handle = source.commit_handle();
+        handle.commit_pending().expect("commit_pending");
+    }
+    // `commit_consumer_state(Async)` returns immediately; poll a
+    // fresh re-open until the broker has acknowledged the write.
+    let observed = poll_for_committed(&bootstrap, &group, Duration::from_secs(10)).await;
+    assert_eq!(
+        observed,
+        Some(2),
+        "round-trip must observe the staged offset"
+    );
+}
+
+#[tokio::test(flavor = "multi_thread", worker_threads = 4)]
+async fn commit_through_is_monotonic() {
+    let stack = DockerProvisioner.provision().await.expect("provision");
+    let bootstrap = stack.source_bootstrap();
+    create_topic(&bootstrap, TOPIC, 1).await.expect("topic");
+    let pairs: Vec<(String, String)> = (0..5).map(|i| (format!("k{i}"), format!("v{i}"))).collect();
+    produce_records(&bootstrap, TOPIC, 0, &pairs)
+        .await
+        .expect("produce");
+
+    let group = fresh_group("mono");
+    let mut source = KafkaSource::open(KafkaSourceConfig::new(
+        bootstrap.clone(),
+        group.clone(),
+        TOPIC,
+        0,
+    ))
+    .expect("open");
+    source.seek(0).await.expect("seek");
+    source.commit_through(4).await.expect("first stage");
+    // Regress; the guard must drop this silently. No error, no
+    // overwrite of the broker's committed value.
+    source.commit_through(1).await.expect("regress is no-op");
+    source
+        .commit_handle()
+        .commit_pending()
+        .expect("commit_pending");
+
+    let observed = poll_for_committed(&bootstrap, &group, Duration::from_secs(10)).await;
+    assert_eq!(
+        observed,
+        Some(4),
+        "regression must be ignored; broker keeps the higher value"
+    );
+}
diff --git a/e2e/tests/known_coverage_gaps.rs b/e2e/tests/known_coverage_gaps.rs
new file mode 100644
index 0000000..477baa3
--- /dev/null
+++ b/e2e/tests/known_coverage_gaps.rs
@@ -0,0 +1,177 @@
+//! Discoverable contracts for test coverage we know we owe but
+//! don't currently have. Each `#[ignore = "TODO: ..."]` test names
+//! the gap, the rationale, and a pointer to the strategy document.
+//!
+//! Why this file exists
+//! --------------------
+//!
+//! Several recent commits in this repo end up with a "the existing
+//! e2e doesn't catch this" or "the test was passing for the wrong
+//! reason" paragraph in their messages; useful prose, but it sits
+//! in `git log` rather than the test suite. The reviewer's smaller
+//! observation §1 in `REVIEW_TEST_STRATEGY.md` calls this out and
+//! asks us to convert each known gap into a `cargo test --list`-able
+//! contract. That's what this file is.
+//!
+//! Each test:
+//!   - is `#[ignore = "TODO: ..."]` with the strategy-doc section
+//!     it tracks,
+//!   - documents in its body what shape the eventual implementation
+//!     should take,
+//!   - uses `unimplemented!()` so it doesn't accidentally run if
+//!     `cargo test -- --include-ignored` is added to CI before the
+//!     body is written.
+//!
+//! Removing the `#[ignore]` once the test is implemented is the
+//! contract closure. `cargo test --list -p mirror-e2e | grep ignored`
+//! is the discovery surface for what's left.
+
+#![allow(unreachable_code, clippy::diverging_sub_expression)]
+
+#[tokio::test]
+#[ignore = "TODO: REVIEW_TEST_STRATEGY.md §3; needs real-broker compaction (not delete-records)"]
+async fn kafka_source_low_watermark_after_pure_compaction_only() {
+    //! Broker contract: a topic with `cleanup.policy=compact` (and
+    //! *not* `compact,delete`) keeps `LogStartOffset = 0` after
+    //! compaction has deduplicated keys; the segment start hasn't
+    //! moved. From a consumer's point of view, `fetch_watermarks`
+    //! returns `(0, high)` but `seek(0)` produces a record at some
+    //! offset > 0 because the earlier records were dropped by
+    //! upstream dedup.
+    //!
+    //! The existing `e2e/tests/compacted_source_with_compaction_log.rs`
+    //! claims to cover this case but is using `delete-records` as a
+    //! stand-in; that advances `LogStartOffset` and so doesn't
+    //! reproduce the contract this test would assert.
+    //!
+    //! Implementation sketch:
+    //!   1. Provision Redpanda (or Apache Kafka) with the topic
+    //!      created `cleanup.policy=compact` only, `retention.ms=-1`,
+    //!      `min.cleanable.dirty.ratio` = very low (e.g. 0.01),
+    //!      `segment.ms` small enough to force segment rolls.
+    //!   2. Produce N records over a small key-space (e.g. 1000
+    //!      records over 50 keys, looping).
+    //!   3. Force a segment roll (e.g. `rpk topic alter-config
+    //!      segment.ms=1`, wait, restore).
+    //!   4. Poll until the log cleaner runs and the segment on disk
+    //!      is smaller than the original record count.
+    //!   5. Call `KafkaSource::low_watermark()`; assert it returns
+    //!      `0` (the contract this test exists to pin).
+    //!   6. Call `consumer.seek(0)` + poll one; assert the first
+    //!      delivered offset is > 0 (the gap the mirror has to
+    //!      tolerate under `compaction:log`).
+    //!
+    //! Pairs with `kafka_source_low_watermark_contract.rs`, which
+    //! covers the *post-delete-records* case (low watermark advances,
+    //! the path 7fa70e7 fixed). Keeping both pinned at the broker-
+    //! contract level lets a future librdkafka or Redpanda upgrade
+    //! fail loudly here before the mirror-level tests break.
+    unimplemented!("see REVIEW_TEST_STRATEGY.md §3 for the harness work this depends on");
+}
+
+#[tokio::test]
+#[ignore = "TODO: REVIEW_TEST_STRATEGY.md §2; needs multi-broker Apache Kafka stack variant"]
+async fn kafka_source_low_watermark_against_realistic_metadata_latency() {
+    //! Bug class: `StreamConsumer::fetch_watermarks` on a fresh
+    //! consumer that has not yet completed broker connection /
+    //! metadata fetch returns `Ok((0, 0))` instead of querying the
+    //! broker, against a real multi-broker Kafka cluster. 7fa70e7
+    //! fixed this for `KafkaSource::low_watermark` by routing
+    //! through a fresh `BaseConsumer` via `spawn_blocking`, but the
+    //! local Redpanda harness can't reproduce the original failure
+    //! mode because single-broker boot establishes connections
+    //! fast enough that the StreamConsumer call also succeeds.
+    //!
+    //! Implementation options (REVIEW_TEST_STRATEGY.md §2 walks
+    //! these in more detail):
+    //!   - **Multi-broker Apache Kafka** via testcontainers. Slow
+    //!     (~60s cold start) and adds a real CI cost; catches the
+    //!     bug class directly.
+    //!   - **Single-broker Kafka with injected metadata-fetch
+    //!     latency** (e.g. a toxiproxy delay on the broker port).
+    //!     Cheaper; catches the same class of bug as long as the
+    //!     delay window crosses the consumer's "first call before
+    //!     metadata arrived" threshold.
+    //!
+    //! The test would: open a `KafkaSource`, immediately call
+    //! `low_watermark()`, assert the broker's actual value is
+    //! returned. A second variant (or a parameterised run) calls
+    //! `fetch_watermarks` *directly* on the StreamConsumer and
+    //! asserts it returns the broken `(0, 0)`; that becomes the
+    //! regression guard so a future commit can't silently revert
+    //! to the StreamConsumer path without this test failing.
+    unimplemented!(
+        "see REVIEW_TEST_STRATEGY.md §2 for the multi-broker / latency-injection choice"
+    );
+}
+
+#[tokio::test]
+#[ignore = "TODO: REVIEW_TEST_STRATEGY.md smaller obs §2; stress fixture, not per-PR CI"]
+async fn compaction_log_handles_production_scale_fixture() {
+    //! Production reproducer the current 12-record e2e seeds don't
+    //! exercise: 1.2M source offsets, multiple keys, real broker-
+    //! side compaction work. Catches buffer-pressure issues, flush-
+    //! trigger edge cases, and mid-stream-gap density patterns
+    //! (compact-heavy topics deliver one gap per surviving key after
+    //! upstream dedup; at scale, that's hundreds of thousands of
+    //! gaps per restart) that small seeds don't surface.
+    //!
+    //! Should NOT run on every PR; the data volume is the point.
+    //! Gate on a schedule (nightly?), a label, or a manual workflow
+    //! dispatch. The strategy document explicitly suggests not
+    //! conflating this with bug-catching coverage (that's what the
+    //! sink matrix and the contract tests above are for).
+    //!
+    //! Implementation sketch:
+    //!   1. Produce ~100k records over ~5k keys (cycle to force
+    //!      compaction work).
+    //!   2. Force broker compaction.
+    //!   3. Start a `compaction:log` mirror.
+    //!   4. Wait for the mirror to catch up.
+    //!   5. Assert: no crash, the destination snapshot has ~5k
+    //!      keys, the gap-accept counter
+    //!      (`mirror_v3_source_offset_gap_records_total`) is in
+    //!      the expected ballpark.
+    unimplemented!("see REVIEW_TEST_STRATEGY.md smaller obs §2 for sizing + gating discussion");
+}
+
+#[tokio::test]
+#[ignore = "TODO: REVIEW_TEST_STRATEGY.md §5; restart matrix, builds on §3 harness"]
+async fn restart_correctness_across_cleanup_policies() {
+    //! The seven-row matrix from REVIEW_TEST_STRATEGY.md §5:
+    //!
+    //! | Cleanup policy   | Destination state          | Behaviour |
+    //! |------------------|---------------------------|-----------|
+    //! | `delete`         | empty                      | seek(0)   |
+    //! | `delete`         | non-empty                  | seek(next_expected) |
+    //! | `compact,delete` | empty, after DeleteRecords | bootstrap-align |
+    //! | `compact,delete` | non-empty < broker low     | bootstrap-align |
+    //! | `compact,delete` | non-empty ≥ broker low     | no gap    |
+    //! | `compact` only   | empty                      | first-delivery gap |
+    //! | `compact` only   | non-empty                  | mid-stream gaps |
+    //!
+    //! The two `compact only` rows are the cells the PR-#1 work
+    //! turned from "silently misbehaving" into "correct"; but
+    //! there's no e2e test that exercises the full restart cycle
+    //! against them. The other five rows are individually covered
+    //! by existing tests; encoding them as one table catches "we
+    //! added a sixth row and forgot to update the table" later.
+    //!
+    //! Depends on the real-broker compaction harness from §3 (the
+    //! `compact only` rows can't run against a delete-records
+    //! stand-in without circularity).
+    //!
+    //! Implementation: same shape as `restart_correctness.rs` for
+    //! one cell, parameterised over the seven rows. Each cell:
+    //!   1. Provision the broker with the given cleanup policy.
+    //!   2. Seed records + apply the policy-specific advancement
+    //!      (DeleteRecords for `*delete`, forced compaction for
+    //!      `compact only`, nothing for `delete` empty case).
+    //!   3. Optionally pre-populate the destination (the "non-empty"
+    //!      rows).
+    //!   4. Start the mirror.
+    //!   5. Assert it reaches steady state without error, the
+    //!      destination matches the broker's deliverable set, no
+    //!      duplicates, no gaps that weren't legitimate compaction.
+    unimplemented!("see REVIEW_TEST_STRATEGY.md §5; blocked on §3");
+}
diff --git a/e2e/tests/notify_kkv_v1.rs b/e2e/tests/notify_kkv_v1.rs
new file mode 100644
index 0000000..6b47acc
--- /dev/null
+++ b/e2e/tests/notify_kkv_v1.rs
@@ -0,0 +1,249 @@
+//! E2e: kafka → mirror-v3 (filesystem) with `notify` enabled,
+//! against a real axum-backed webhook receiver in-process. Verifies
+//! the full surface end-to-end:
+//!   * `trigger.on: source-consume` POSTs match the kkv-v1 wire
+//!     contract (path, headers, body).
+//!   * `trigger.on: destination-flush` fires one POST per durable
+//!     flush, with `updates: {}` per spec.
+//!   * The receiver receives every record's key under source-consume
+//!     debounce.
+
+use std::time::Duration;
+
+use mirror_config::{
+    FanOut, Notify, NotifyApi, NotifyDebounce, NotifyOutcomes, NotifyRetry, NotifyTarget,
+    NotifyTrigger, TriggerOn,
+};
+use mirror_e2e::docker::DockerProvisioner;
+use mirror_e2e::kafka_helpers::{create_topic, produce_records};
+use mirror_e2e::mirror_runner::{spawn_kafka_to_fs_with_notify, FsMirrorSpec};
+use mirror_e2e::webhook_receiver::WebhookReceiver;
+use mirror_e2e::{ProvisionedStack, Provisioner};
+use mirror_fs::FlushTriggers;
+use serde_json::Value;
+
+fn init_tracing() {
+    let _ = tracing_subscriber::fmt()
+        .with_env_filter(
+            tracing_subscriber::EnvFilter::try_from_default_env()
+                .unwrap_or_else(|_| tracing_subscriber::EnvFilter::new("info")),
+        )
+        .try_init();
+}
+
+fn notify_pointing_at_with_trigger(
+    addr: std::net::SocketAddr,
+    trigger: NotifyTrigger,
+    max_attempts: u32,
+) -> Notify {
+    Notify {
+        api: NotifyApi::KkvV1,
+        targets: vec![NotifyTarget {
+            url: format!("http://{addr}"),
+            path: None,
+            fan_out: FanOut::None,
+        }],
+        trigger,
+        timeout_ms: 2000,
+        retry: NotifyRetry {
+            max_attempts,
+            backoff_ms: 50,
+        },
+        outcomes: NotifyOutcomes::default(),
+    }
+}
+
+#[tokio::test(flavor = "multi_thread", worker_threads = 4)]
+async fn source_consume_dispatches_kkv_v1_posts_for_produced_records() {
+    init_tracing();
+    let stack = DockerProvisioner.provision().await.expect("provision");
+    let source = stack.source_bootstrap();
+    let root = tempfile::tempdir().expect("tempdir");
+    let topic = "notify-kkv-source-consume";
+
+    create_topic(&source, topic, 1).await.expect("topic");
+
+    let receiver = WebhookReceiver::start().await;
+    let notify = notify_pointing_at_with_trigger(
+        receiver.addr,
+        NotifyTrigger {
+            on: TriggerOn::SourceConsume,
+            // Tight debounce so 10 produced records collapse into
+            // one or two POSTs.
+            debounce: Some(NotifyDebounce {
+                max_records: 10,
+                max_time_ms: 200,
+            }),
+        },
+        3,
+    );
+
+    let flush = FlushTriggers {
+        max_time: Duration::from_secs(3600),
+        max_bytes: u64::MAX,
+        max_offsets: 1_000,
+        daily_at_utc_seconds: None,
+    };
+    let mirror = spawn_kafka_to_fs_with_notify(
+        FsMirrorSpec::ndjson(
+            source.clone(),
+            topic.into(),
+            0,
+            "notify-source-consume".into(),
+            root.path().to_path_buf(),
+            "ops".into(),
+            flush,
+        ),
+        notify,
+    )
+    .await
+    .expect("spawn mirror");
+
+    let fixtures: Vec<(String, String)> = (0..10)
+        .map(|i| (format!("user-{i}"), format!("payload-{i}")))
+        .collect();
+    produce_records(&source, topic, 0, &fixtures)
+        .await
+        .expect("produce");
+
+    // Wait for the receiver to see at least one POST. The debounce
+    // window is 200ms; we give it generous slack for Kafka delivery
+    // + dispatcher latency.
+    let captured = receiver.wait_for(1, Duration::from_secs(15)).await;
+
+    // Sanity on the first POST's contract.
+    let req = &captured[0];
+    assert_eq!(
+        req.path, "/kafka-keyvalue/v1/updates",
+        "default kkv-v1 path"
+    );
+    assert_eq!(
+        req.headers
+            .get("x-kkv-topic")
+            .and_then(|v| v.to_str().ok())
+            .unwrap_or(""),
+        topic
+    );
+    assert_eq!(
+        req.headers
+            .get("content-type")
+            .and_then(|v| v.to_str().ok())
+            .unwrap_or(""),
+        "application/json"
+    );
+    let body: Value = serde_json::from_slice(&req.body).expect("body JSON");
+    assert_eq!(body["topic"], topic);
+    // Each captured POST must carry a non-empty updates map (all
+    // produced keys are kkv-routable strings).
+    let updates = body["updates"]
+        .as_object()
+        .expect("updates is a JSON object");
+    assert!(
+        !updates.is_empty(),
+        "first POST must carry at least one key"
+    );
+    // The highest source offset in the batch must equal the largest
+    // 0-based offset of the keys it carries; since we produced
+    // contiguously from 0, the offset must be one of 0..9.
+    let high = body["offsets"]["0"]
+        .as_u64()
+        .expect("offsets.0 must be u64");
+    assert!(
+        (0..10).contains(&high),
+        "highest offset out of range, got {high}"
+    );
+
+    // Across ALL POSTs, every produced key must appear at least once
+    // (a key may collapse twice into the same batch if produced
+    // bursts overlap a debounce window; "at least once" is the
+    // load-bearing contract for cache invalidation).
+    let mut seen: std::collections::HashSet<String> = std::collections::HashSet::new();
+    for r in &captured {
+        let body: Value = serde_json::from_slice(&r.body).expect("body JSON");
+        if let Some(updates) = body["updates"].as_object() {
+            for k in updates.keys() {
+                seen.insert(k.clone());
+            }
+        }
+    }
+    for (k, _) in &fixtures {
+        assert!(
+            seen.contains(k),
+            "produced key {k:?} never appeared in any notify POST"
+        );
+    }
+
+    mirror.shutdown().await.expect("graceful shutdown");
+}
+
+#[tokio::test(flavor = "multi_thread", worker_threads = 4)]
+async fn destination_flush_dispatches_one_post_per_flush_with_empty_updates() {
+    init_tracing();
+    let stack = DockerProvisioner.provision().await.expect("provision");
+    let source = stack.source_bootstrap();
+    let root = tempfile::tempdir().expect("tempdir");
+    let topic = "notify-kkv-dest-flush";
+
+    create_topic(&source, topic, 1).await.expect("topic");
+
+    let receiver = WebhookReceiver::start().await;
+    let notify = notify_pointing_at_with_trigger(
+        receiver.addr,
+        NotifyTrigger {
+            on: TriggerOn::DestinationFlush,
+            debounce: None,
+        },
+        3,
+    );
+
+    // Flush every 5 records → 2 flushes for 10 produced records.
+    let flush = FlushTriggers {
+        max_time: Duration::from_secs(3600),
+        max_bytes: u64::MAX,
+        max_offsets: 5,
+        daily_at_utc_seconds: None,
+    };
+    let mirror = spawn_kafka_to_fs_with_notify(
+        FsMirrorSpec::ndjson(
+            source.clone(),
+            topic.into(),
+            0,
+            "notify-dest-flush".into(),
+            root.path().to_path_buf(),
+            "ops".into(),
+            flush,
+        ),
+        notify,
+    )
+    .await
+    .expect("spawn mirror");
+
+    let fixtures: Vec<(String, String)> = (0..10)
+        .map(|i| (format!("k{i}"), format!("v{i}")))
+        .collect();
+    produce_records(&source, topic, 0, &fixtures)
+        .await
+        .expect("produce");
+
+    // Two flushes expected; wait for both POSTs to land.
+    let captured = receiver.wait_for(2, Duration::from_secs(20)).await;
+    assert_eq!(
+        captured.len(),
+        2,
+        "exactly two POSTs (one per max-offsets=5 flush)"
+    );
+
+    let body_0: Value = serde_json::from_slice(&captured[0].body).expect("body 0");
+    let body_1: Value = serde_json::from_slice(&captured[1].body).expect("body 1");
+
+    // Empty updates per spec for destination-flush.
+    assert_eq!(body_0["updates"], serde_json::json!({}));
+    assert_eq!(body_1["updates"], serde_json::json!({}));
+
+    // Offsets in dispatch order: first flush covers 0..4 → high=4;
+    // second covers 5..9 → high=9.
+    assert_eq!(body_0["offsets"]["0"], serde_json::json!(4));
+    assert_eq!(body_1["offsets"]["0"], serde_json::json!(9));
+
+    mirror.shutdown().await.expect("graceful shutdown");
+}
diff --git a/e2e/tests/restart_resumes_notify_from_commit.rs b/e2e/tests/restart_resumes_notify_from_commit.rs
new file mode 100644
index 0000000..a80c00a
--- /dev/null
+++ b/e2e/tests/restart_resumes_notify_from_commit.rs
@@ -0,0 +1,378 @@
+//! Dev2 symptom reproducer for the between-pods notify gap.
+//!
+//! Production symptom in `dev2` (checkit, June 2026): a consumer pod
+//! polled `mirror-v3-worker`'s `/cache/v1` and got a 200 with stale
+//! values after the worker pod restarted. Trace: mirror-v3 had
+//! `enable.auto.commit=false` and never called a commit, so the
+//! group had no broker-side state. The bootstrap-suppression PR
+//! (`5ef7c9e`) reseeded suppression at every restart from the
+//! broker high-watermark, so records produced between the previous
+//! shutdown and the new startup got silently suppressed instead of
+//! firing the consumer-invalidation webhook.
+//!
+//! Fix shape (commits 1-6 of the delivery-semantics PR):
+//!   * `Source::commit_through` + `commit_pending` write the
+//!     consumer's progress back to the broker.
+//!   * `KkvV1Notifier` accepts an `AckSink` and notes the high
+//!     offset of every successful drain.
+//!   * `register_mirror_with_topic` takes
+//!     `last_committed_offset: Option<u64>` and computes
+//!     `suppression_threshold = max(last_committed, bootstrap_hwm)`.
+//!     On a returning deploy with a previous commit, records in
+//!     `[last_committed, bootstrap_hwm)` are no longer suppressed —
+//!     the between-pods gap fires the webhook.
+//!
+//! This test exercises the whole flow against a real Kafka broker:
+//!
+//!   1. Produce 5 records. Run a mirror with `KkvV1Notifier`
+//!      pointing at an in-process webhook receiver. Wait for the
+//!      webhook to capture all 5 keys. Commit through offset 5.
+//!   2. Stop the mirror. Produce 5 more records (offsets 5-9).
+//!   3. Start a *new* mirror with the same `group.id`. Its
+//!      `register_mirror_with_topic` is fed
+//!      `last_committed_offset = fetch_committed_offset()`.
+//!      Assert the webhook now captures offsets 5-9 (the gap is
+//!      closed) and does NOT replay offsets 0-4 (the suppression
+//!      threshold blocks records below the committed value).
+
+use std::collections::HashSet;
+use std::sync::Arc;
+use std::time::Duration;
+
+use mirror_config::{
+    FanOut, Notify, NotifyApi, NotifyDebounce, NotifyOutcomes, NotifyRetry, NotifyTarget,
+    NotifyTrigger, TriggerOn,
+};
+use mirror_core::{run_mirror_with_notifier, CacheBinding, CacheState, Sink, Source, TeeSink};
+use mirror_e2e::docker::DockerProvisioner;
+use mirror_e2e::kafka_helpers::{create_topic, produce_records};
+use mirror_e2e::webhook_receiver::WebhookReceiver;
+use mirror_e2e::{ProvisionedStack, Provisioner};
+use mirror_envelope::{ColumnType, Format, ParquetCompression};
+use mirror_fs::{FilesystemSink, FilesystemSinkConfig, FlushTriggers};
+use mirror_kafka::{KafkaSource, KafkaSourceConfig};
+
+const TOPIC: &str = "mirror-e2e-restart-resumes-notify";
+
+fn init_tracing() {
+    let _ = tracing_subscriber::fmt()
+        .with_env_filter(
+            tracing_subscriber::EnvFilter::try_from_default_env()
+                .unwrap_or_else(|_| tracing_subscriber::EnvFilter::new("info")),
+        )
+        .try_init();
+}
+
+fn notify_pointing_at(addr: std::net::SocketAddr) -> Notify {
+    Notify {
+        api: NotifyApi::KkvV1,
+        targets: vec![NotifyTarget {
+            url: format!("http://{addr}"),
+            path: None,
+            fan_out: FanOut::None,
+        }],
+        trigger: NotifyTrigger {
+            on: TriggerOn::SourceConsume,
+            debounce: Some(NotifyDebounce {
+                max_records: 100,
+                // Tight enough that 5 records drain before the
+                // wait_for() timeout, slack enough that the dispatcher
+                // batches them in one or two POSTs (not five).
+                max_time_ms: 200,
+            }),
+        },
+        timeout_ms: 2000,
+        retry: NotifyRetry {
+            max_attempts: 3,
+            backoff_ms: 50,
+        },
+        outcomes: NotifyOutcomes::default(),
+    }
+}
+
+fn fs_spec(root: &std::path::Path) -> FilesystemSinkConfig {
+    FilesystemSinkConfig {
+        root: root.to_path_buf(),
+        destination_name: "notify".into(),
+        partition: 0,
+        format: Format::Ndjson,
+        compression: ParquetCompression::Zstd1,
+        keys: ColumnType::Utf8,
+        values: ColumnType::Utf8,
+        compaction: None,
+        cache: None,
+        flush: FlushTriggers {
+            max_time: Duration::from_secs(3600),
+            max_bytes: u64::MAX,
+            max_offsets: u64::MAX,
+            daily_at_utc_seconds: None,
+        },
+    }
+}
+
+/// Extract the `updates` map keys from a kkv-v1 notify body. The
+/// notifier POSTs JSON of shape `{"v":"v1","topic":..., "offsets":
+/// {...}, "updates": {"<key>": "<base64>"}}`.
+fn keys_in_body(body: &[u8]) -> HashSet<String> {
+    let v: serde_json::Value = serde_json::from_slice(body).expect("notify body is JSON");
+    v.get("updates")
+        .and_then(|u| u.as_object())
+        .map(|m| m.keys().cloned().collect())
+        .unwrap_or_default()
+}
+
+#[tokio::test(flavor = "multi_thread", worker_threads = 4)]
+async fn webhooks_resume_at_committed_offset_after_restart() {
+    init_tracing();
+    let stack = DockerProvisioner.provision().await.expect("provision");
+    let source_bootstrap = stack.source_bootstrap();
+    let root = tempfile::tempdir().expect("tempdir");
+    create_topic(&source_bootstrap, TOPIC, 1)
+        .await
+        .expect("topic");
+
+    let group_id = format!("mirror-e2e-restart-resumes-notify-{}", uuid::Uuid::new_v4());
+    let receiver = WebhookReceiver::start().await;
+    let notify = notify_pointing_at(receiver.addr);
+
+    // Stage 1: 5 records to source, run mirror, wait for webhook,
+    // commit through offset 5.
+    let pairs_a: Vec<(String, String)> = (0..5)
+        .map(|i| (format!("k{i:03}"), format!("v{i:03}")))
+        .collect();
+    produce_records(&source_bootstrap, TOPIC, 0, &pairs_a)
+        .await
+        .expect("produce stage A");
+
+    {
+        let cache = Arc::new(CacheState::new());
+        cache.register_mirror_with_topic("notify", 0, None, false, TOPIC, 0);
+        let cache_binding = CacheBinding {
+            state: Arc::clone(&cache),
+            mirror_name: "notify".into(),
+        };
+
+        let source = KafkaSource::open(KafkaSourceConfig::new(
+            source_bootstrap.clone(),
+            group_id.clone(),
+            TOPIC,
+            0,
+        ))
+        .expect("open source A");
+        let commit_handle = source.commit_handle();
+
+        let fs_cfg = FilesystemSinkConfig {
+            cache: Some(mirror_fs::CacheBinding {
+                state: Arc::clone(&cache),
+                mirror_name: "notify".into(),
+            }),
+            ..fs_spec(root.path())
+        };
+        let sink: Box<dyn Sink> = Box::new(FilesystemSink::open(fs_cfg).expect("open fs sink A"));
+        let tee = TeeSink::open(vec![("notify".into(), sink)], Some(cache_binding))
+            .await
+            .expect("tee A");
+
+        let notifier = mirror_notify_kkv::KkvV1Notifier::from_config(
+            &notify,
+            TOPIC.into(),
+            0,
+            Arc::clone(&cache),
+            "notify".into(),
+        )
+        .expect("notifier A");
+
+        let (shutdown_tx, mut shutdown_rx) = tokio::sync::watch::channel(false);
+        let signal = async move {
+            let _ = shutdown_rx.changed().await;
+        };
+        let handle = tokio::spawn(async move {
+            run_mirror_with_notifier(
+                source,
+                tee,
+                notifier,
+                signal,
+                mirror_core::DEFAULT_HEARTBEAT_INTERVAL,
+            )
+            .await
+        });
+
+        // Webhook receives every key we produced.
+        let captured = receiver.wait_for(1, Duration::from_secs(15)).await;
+        let mut got: HashSet<String> = HashSet::new();
+        for req in &captured {
+            got.extend(keys_in_body(&req.body));
+        }
+        for i in 0..5 {
+            let want = format!("k{i:03}");
+            assert!(
+                got.contains(&want),
+                "stage A webhooks must include {want}; got {got:?}"
+            );
+        }
+
+        // Shut the mirror down, then write the consumer's progress
+        // back to the broker. In production the supervisor's periodic
+        // commit task does this on a schedule; here we drive it once
+        // by hand to keep the test deterministic.
+        let _ = shutdown_tx.send(true);
+        handle.await.expect("join A").expect("mirror A ok");
+
+        // The notifier's drain already advanced the in-memory ack
+        // state; persist offset 5 to the broker so the next pod sees
+        // it as the group's committed offset.
+        commit_handle
+            .commit_through(5)
+            .expect("stage A commit_through");
+        commit_handle
+            .commit_pending()
+            .expect("stage A commit_pending");
+    }
+
+    // Verify the broker accepted the commit before producing stage B.
+    let observed = poll_for_committed(&source_bootstrap, &group_id, Duration::from_secs(10)).await;
+    assert_eq!(
+        observed,
+        Some(5),
+        "broker must report committed offset 5 after stage A"
+    );
+
+    // Stage 2: 5 more records to source.
+    let pairs_b: Vec<(String, String)> = (5..10)
+        .map(|i| (format!("k{i:03}"), format!("v{i:03}")))
+        .collect();
+    produce_records(&source_bootstrap, TOPIC, 0, &pairs_b)
+        .await
+        .expect("produce stage B");
+
+    // Stage 2 webhook capture starts from where stage A left off,
+    // since the same receiver is reused.
+    let baseline = receiver.request_count();
+
+    {
+        let bootstrap_hwm = 10u64;
+        let last_committed =
+            poll_for_committed(&source_bootstrap, &group_id, Duration::from_secs(5))
+                .await
+                .expect("group must already have a committed offset");
+        assert_eq!(last_committed, 5);
+
+        let cache = Arc::new(CacheState::new());
+        cache.register_mirror_with_topic(
+            "notify",
+            bootstrap_hwm,
+            Some(last_committed),
+            false,
+            TOPIC,
+            0,
+        );
+        let cache_binding = CacheBinding {
+            state: Arc::clone(&cache),
+            mirror_name: "notify".into(),
+        };
+
+        let source = KafkaSource::open(KafkaSourceConfig::new(
+            source_bootstrap.clone(),
+            group_id.clone(),
+            TOPIC,
+            0,
+        ))
+        .expect("open source B");
+
+        let fs_cfg = FilesystemSinkConfig {
+            cache: Some(mirror_fs::CacheBinding {
+                state: Arc::clone(&cache),
+                mirror_name: "notify".into(),
+            }),
+            ..fs_spec(root.path())
+        };
+        let sink: Box<dyn Sink> = Box::new(FilesystemSink::open(fs_cfg).expect("open fs sink B"));
+        let tee = TeeSink::open(vec![("notify".into(), sink)], Some(cache_binding))
+            .await
+            .expect("tee B");
+
+        let notifier = mirror_notify_kkv::KkvV1Notifier::from_config(
+            &notify,
+            TOPIC.into(),
+            0,
+            Arc::clone(&cache),
+            "notify".into(),
+        )
+        .expect("notifier B");
+
+        let (shutdown_tx, mut shutdown_rx) = tokio::sync::watch::channel(false);
+        let signal = async move {
+            let _ = shutdown_rx.changed().await;
+        };
+        let handle = tokio::spawn(async move {
+            run_mirror_with_notifier(
+                source,
+                tee,
+                notifier,
+                signal,
+                mirror_core::DEFAULT_HEARTBEAT_INTERVAL,
+            )
+            .await
+        });
+
+        // Stage B records (offsets 5-9) must fire the webhook. Wait
+        // until at least one new POST has arrived since baseline,
+        // then collect every captured key from stage B.
+        let deadline = std::time::Instant::now() + Duration::from_secs(15);
+        loop {
+            if receiver.request_count() > baseline {
+                tokio::time::sleep(Duration::from_millis(200)).await;
+                break;
+            }
+            if std::time::Instant::now() >= deadline {
+                panic!("stage B: webhook receiver got no new POSTs");
+            }
+            tokio::time::sleep(Duration::from_millis(50)).await;
+        }
+
+        let all_captured = receiver.captured().await;
+        let mut stage_b_keys: HashSet<String> = HashSet::new();
+        for req in &all_captured[baseline..] {
+            stage_b_keys.extend(keys_in_body(&req.body));
+        }
+        for i in 5..10 {
+            let want = format!("k{i:03}");
+            assert!(
+                stage_b_keys.contains(&want),
+                "stage B webhooks must include {want} (between-pods gap); \
+                 got stage-B keys {stage_b_keys:?}"
+            );
+        }
+        // Stage A records must NOT be replayed: the suppression
+        // threshold (committed offset 5) blocks notifies for records
+        // 0..5. The mirror's source.seek() also doesn't go below the
+        // group's committed offset, but the cache-side suppression
+        // gate is the load-bearing check.
+        for i in 0..5 {
+            let unwanted = format!("k{i:03}");
+            assert!(
+                !stage_b_keys.contains(&unwanted),
+                "stage A key {unwanted} must NOT replay on the new pod; \
+                 got stage-B keys {stage_b_keys:?}"
+            );
+        }
+
+        let _ = shutdown_tx.send(true);
+        handle.await.expect("join B").expect("mirror B ok");
+    }
+}
+
+async fn poll_for_committed(bootstrap: &str, group: &str, timeout: Duration) -> Option<u64> {
+    let deadline = std::time::Instant::now() + timeout;
+    loop {
+        let cfg = KafkaSourceConfig::new(bootstrap.to_string(), group.to_string(), TOPIC, 0);
+        let mut s = KafkaSource::open(cfg).expect("re-open");
+        if let Ok(Some(off)) = s.fetch_committed_offset().await {
+            return Some(off);
+        }
+        if std::time::Instant::now() >= deadline {
+            return None;
+        }
+        tokio::time::sleep(Duration::from_millis(100)).await;
+    }
+}
diff --git a/e2e/tests/tee_cache_v1.rs b/e2e/tests/tee_cache_v1.rs
index dd4f1a4..54dd2e6 100644
--- a/e2e/tests/tee_cache_v1.rs
+++ b/e2e/tests/tee_cache_v1.rs
@@ -108,7 +108,7 @@ async fn tee_with_cache_v1_serves_latest_per_key_across_both_destinations() {
     assert!(bootstrap_hwm >= 5);
 
     let cache_state = Arc::new(CacheState::new());
-    cache_state.register_mirror("cache-mirror", bootstrap_hwm);
+    cache_state.register_mirror("cache-mirror", bootstrap_hwm, None, true);
     let binding = mirror_core::CacheBinding {
         state: Arc::clone(&cache_state),
         mirror_name: "cache-mirror".into(),
diff --git a/examples/cache-v1.yaml b/examples/cache-v1.yaml
index fcda066..c9929f8 100644
--- a/examples/cache-v1.yaml
+++ b/examples/cache-v1.yaml
@@ -1,21 +1,24 @@
 # yaml-language-server: $schema=../schemas/mirror-v3.config.schema.json
 #
 # KKV drop-in: mirror Kafka topics to disk *and* serve the latest
-# value per key over `/cache/v1` on port 8080 (override with
-# `MIRROR_V3_CACHE_PORT`).
+# value per key over `/cache/v1/{mirror}/...` on port 8080 (override
+# with `MIRROR_V3_CACHE_PORT`). At most one mirror per process may
+# additionally opt into `cache-v1-main`, which mounts the unprefixed
+# `/cache/v1/...` paths onto that mirror's view as a migration alias
+# for legacy kkv consumers that don't carry a mirror name in the URL.
 #
 # The mirror does both jobs from the same consume loop:
 #   1. Writes records to disk via the chosen format (Parquet here).
 #      Files grow append-style; they're durable history, not the
 #      cache view itself.
-#   2. Maintains an in-memory `key → latest value` map updated
-#      per-record (decoupled from flush cadence — set flush
+#   2. Maintains a per-mirror in-memory `key → latest value` map
+#      updated per-record (decoupled from flush cadence — set flush
 #      thresholds high to minimise bucket ops without affecting
 #      cache freshness).
 #
 # On restart, mirror-v3 replays the on-disk chain into the in-memory
-# view before flipping `/cache/v1` to ready. KKV semantics: dependents
-# never see a partially-rebuilt cache.
+# view before flipping the mirror's slot to ready. KKV semantics:
+# dependents never see a partially-rebuilt cache.
 #
 # For very large topics where restart replay would be slow, switch
 # to `compaction: log` — the mirror then bootstraps from the latest
@@ -36,7 +39,12 @@ mirrors:
     # requires keys to be utf8 / json / json-parseable (URL-routable).
     # values: { type: json-parseable }
     http-access:
-      api: cache-v1
+      # Per-mirror /cache/v1/user-states/... is always mounted.
+      cache-v1: {}
+      # Also serve the unprefixed /cache/v1/... paths so legacy
+      # kkv consumers that don't yet pass a mirror name keep
+      # working. At most one mirror per process may set this.
+      cache-v1-main: {}
     flush:
       # Long flush window — cache freshness is independent of this;
       # the values are live in memory the instant the consume loop
@@ -45,8 +53,9 @@ mirrors:
       max-bytes: 67108864
       max-offsets: 10000
 
-  # `http-access` works with `compaction: log` too. Both mirrors below
-  # serve into the same /cache/v1 keyspace; their keys must not collide.
+  # A second mirror is fine. It serves its own /cache/v1/orders/...
+  # paths; it cannot also set `cache-v1-main` (validator rejects
+  # >1 mains).
   # - name: orders
   #   source: { bootstrap-servers: kafka:9092 }
   #   topic: orders
@@ -57,7 +66,8 @@ mirrors:
   #   format: parquet
   #   compression: zstd-1
   #   compaction: log
-  #   http-access: { api: cache-v1 }
+  #   http-access:
+  #     cache-v1: {}
   #   flush:
   #     max-time-ms: 60000
   #     max-bytes: 67108864
diff --git a/examples/notify-destination-flush.yaml b/examples/notify-destination-flush.yaml
new file mode 100644
index 0000000..9f2c751
--- /dev/null
+++ b/examples/notify-destination-flush.yaml
@@ -0,0 +1,49 @@
+# yaml-language-server: $schema=../schemas/mirror-v3.config.schema.json
+#
+# `trigger.on: destination-flush`. Fire one POST per durable blob
+# flush. Use case from WEBHOOKS.md: downstream consumers that care
+# about durability over freshness (e.g. an archival sync job that
+# wants "tell me when a parquet file lands so I can copy it
+# elsewhere"). Not appropriate for cache invalidation, since
+# destination flush cadence is typically minutes.
+#
+# Body shape per flush:
+#   POST /kafka-keyvalue/v1/updates
+#   { "topic": "...", "offsets": { "<partition>": <highest-offset> },
+#     "updates": {} }
+#
+# `updates: {}` is intentional. Destination-flush doesn't accumulate
+# record keys; the offset alone tells the consumer everything they
+# need to act on the just-landed file.
+
+mirrors:
+  - name: archival-feed
+    source:
+      bootstrap-servers: kafka:9092
+    topic: events
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/lib/mirror-v3
+    format: parquet
+    compression: zstd-1
+    http-access:
+      cache-v1: {}
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://archival-sync:8080
+          fan-out: none
+      trigger:
+        on: destination-flush
+        # No `debounce` block; the destination's flush triggers
+        # ARE the debounce in this mode. Validator rejects an
+        # explicit debounce here.
+      timeout-ms: 5000
+      retry:
+        max-attempts: 5
+        backoff-ms: 100
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
diff --git a/examples/notify-kkv-replacement.yaml b/examples/notify-kkv-replacement.yaml
new file mode 100644
index 0000000..f9df43a
--- /dev/null
+++ b/examples/notify-kkv-replacement.yaml
@@ -0,0 +1,55 @@
+# yaml-language-server: $schema=../schemas/mirror-v3.config.schema.json
+#
+# Full kkv replacement: durable Parquet on disk + cache-v1 GET surface
+# + outbound kkv-v1 webhook so consumers know when to invalidate. Drop-
+# in for any service stack still pointing at the legacy
+# `@yolean/kafka-keyvalue` Node client.
+#
+# Per WEBHOOKS.md:
+#   * trigger.on: source-consume   - POST as records arrive (default).
+#   * debounce  {100, 250}         - at most 100 records per POST and
+#                                    no more than 250 ms of staleness.
+#   * outcomes.5xx { retry: true, final: fail }
+#                                  - transient backend trouble retries
+#                                    per `notify.retry`; persistent
+#                                    trouble crashes the mirror so the
+#                                    orchestrator restarts it.
+
+mirrors:
+  - name: user-states
+    source:
+      bootstrap-servers: kafka:9092
+    topic: user-states
+    partition: 0
+    destinations:
+      - type: filesystem
+        root: /var/lib/mirror-v3
+    format: parquet
+    compression: zstd-1
+    http-access:
+      # /cache/v1/user-states/raw/{key} always; the unprefixed
+      # /cache/v1/raw/{key} is the legacy kkv path consumers hit,
+      # served onto this mirror's view via `cache-v1-main`.
+      cache-v1: {}
+      cache-v1-main: {}
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://user-states-cache-target:8080
+          # `fan-out: dns-a` resolves the headless Service to all pod
+          # IPs and POSTs each. Use `none` for a single-replica
+          # target or a non-K8s consumer behind a single hostname.
+          fan-out: dns-a
+      trigger:
+        on: source-consume
+        debounce:
+          max-records: 100
+          max-time-ms: 250
+      timeout-ms: 5000
+      retry:
+        max-attempts: 5
+        backoff-ms: 100
+    flush:
+      max-time-ms: 60000
+      max-bytes: 67108864
+      max-offsets: 10000
diff --git a/examples/notify-only.yaml b/examples/notify-only.yaml
new file mode 100644
index 0000000..141027c
--- /dev/null
+++ b/examples/notify-only.yaml
@@ -0,0 +1,41 @@
+# yaml-language-server: $schema=../schemas/mirror-v3.config.schema.json
+#
+# Notify-only mirror: zero durable destinations, just a webhook feed.
+# A pure invalidation pipe; useful when downstream doesn't need
+# mirror-v3 to store anything, only to translate "Kafka record landed"
+# into "POST `/kafka-keyvalue/v1/updates`".
+#
+# Restart behaviour: with no durable state, the mirror seeks to the
+# source's *low watermark* on every startup and re-fires webhooks for
+# every record from there forward. On a busy topic that's a burst per
+# restart; tune `debounce` upward (e.g. {1000, 1000}) to coalesce, or
+# add a small filesystem destination for resume-from-offset.
+#
+# Validator rules in mirror-config (see WEBHOOKS.md § Validation):
+#   * destinations may be empty IFF notify is set with ≥1 target;
+#   * trigger.on MUST be source-consume (destination-flush has no
+#     destinations to ack);
+#   * format / compression / compaction / flush / http-access are all
+#     forbidden; they parameterise destinations that don't exist.
+
+mirrors:
+  - name: events-invalidator
+    source:
+      bootstrap-servers: kafka:9092
+    topic: events
+    partition: 0
+    destinations: []
+    notify:
+      api: kkv-v1
+      targets:
+        - url: http://events-consumer:8080
+          fan-out: dns-a
+      trigger:
+        on: source-consume
+        debounce:
+          max-records: 100
+          max-time-ms: 250
+      timeout-ms: 5000
+      retry:
+        max-attempts: 5
+        backoff-ms: 100
diff --git a/schemas/mirror-v3.cache.openapi.json b/schemas/mirror-v3.cache.openapi.json
index 41e9380..1700835 100644
--- a/schemas/mirror-v3.cache.openapi.json
+++ b/schemas/mirror-v3.cache.openapi.json
@@ -2,7 +2,7 @@
   "openapi": "3.1.0",
   "info": {
     "title": "mirror-v3 cache",
-    "description": "Drop-in HTTP surface for Yolean/kafka-keyvalue's /cache/v1. The state is a merged in-memory `key → latest-value` view across every mirror with `http-access: { api: cache-v1 }`. Updates are per-record from the consume loop; reads return 503 until every registered mirror has caught up to its startup high-watermark.",
+    "description": "Drop-in HTTP surface for Yolean/kafka-keyvalue's /cache/v1. Each opt-in mirror (`http-access.cache-v1`) owns its own in-memory `key → latest-value` view, exposed under `/cache/v1/{mirror}/...`. A single mirror may additionally opt into `cache-v1-main`, which mounts the unprefixed `/cache/v1/...` paths onto its view as a migration alias for legacy kkv consumers; these unprefixed routes are config-conditional and intentionally omitted from this spec. Updates are per-record from the consume loop; reads return 503 until the target mirror has caught up to its startup high-watermark.",
     "license": {
       "name": "Apache-2.0",
       "identifier": "Apache-2.0"
@@ -15,7 +15,7 @@
         "tags": [
           "admin"
         ],
-        "summary": "POST /_admin/v1/shutdown — request graceful exit.",
+        "summary": "POST /_admin/v1/shutdown; request graceful exit.",
         "operationId": "admin_shutdown",
         "responses": {
           "202": {
@@ -29,7 +29,7 @@
         "tags": [
           "admin"
         ],
-        "summary": "POST /_admin/v1/shutdown/{exitcode} — request graceful exit with a specific code.",
+        "summary": "POST /_admin/v1/shutdown/{exitcode}; request graceful exit with a specific code.",
         "operationId": "admin_shutdown_with_exit_code",
         "parameters": [
           {
@@ -50,14 +50,25 @@
         }
       }
     },
-    "/cache/v1/keys": {
+    "/cache/v1/{mirror}/keys": {
       "get": {
         "tags": [
           "cache"
         ],
-        "summary": "GET /cache/v1/keys — newline-separated key list, every line\n(including the last) terminated by `\\n`. Order is the order each\nkey was first seen by the cache (insertion order).",
-        "description": "`Content-Type` is `application/octet-stream` to match KKV's\nbyte-for-byte response shape. A possible future enhancement (gated\non operator demand) is to surface the topic schema in the content\ntype — see the `values` handler for the same hook.",
+        "summary": "GET /cache/v1/{mirror}/keys; newline-separated key list for the\nnamed mirror's view. Every line (including the last) is\nterminated by `\\n`. Order is insertion order (the position a key\ngets the *first* time the mirror sees it).",
+        "description": "`Content-Type` is `application/octet-stream` to match KKV's\nbyte-for-byte response shape.",
         "operationId": "keys",
+        "parameters": [
+          {
+            "name": "mirror",
+            "in": "path",
+            "description": "Name of the `http-access.cache-v1` mirror to read from",
+            "required": true,
+            "schema": {
+              "type": "string"
+            }
+          }
+        ],
         "responses": {
           "200": {
             "description": "Newline-separated keys (UTF-8, trailing newline included)",
@@ -74,20 +85,39 @@
               }
             }
           },
+          "404": {
+            "description": "Mirror unknown"
+          },
           "503": {
-            "description": "Cache is not yet caught up to the source"
+            "description": "Mirror is not currently Ready; body is a MirrorReadiness object",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/MirrorReadiness"
+                }
+              }
+            }
           }
         }
       }
     },
-    "/cache/v1/offset/{topic}/{partition}": {
+    "/cache/v1/{mirror}/offset/{topic}/{partition}": {
       "get": {
         "tags": [
           "cache"
         ],
-        "summary": "GET /cache/v1/offset/{topic}/{partition} — last-seen offset.",
+        "summary": "GET /cache/v1/{mirror}/offset/{topic}/{partition}; last-seen\noffset for that (topic, partition) within the named mirror.",
         "operationId": "offset_for_partition",
         "parameters": [
+          {
+            "name": "mirror",
+            "in": "path",
+            "description": "Name of the `http-access.cache-v1` mirror to read from",
+            "required": true,
+            "schema": {
+              "type": "string"
+            }
+          },
           {
             "name": "topic",
             "in": "path",
@@ -111,7 +141,7 @@
         ],
         "responses": {
           "200": {
-            "description": "Decimal offset of the last applied record, or empty if none yet",
+            "description": "Decimal offset of the last applied record on this mirror, or empty if none yet",
             "content": {
               "text/plain": {
                 "schema": {
@@ -122,18 +152,30 @@
           },
           "400": {
             "description": "Empty topic"
+          },
+          "404": {
+            "description": "Mirror unknown"
           }
         }
       }
     },
-    "/cache/v1/raw/{key}": {
+    "/cache/v1/{mirror}/raw/{key}": {
       "get": {
         "tags": [
           "cache"
         ],
-        "summary": "GET /cache/v1/raw/{key} — fetch a value by key.",
+        "summary": "GET /cache/v1/{mirror}/raw/{key}; fetch a value by key from the\nnamed mirror's view. The unprefixed `/cache/v1/raw/{key}` alias\nis mounted by `build_router` when one mirror opted into\n`http-access.cache-v1-main`, and dispatches here with that\nmirror's name.",
         "operationId": "raw_by_key",
         "parameters": [
+          {
+            "name": "mirror",
+            "in": "path",
+            "description": "Name of the `http-access.cache-v1` mirror to read from",
+            "required": true,
+            "schema": {
+              "type": "string"
+            }
+          },
           {
             "name": "key",
             "in": "path",
@@ -164,22 +206,39 @@
             "description": "Empty or invalid key"
           },
           "404": {
-            "description": "Key not in cache"
+            "description": "Mirror unknown, or key not in cache"
           },
           "503": {
-            "description": "Cache is not yet caught up to the source"
+            "description": "Mirror is not currently Ready; body is a MirrorReadiness object",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/MirrorReadiness"
+                }
+              }
+            }
           }
         }
       }
     },
-    "/cache/v1/values": {
+    "/cache/v1/{mirror}/values": {
       "get": {
         "tags": [
           "cache"
         ],
-        "summary": "GET /cache/v1/values — newline-separated values (raw bytes).\nOrder matches `/cache/v1/keys`. Every line — including the last —\nis terminated by `\\n`. Binary-safe **only** when none of the values\ncontain a `0x0A` byte; binary topics should pin\n`values: { type: bytes-base64 }` so the cache returns the\nbase64-encoded form here.",
-        "description": "`Content-Type` is `text/plain; charset=utf-8` regardless of the\nconfigured value type. Future work — gated on operator demand —\nis to adapt the response content type to the topic schema:\n\n| `values.type`        | proposed `Content-Type`            |\n| -------------------- | ---------------------------------- |\n| `bytes-base64`       | `application/octet-stream`         |\n| `utf8`               | `text/plain; charset=utf-8`        |\n| `json` / `json-parseable` | `application/x-ndjson`        |\n\nNot implemented today to keep parity with KKV's\n`text/plain;charset=UTF-8` (mirror-v3 emits the RFC-normalised\nequivalent).",
+        "summary": "GET /cache/v1/{mirror}/values; newline-separated values for the\nnamed mirror's view, in `keys` order. Binary-safe **only** when\nnone of the values contain a `0x0A` byte; binary topics should\npin `values: { type: bytes-base64 }` so the cache returns the\nbase64-encoded form here.",
         "operationId": "values",
+        "parameters": [
+          {
+            "name": "mirror",
+            "in": "path",
+            "description": "Name of the `http-access.cache-v1` mirror to read from",
+            "required": true,
+            "schema": {
+              "type": "string"
+            }
+          }
+        ],
         "responses": {
           "200": {
             "description": "Newline-separated raw values with trailing newline; binary-safe iff no value contains 0x0A",
@@ -196,8 +255,18 @@
               }
             }
           },
+          "404": {
+            "description": "Mirror unknown"
+          },
           "503": {
-            "description": "Cache is not yet caught up to the source"
+            "description": "Mirror is not currently Ready; body is a MirrorReadiness object",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/MirrorReadiness"
+                }
+              }
+            }
           }
         }
       }
@@ -205,6 +274,132 @@
   },
   "components": {
     "schemas": {
+      "AggregateReadiness": {
+        "type": "string",
+        "description": "Aggregate readiness state for the process. The discriminator\nstring lets a grep-friendly consumer distinguish \"warming up but\nexpected to clear shortly\" (a cold start) from \"something is\nwrong\" (a mirror went degraded after first reaching Ready).",
+        "enum": [
+          "ready",
+          "warming",
+          "degraded"
+        ]
+      },
+      "MirrorReadiness": {
+        "type": "object",
+        "description": "One mirror's slice of the readiness response. Returned both as\nan element of [`ReadinessReport::mirrors`] and as the standalone\nbody of the per-mirror `/cache/v1/{mirror}/...` 503 response so a\nclient library can surface the reason without a second request.",
+        "required": [
+          "name",
+          "status",
+          "source"
+        ],
+        "properties": {
+          "destination": {
+            "oneOf": [
+              {
+                "type": "null"
+              },
+              {
+                "$ref": "#/components/schemas/MirrorReadinessDestination",
+                "description": "Status-specific detail: the lagging destination's name + lag\n(when `status == \"destination_lagging\"`), or the source lag\n(when `status == \"lag_behind_source\"`). `None` otherwise."
+              }
+            ]
+          },
+          "name": {
+            "type": "string"
+          },
+          "source": {
+            "$ref": "#/components/schemas/MirrorReadinessSource",
+            "description": "Source-side detail: topic, partition, assignment, offsets."
+          },
+          "status": {
+            "type": "string",
+            "description": "String discriminator for the status, easy to grep:\n`ready` | `warming` | `lag_behind_source` | `source_unassigned`\n| `destination_lagging`."
+          }
+        }
+      },
+      "MirrorReadinessDestination": {
+        "type": "object",
+        "required": [
+          "name",
+          "lag"
+        ],
+        "properties": {
+          "lag": {
+            "type": "integer",
+            "format": "int64",
+            "minimum": 0
+          },
+          "name": {
+            "type": "string"
+          }
+        }
+      },
+      "MirrorReadinessSource": {
+        "type": "object",
+        "required": [
+          "topic",
+          "partition",
+          "assigned",
+          "end_offset",
+          "last_applied_offset",
+          "lag"
+        ],
+        "properties": {
+          "assigned": {
+            "type": "boolean"
+          },
+          "end_offset": {
+            "type": "integer",
+            "format": "int64",
+            "minimum": 0
+          },
+          "lag": {
+            "type": "integer",
+            "format": "int64",
+            "description": "`end_offset - last_applied_offset`, saturating at 0 so a\nlate-arriving high-watermark fetch can't underflow.",
+            "minimum": 0
+          },
+          "last_applied_offset": {
+            "type": "integer",
+            "format": "int64",
+            "minimum": 0
+          },
+          "partition": {
+            "type": "integer",
+            "format": "int32",
+            "minimum": 0
+          },
+          "topic": {
+            "type": "string"
+          }
+        }
+      },
+      "ReadinessReport": {
+        "type": "object",
+        "description": "Full body of the readiness endpoint. Always serialised; the\nHTTP status code (200 vs 503) is determined by `ready`.",
+        "required": [
+          "ready",
+          "mirrors",
+          "unhealthy"
+        ],
+        "properties": {
+          "mirrors": {
+            "type": "array",
+            "items": {
+              "$ref": "#/components/schemas/MirrorReadiness"
+            }
+          },
+          "ready": {
+            "$ref": "#/components/schemas/AggregateReadiness"
+          },
+          "unhealthy": {
+            "type": "array",
+            "items": {
+              "type": "string"
+            },
+            "description": "Grep-friendly list of mirror names whose status is not\n`ready`. Empty when `ready == \"ready\"`."
+          }
+        }
+      },
       "TopicPartitionOffsetJson": {
         "type": "object",
         "description": "`{topic, partition, offset}` shape serialized into the\n`x-kkv-last-seen-offsets` header. Mirrors KKV's\n`TopicPartitionOffset`, including JSON property order.",
diff --git a/schemas/mirror-v3.config.schema.json b/schemas/mirror-v3.config.schema.json
index 0f4c6a4..b8c345d 100644
--- a/schemas/mirror-v3.config.schema.json
+++ b/schemas/mirror-v3.config.schema.json
@@ -133,11 +133,22 @@
           ]
         },
         "enabled": {
-          "description": "Whether mirror-v3 should actually spawn this mirror at\nstartup. Defaults to `true`. Plain YAML boolean only —\n`true` / `false` (and the YAML-1.2 case variants\n`True`/`False`/`TRUE`/`FALSE`). The YAML-1.1 truthy/falsy\nstrings (`yes`/`no`/`on`/`off`) are deliberately NOT\naccepted; operators who want to flip a mirror via env\ninterpolation should write the env value as `true` or\n`false`:\n\n```yaml\n- name: requests\n  enabled: ${REQUESTS_ENABLED:-false}\n  ...\n```\n\nDisabled mirrors are validated the same as enabled ones (so\nflipping `false` → `true` won't surface latent config bugs)\nbut are not spawned, do not register with the cache-v1\nreadiness gate, and do not contribute to source-broker reads.\nIf *every* mirror in a process is disabled, startup fails\nloudly so a misconfigured deployment doesn't silently idle.",
+          "description": "Whether mirror-v3 should actually spawn this mirror at\nstartup. Defaults to `true`. Plain YAML boolean only -\n`true` / `false` (and the YAML-1.2 case variants\n`True`/`False`/`TRUE`/`FALSE`). The YAML-1.1 truthy/falsy\nstrings (`yes`/`no`/`on`/`off`) are deliberately NOT\naccepted; operators who want to flip a mirror via env\ninterpolation should write the env value as `true` or\n`false`:\n\n```yaml\n- name: requests\n  enabled: ${REQUESTS_ENABLED:-false}\n  ...\n```\n\nDisabled mirrors are validated the same as enabled ones (so\nflipping `false` → `true` won't surface latent config bugs)\nbut are not spawned, do not register with the cache-v1\nreadiness gate, and do not contribute to source-broker reads.\nIf *every* mirror in a process is disabled, startup fails\nloudly so a misconfigured deployment doesn't silently idle.",
           "type": [
             "boolean",
             "null"
           ]
+        },
+        "notify": {
+          "description": "Opt-in outbound webhook notify. Closes the legacy\n`Yolean/kafka-keyvalue` (kkv) \"onupdate\" gap: when a record\nlands in the mirror's view, POST to one or more downstream\nservices so their in-process caches can invalidate and\nre-fetch via `/cache/v1/raw/<key>`.\n\nToday the only `api` variant is `kkv-v1`, which matches the\nlegacy kkv wire contract byte-for-byte so the upstream\n`@yolean/kafka-keyvalue` Node client works unmodified.\n\nSee `WEBHOOKS.md` at the repo root for the full design,\ntrigger modes, outcome matrix, and DNS-A fan-out semantics.",
+          "anyOf": [
+            {
+              "$ref": "#/$defs/Notify"
+            },
+            {
+              "type": "null"
+            }
+          ]
         }
       },
       "additionalProperties": false,
@@ -194,6 +205,11 @@
               ],
               "default": null
             },
+            "affects-readiness": {
+              "description": "Whether this destination gates the mirror's readiness. When\n`true` (default), the supervisor reports\n`MirrorStatus::DestinationLagging` if this destination falls\nbehind the source by more than the configured tolerance,\nand the structured `/q/health/ready` body names the\ndestination by `name`. Set `false` for best-effort secondary\ndestinations (observability replicas, archival sync) that\nshould not flip the mirror's status.",
+              "type": "boolean",
+              "default": true
+            },
             "type": {
               "type": "string",
               "const": "kafka"
@@ -220,6 +236,11 @@
               "description": "Absolute path to the destination root directory.",
               "type": "string"
             },
+            "affects-readiness": {
+              "description": "See [`KafkaDestination::affects_readiness`].",
+              "type": "boolean",
+              "default": true
+            },
             "type": {
               "type": "string",
               "const": "filesystem"
@@ -264,6 +285,11 @@
               ],
               "default": null
             },
+            "affects-readiness": {
+              "description": "See [`KafkaDestination::affects_readiness`].",
+              "type": "boolean",
+              "default": true
+            },
             "type": {
               "type": "string",
               "const": "s3"
@@ -282,7 +308,7 @@
       "description": "Envelope format for Filesystem and S3 destinations.",
       "oneOf": [
         {
-          "description": "Apache Parquet. Columnar, embedded schema, compressed.\nStandard data-lake format — readable by DuckDB / Athena /\nSpark out of the box.",
+          "description": "Apache Parquet. Columnar, embedded schema, compressed.\nStandard data-lake format - readable by DuckDB / Athena /\nSpark out of the box.",
           "type": "string",
           "const": "parquet"
         },
@@ -441,25 +467,331 @@
       ]
     },
     "HttpAccess": {
-      "description": "HTTP read-access block. Today the only variant is the KKV-compatible\n`/cache/v1` surface; the field is grouped so future APIs can be\nadded without re-shaping the YAML.",
+      "description": "HTTP read-access block. Multiple API surfaces can be enabled on\nthe same mirror; each is configured by its presence under its\nown key. The map shape (rather than the original `{ api: ... }`\nenum) lets a mirror opt into more than one API and keeps room\nfor per-API knobs without further config reshaping.",
+      "type": "object",
+      "properties": {
+        "cache-v1": {
+          "description": "`/cache/v1/{mirror}/raw/{key}` etc. mounted at the mirror's\nown name. Required if `cache-v1-main` is set. See the\n`mirror-cache` crate for behavior and the committed OpenAPI\n3.1 spec in `schemas/mirror-v3.cache.openapi.json`.",
+          "anyOf": [
+            {
+              "$ref": "#/$defs/CacheV1Config"
+            },
+            {
+              "type": "null"
+            }
+          ]
+        },
+        "cache-v1-main": {
+          "description": "`/cache/v1/raw/{key}` etc. mounted at the unprefixed path,\ndispatching to this mirror's per-mirror view. At most one\nmirror in the whole config may set this; the validator\nrejects more than one so a `cache-v1-main` consumer sees a\nsingle deterministic view. Migration aid; once every consumer\nhas moved to `/cache/v1/{mirror}/...` it can be removed.",
+          "anyOf": [
+            {
+              "$ref": "#/$defs/CacheV1MainConfig"
+            },
+            {
+              "type": "null"
+            }
+          ]
+        }
+      },
+      "additionalProperties": false
+    },
+    "CacheV1Config": {
+      "description": "Per-API configuration block for `cache-v1`. Empty today, populated\nas the field is given operator-tunable knobs.",
+      "type": "object",
+      "additionalProperties": false
+    },
+    "CacheV1MainConfig": {
+      "description": "Per-API configuration block for `cache-v1-main`. Empty today.",
+      "type": "object",
+      "additionalProperties": false
+    },
+    "Notify": {
+      "description": "Per-mirror outbound notify block. Today only the `kkv-v1` API\nvariant is supported; future variants (e.g. `nats-v1`, a\n`kkv-v2` with auth) hang off the same block without re-shaping.",
       "type": "object",
       "properties": {
         "api": {
-          "$ref": "#/$defs/HttpAccessApi"
+          "$ref": "#/$defs/NotifyApi"
+        },
+        "targets": {
+          "description": "One or more downstream targets. Each target carries its own\nURL and fan-out mode. Multi-target notify fan-out is parallel\nand per-target outcomes resolve independently.",
+          "type": "array",
+          "items": {
+            "$ref": "#/$defs/NotifyTarget"
+          }
+        },
+        "trigger": {
+          "$ref": "#/$defs/NotifyTrigger",
+          "default": {
+            "on": "source-consume",
+            "debounce": {
+              "max-records": 100,
+              "max-time-ms": 250
+            }
+          }
+        },
+        "timeout-ms": {
+          "description": "Per-request HTTP timeout. Independent of retry policy: timing\nout is one of the six outcomes whose action is configurable.\nSpec default: 5000 ms.",
+          "type": "integer",
+          "format": "uint64",
+          "minimum": 0,
+          "default": 5000
+        },
+        "retry": {
+          "$ref": "#/$defs/NotifyRetry",
+          "default": {
+            "max-attempts": 5,
+            "backoff-ms": 100
+          }
+        },
+        "outcomes": {
+          "$ref": "#/$defs/NotifyOutcomes",
+          "default": {
+            "timeout": {
+              "retry": true,
+              "final": "fail"
+            },
+            "connrefused": {
+              "retry": true,
+              "final": "fail"
+            },
+            "2xx": {
+              "retry": false,
+              "final": "accept"
+            },
+            "3xx": {
+              "retry": false,
+              "final": "fail"
+            },
+            "4xx": {
+              "retry": false,
+              "final": "fail"
+            },
+            "5xx": {
+              "retry": true,
+              "final": "fail"
+            }
+          }
+        }
+      },
+      "additionalProperties": false,
+      "required": [
+        "api",
+        "targets"
+      ]
+    },
+    "NotifyApi": {
+      "description": "The wire-contract variant this notify block speaks. Today only\nthe legacy kkv shape exists. New variants must explicitly opt\nin - kkv-v1 is not the default to avoid silently changing\nbehaviour if we ever add e.g. a kkv-v2 with auth.",
+      "oneOf": [
+        {
+          "description": "`POST /kafka-keyvalue/v1/updates` with the legacy kkv body:\n`{ topic, offsets, updates: { <key>: null } }`. Matches the\n`@yolean/kafka-keyvalue` Node client's\n`getOnUpdateRoute()` / `ON_UPDATE_DEFAULT_PATH`.",
+          "type": "string",
+          "const": "kkv-v1"
+        }
+      ]
+    },
+    "NotifyTarget": {
+      "type": "object",
+      "properties": {
+        "url": {
+          "description": "Full URL of the target. Path defaults to\n`/kafka-keyvalue/v1/updates` under `api: kkv-v1` if `path`\nis unset; explicit override is allowed for non-kkv clients.",
+          "type": "string"
+        },
+        "path": {
+          "description": "Override the URL's path segment. Defaults to the\napi-variant-defined path (`/kafka-keyvalue/v1/updates`\nfor kkv-v1).",
+          "type": [
+            "string",
+            "null"
+          ]
+        },
+        "fan-out": {
+          "description": "How the URL's host is resolved. `none` (default) sends one\nPOST to a single keep-alive connection; `dns-a` resolves\nthe host to its full A/AAAA record set and POSTs to every\nreturned address concurrently - the K8s-headless-Service\nfan-out path without a Kubernetes API dependency.",
+          "$ref": "#/$defs/FanOut",
+          "default": "none"
+        }
+      },
+      "additionalProperties": false,
+      "required": [
+        "url"
+      ]
+    },
+    "FanOut": {
+      "oneOf": [
+        {
+          "description": "Standard DNS, single keep-alive connection. Adequate for a\nnon-K8s target or a single-replica deployment.",
+          "type": "string",
+          "const": "none"
+        },
+        {
+          "description": "Resolve the URL's host to all A/AAAA records and POST to\nevery address concurrently. Headless Kubernetes Services\nreturn one A-record per pod, giving the same fan-out the\nlegacy kkv did via the Endpoints API.",
+          "type": "string",
+          "const": "dns-a"
+        }
+      ]
+    },
+    "NotifyTrigger": {
+      "type": "object",
+      "properties": {
+        "on": {
+          "$ref": "#/$defs/TriggerOn"
+        },
+        "debounce": {
+          "description": "Required when `on: source-consume`; forbidden when\n`on: destination-flush` (the destination's own flush\ntriggers ARE the debounce in that mode). Defaults to\n`{ max-records: 100, max-time-ms: 250 }`.",
+          "anyOf": [
+            {
+              "$ref": "#/$defs/NotifyDebounce"
+            },
+            {
+              "type": "null"
+            }
+          ]
+        }
+      },
+      "additionalProperties": false,
+      "required": [
+        "on"
+      ]
+    },
+    "TriggerOn": {
+      "oneOf": [
+        {
+          "description": "POST as soon as the consume loop hands a record to the\nmirror - bounded by the `debounce` window. Default;\nmatches legacy kkv behaviour.",
+          "type": "string",
+          "const": "source-consume"
+        },
+        {
+          "description": "POST when *every* destination has durably committed past\nthe batch's high-water offset. The notify body's offset\nrange matches the flushed snapshot's `from`–`to`. Wrong\nfor cache invalidation; right for downstream archival\nhints.",
+          "type": "string",
+          "const": "destination-flush"
+        }
+      ]
+    },
+    "NotifyDebounce": {
+      "type": "object",
+      "properties": {
+        "max-records": {
+          "type": "integer",
+          "format": "uint64",
+          "minimum": 0
+        },
+        "max-time-ms": {
+          "type": "integer",
+          "format": "uint64",
+          "minimum": 0
+        }
+      },
+      "additionalProperties": false,
+      "required": [
+        "max-records",
+        "max-time-ms"
+      ]
+    },
+    "NotifyRetry": {
+      "type": "object",
+      "properties": {
+        "max-attempts": {
+          "type": "integer",
+          "format": "uint32",
+          "minimum": 0
+        },
+        "backoff-ms": {
+          "type": "integer",
+          "format": "uint64",
+          "minimum": 0
+        }
+      },
+      "additionalProperties": false,
+      "required": [
+        "max-attempts",
+        "backoff-ms"
+      ]
+    },
+    "NotifyOutcomes": {
+      "description": "The six request outcomes and what each one means for the mirror.\nPer-field omission falls back to the spec-default for that\noutcome only (one outcome being explicit doesn't force the\nothers to be).",
+      "type": "object",
+      "properties": {
+        "timeout": {
+          "$ref": "#/$defs/NotifyOutcome",
+          "default": {
+            "retry": true,
+            "final": "fail"
+          }
+        },
+        "connrefused": {
+          "$ref": "#/$defs/NotifyOutcome",
+          "default": {
+            "retry": true,
+            "final": "fail"
+          }
+        },
+        "2xx": {
+          "description": "HTTP 2xx - the only success outcome.",
+          "$ref": "#/$defs/NotifyOutcome",
+          "default": {
+            "retry": false,
+            "final": "accept"
+          }
+        },
+        "3xx": {
+          "description": "HTTP 3xx - almost always misconfiguration on a webhook.",
+          "$ref": "#/$defs/NotifyOutcome",
+          "default": {
+            "retry": false,
+            "final": "fail"
+          }
+        },
+        "4xx": {
+          "description": "HTTP 4xx - receiver says \"your request is wrong\";\nretrying the same payload doesn't help.",
+          "$ref": "#/$defs/NotifyOutcome",
+          "default": {
+            "retry": false,
+            "final": "fail"
+          }
+        },
+        "5xx": {
+          "description": "HTTP 5xx - receiver is transiently broken; retry per\npolicy and fail on exhaustion.",
+          "$ref": "#/$defs/NotifyOutcome",
+          "default": {
+            "retry": true,
+            "final": "fail"
+          }
+        }
+      },
+      "additionalProperties": false
+    },
+    "NotifyOutcome": {
+      "type": "object",
+      "properties": {
+        "retry": {
+          "description": "If `true`, the request is retried per [`NotifyRetry`] before\n[`Self::final_`] is applied. If `false`, the action in\n[`Self::final_`] is taken on the first attempt.",
+          "type": "boolean"
+        },
+        "final": {
+          "description": "What happens once retries (if any) are exhausted.",
+          "$ref": "#/$defs/FinalAction"
         }
       },
       "additionalProperties": false,
       "required": [
-        "api"
+        "retry",
+        "final"
       ]
     },
-    "HttpAccessApi": {
-      "description": "Variants of the read API surface mirror-v3 will host. Each opt-in\nmirror declares which one applies to it; today only `cache-v1`\nexists (a drop-in for `Yolean/kafka-keyvalue`'s `/cache/v1`).",
+    "FinalAction": {
       "oneOf": [
         {
-          "description": "`/cache/v1/raw/{key}`, `/cache/v1/keys`, `/cache/v1/values`,\n`/cache/v1/offset/{topic}/{partition}`. See the `mirror-cache`\ncrate for behavior and the committed OpenAPI 3.1 spec in\n`schemas/mirror-v3.cache.openapi.json`.",
+          "description": "Treat the batch as delivered, advance.",
+          "type": "string",
+          "const": "accept"
+        },
+        {
+          "description": "Log WARN, drop the batch, advance.",
+          "type": "string",
+          "const": "skip"
+        },
+        {
+          "description": "Mirror task errors out; orchestrator restarts; mirror\nreplays from durable state on restart.",
           "type": "string",
-          "const": "cache-v1"
+          "const": "fail"
         }
       ]
     }