foundryside-dev · tachyon-beep · Jun 5, 2026 · Jun 5, 2026 · chatgpt-codex-connector · Jun 5, 2026
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -55,6 +55,37 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
   CLI verb shares the same filter core. (WS-B1, WS-B2)
 
 ### Security
+- **Builtin trust-marker decorators are now trusted only when they resolve to the
+  real exports — closes a spoofable false-green.** The default decorator seeding
+  trusted ANY FQN whose prefix was a builtin marker module and whose final segment
+  was a known marker name, without verifying the decorator resolved to Wardline's
+  real package. A scanned project could ship its own `wardline/decorators/__init__.py`
+  (or `loom_markers/__init__.py`) defining a no-op `trusted`/`trust_boundary`, apply
+  it to a leaky function, and have the analyzer anchor it as TRUSTED — suppressing
+  real taint→sink flows (a false GREEN that hides defects). Nested spoof paths
+  (`wardline.decorators.evil.trusted`, `loom_markers.evil.trusted`) were also accepted.
+  Builtin markers now match ONLY their exact public re-export (`P.<name>`) or
+  implementation-module export (`P.trust.<name>`), and the provider FAILS CLOSED for a
+  builtin marker root the scanned project shadows (defines its own top-level `wardline`
+  / `loom_markers` package). The builtin-root set is derived dynamically from the
+  grammar (`{bt.module_prefix.split('.')[0] for bt in BUILTIN_BOUNDARY_TYPES if
+  bt.builtin}`), so every builtin marker root is covered, not just `wardline`. Custom
+  (non-builtin) grammar markers keep the documented prefix + canonical-name behavior —
+  a project defining its own custom marker package is the intended extension use.
+  **Cache-key hardening:** the per-root shadow state is folded into a shadow-aware
+  provider fingerprint threaded through BOTH the pipeline dirty-detection key and the
+  resolver's summary cache, so a TRUSTED summary computed under one shadow state can
+  never be reused under another (cross-root cache poisoning). The fingerprint stays
+  byte-identical to today's value when nothing is shadowed. **Clarion residual
+  (documented, not threaded):** the opt-in `--clarion-url` taint-fact
+  `content_hash_at_compute` is whole-file raw-byte blake3 only — it cannot observe
+  shadow state, so identical file bytes scanned once unshadowed then under a shadow
+  could serve a stale TRUSTED fact via the MCP `explain_taint` / Clarion read path. The
+  shadow bit is deliberately NOT mixed into this hash because it is a cross-tool
+  contract value Clarion's read path independently recomputes and compares; mixing in a
+  Wardline-private bit would break fact reconciliation entirely. Closing it fully needs
+  a Clarion read-path contract change; the keying site carries an explicit comment. This
+  path is opt-in and not the scan gate, so impact is lower.
 - **Dangerous-sink rules now see lambda bodies (closes a false-green).** `_own_calls`
   treated `ast.Lambda` as a separate scope and only inspected lambda *default*
   expressions, so a sink reached inside a lambda *body* — `cb = lambda: eval(src)`,

diff --git a/src/wardline/clarion/facts.py b/src/wardline/clarion/facts.py
@@ -78,6 +78,19 @@ def build_taint_facts(result: ScanResult, root: Path) -> list[dict[str, Any]]:
         rel_path = entity.location.path
         if rel_path not in hash_cache:
             hash_cache[rel_path] = blake3.blake3(_read_bytes(root / rel_path)).hexdigest()
+        # RESIDUAL (builtin-marker shadow false-green): ``content_hash_at_compute``
+        # is whole-file raw-byte blake3 ONLY — it cannot observe the shadow state of
+        # a builtin marker root. So identical file bytes scanned once UNSHADOWED then
+        # under a project that shadows ``wardline``/``loom_markers`` could serve a
+        # stale TRUSTED fact via the MCP explain_taint / Clarion read path. We do NOT
+        # fold the shadow bit / provider fingerprint into this hash: it is a
+        # CROSS-TOOL contract value — Clarion's read path INDEPENDENTLY recomputes
+        # the whole-file blake3 (clarion_storage::current_file_hash) and compares it
+        # against the in-blob copy. Mixing in a Wardline-private bit would make every
+        # comparison mismatch and break fact reconciliation entirely; there is no
+        # separate Wardline-owned compute-key the freshness gate consults. Closing
+        # this fully needs a Clarion read-path contract change. Lower impact: this
+        # path is opt-in (--clarion-url) and not the scan gate. See CHANGELOG.
         content_hash = hash_cache[rel_path]
 
         declared = context.project_return_taints.get(qualname)

diff --git a/src/wardline/scanner/analyzer.py b/src/wardline/scanner/analyzer.py
@@ -128,18 +128,23 @@ def _analyze_inner(self, files: Sequence[Path], config: WardlineConfig, *, root:
         parse_findings = list(parse_stage.parse_findings)
         dirty_modules = set(parse_stage.dirty_modules)
 
+        # Use the SHADOW-AWARE provider fingerprint computed during the parse stage
+        # for BOTH the dirty-detection key (above, inside the parse stage) AND the
+        # resolver's summary cache here. They MUST agree, or a summary computed under
+        # a non-shadowed root could be served when re-scanning a shadowed one
+        # (cross-root cache poisoning → a spoofed-trust false GREEN survives).
         if self._cache is not None:
             result = resolve_project_taints(
                 modules=modules,
-                provider_fingerprint=self._provider.fingerprint(),
+                provider_fingerprint=parse_stage.provider_fingerprint,
                 summary_cache=self._cache,
                 dirty_modules=frozenset(dirty_modules),
                 config=config,
             )
         else:
             result = resolve_project_taints(
                 modules=modules,
-                provider_fingerprint=self._provider.fingerprint(),
+                provider_fingerprint=parse_stage.provider_fingerprint,
                 config=config,
             )
 

diff --git a/src/wardline/scanner/pipeline.py b/src/wardline/scanner/pipeline.py
@@ -7,7 +7,7 @@
 from collections.abc import Sequence
 from dataclasses import dataclass
 from pathlib import Path
-from typing import TYPE_CHECKING
+from typing import TYPE_CHECKING, Any, cast
 
 from wardline.core.finding import Finding, Kind, Location, Severity
 from wardline.core.qualname import module_dotted_name
@@ -59,6 +59,23 @@ class ParseProjectOutput:
     files: list[ParsedFile]
     parse_findings: list[Finding]
     dirty_modules: frozenset[str]
+    provider_fingerprint: str
+
+
+def _provider_fingerprint_for_project(provider: TaintSourceProvider, project_modules: frozenset[str]) -> str:
+    """Return the project-aware provider fingerprint, else the bare one.
+
+    The hook ``fingerprint_for_project(project_modules)`` is optional and looked
+    up by name, so providers need not implement it. When present and callable it
+    is called with the scan's dotted module names and its result is coerced to
+    ``str``; it lets a provider fold project-shadow state into the cache key so a
+    TRUSTED summary computed unshadowed is not reused for a shadowed re-scan.
+    Otherwise the plain ``provider.fingerprint()`` is returned unchanged.
+    """
+    project_fingerprint = getattr(provider, "fingerprint_for_project", None)
+    if callable(project_fingerprint):
+        typed_project_fingerprint = cast(Any, project_fingerprint)
+        return str(typed_project_fingerprint(project_modules))
+    return provider.fingerprint()
 
 
 def run_parse_project_stage(stage_input: ParseProjectInput) -> ParseProjectOutput:
@@ -69,6 +86,22 @@ def run_parse_project_stage(stage_input: ParseProjectInput) -> ParseProjectOutpu
     dirty_modules: set[str] = set()
     root = stage_input.root.resolve()
 
+    # The set of dotted module names in the scan. Used to fail closed for builtin
+    # markers when the project shadows a builtin marker root, AND to compute the
+    # shadow-aware provider fingerprint threaded into BOTH the dirty-detection key
+    # below and the resolver's summary cache (see analyzer.py).
+    project_modules = frozenset(
+        module
+        for path in stage_input.files
+        if (
+            module := module_dotted_name(
+                path.relative_to(root).as_posix() if path.is_relative_to(root) else path.as_posix()
+            )
+        )
+        is not None
+    )
+    provider_fingerprint = _provider_fingerprint_for_project(stage_input.provider, project_modules)
+
     for path in stage_input.files:
         relpath = path.relative_to(root).as_posix() if path.is_relative_to(root) else path.as_posix()
         module = module_dotted_name(relpath)
@@ -90,7 +123,6 @@ def run_parse_project_stage(stage_input: ParseProjectInput) -> ParseProjectOutpu
             source = path.read_text(encoding="utf-8")
             source_bytes = source.encode("utf-8")
 
-            provider_fingerprint = stage_input.provider.fingerprint()
             from wardline.scanner.taint.project_resolver import _RESOLVER_VERSION
             from wardline.scanner.taint.summary import SUMMARY_SCHEMA_VERSION, compute_cache_key
 
@@ -116,7 +148,7 @@ def run_parse_project_stage(stage_input: ParseProjectInput) -> ParseProjectOutpu
             )
             seeds = seed_function_taints(
                 entities,
-                ctx=SeedContext(module=module, alias_map=alias_map),
+                ctx=SeedContext(module=module, alias_map=alias_map, project_modules=project_modules),
                 provider=stage_input.provider,
             )
             for ent in entities:
@@ -205,6 +237,7 @@ def run_parse_project_stage(stage_input: ParseProjectInput) -> ParseProjectOutpu
         files=parsed_files,
         parse_findings=parse_findings,
         dirty_modules=frozenset(dirty_modules),
+        provider_fingerprint=provider_fingerprint,
     )
 
 

diff --git a/src/wardline/scanner/taint/decorator_provider.py b/src/wardline/scanner/taint/decorator_provider.py
@@ -31,6 +31,15 @@
 _LOOM_MARKERS_PREFIX = "loom_markers"
 _TAINTSTATE_FQN = "wardline.core.taints.TaintState"
 
+# The top-level import roots of every BUILTIN marker module — derived dynamically
+# from the grammar so adding a builtin marker root (e.g. a future ``loom_markers``
+# sibling) automatically participates in shadow fail-closed + exact-export matching.
+# Root = first dotted component of ``module_prefix`` (``wardline.decorators`` ->
+# ``wardline``); types whose ``builtin`` attribute is missing or falsy are excluded.
+_BUILTIN_MARKER_ROOTS: frozenset[str] = frozenset(
+    bt.module_prefix.split(".")[0] for bt in BUILTIN_BOUNDARY_TYPES if getattr(bt, "builtin", False)
+)
+
 
 def vocabulary_star_exports() -> dict[str, dict[str, str]]:
     """Statically-known star-export map for builtin trust-marker modules.
@@ -84,6 +93,38 @@ def _resolve_decorator_fqn(deco: ast.expr, alias_map: Mapping[str, str]) -> str
     return _resolve_dotted_fqn(func, alias_map)
 
 
+def _shadowed_builtin_roots(project_modules: frozenset[str]) -> frozenset[str]:
+    """Return the builtin marker roots the scanned project SHADOWS.
+
+    Builtin marker declarations must refer to the installed marker package, not a
+    module supplied by the scanned project. A root is shadowed when the project
+    itself defines a TOP-LEVEL module/package equal to that root (e.g. its own
+    ``wardline`` or ``loom_markers`` package): Python import resolution can then
+    bind ``wardline.decorators`` / ``loom_markers`` to attacker-controlled code, so
+    builtin matching fails closed for markers under that root.
+
+    The result is ``project_modules``' first dotted components intersected with
+    ``_BUILTIN_MARKER_ROOTS`` (empty when nothing is shadowed), so a nested module
+    such as ``app.wardline_helper`` or ``myloom.wardline`` does NOT trip a shadow.
+    """
+    project_roots = {module.split(".", 1)[0] for module in project_modules}
+    return frozenset(project_roots & _BUILTIN_MARKER_ROOTS)
+
+
+def _is_builtin_decorator_fqn(fqn: str, canonical_name: str, module_prefix: str) -> bool:
+    """Return whether *fqn* is one of the exact builtin decorator exports.
+
+    With ``P = module_prefix`` and ``<name> = canonical_name``, only the public
+    re-export ``P.<name>`` and the implementation-module export ``P.trust.<name>``
+    match, by exact string equality (mirroring ``wardline/decorators/__init__.py``
+    and ``wardline/decorators/trust.py``). Prefix + arbitrary-nested + final-segment
+    paths (e.g. ``wardline.decorators.evil.trusted``) are rejected for builtins.
+    """
+    return fqn in {
+        f"{module_prefix}.{canonical_name}",
+        f"{module_prefix}.trust.{canonical_name}",
+    }
+
+
 def _level_token(value: ast.expr, alias_map: Mapping[str, str]) -> str | None:
     """Extract a TaintState name token from a keyword-argument value node.
 
@@ -184,8 +225,9 @@ def __init__(self, *, boundary_types: tuple[BoundaryType, ...] | None = None) ->
     def taint_for(self, entity: Entity, ctx: SeedContext) -> SeedResult:
         candidates: list[FunctionTaint] = []
         unprovable: list[str] = []
+        shadowed_roots = _shadowed_builtin_roots(ctx.project_modules)
         for deco in entity.node.decorator_list:
-            ft, unprov = self._match(deco, ctx.alias_map)
+            ft, unprov = self._match(deco, ctx.alias_map, shadowed_roots)
             if ft is not None:
                 candidates.append(ft)
             elif unprov is not None:
@@ -219,7 +261,30 @@ def fingerprint(self) -> str:
             return f"decorator-vocab:{REGISTRY_VERSION}"
         return f"decorator-vocab:{REGISTRY_VERSION}+grammar:{_grammar_digest(self._boundary_types)}"
 
-    def _match(self, deco: ast.expr, alias_map: Mapping[str, str]) -> tuple[FunctionTaint | None, str | None]:
+    def fingerprint_for_project(self, project_modules: frozenset[str]) -> str:
+        """Return :meth:`fingerprint` extended with the project's shadow state.
+
+        Builtin seeding depends on WHICH builtin marker roots the scanned project
+        shadows; bind the EXACT shadowed-root SET into the summary-cache key so a
+        warm cache cannot reuse a TRUSTED summary across scans with different
+        shadow states (cross-root cache poisoning). The roots are sorted and
+        comma-joined into a ``:shadowed-roots=...`` suffix, so shadowing only
+        ``wardline`` and shadowing only ``loom_markers`` yield different keys. When
+        nothing is shadowed (the common case), returns the bare :meth:`fingerprint`
+        string, preserving today's exact cache/baseline-stable value.
+        """
+        shadowed = _shadowed_builtin_roots(project_modules)
+        base = self.fingerprint()
+        if not shadowed:
+            return base
+        return f"{base}:shadowed-roots={','.join(sorted(shadowed))}"
+
+    def _match(
+        self,
+        deco: ast.expr,
+        alias_map: Mapping[str, str],
+        shadowed_roots: frozenset[str],
+    ) -> tuple[FunctionTaint | None, str | None]:
         """Match one decorator against the loaded boundary types. Returns:
 
         ``(seed, None)``   — a boundary type matched and its levels proved;
@@ -231,15 +296,22 @@ def _match(self, deco: ast.expr, alias_map: Mapping[str, str]) -> tuple[Function
         fqn = _resolve_decorator_fqn(deco, alias_map)
         if fqn is None:
             return None, None
-        # A decorator matches a boundary type when its FQN is UNDER the type's module
-        # prefix and its final segment is the canonical name. This accepts BOTH the
-        # package re-export (``wardline.decorators.trusted``) and the submodule path
-        # (``wardline.decorators.trust.trusted``) — preserving the pre-Track-2 matcher
-        # exactly (it used the same prefix + last-segment rule), and generalizing it
-        # consistently for custom types.
+        # Builtin markers are security-sensitive defaults: a scanned project could
+        # ship its own ``wardline/decorators`` (or ``loom_markers``) no-op shadowing
+        # the real package, spoof @trusted, and suppress real taint→sink flows (a
+        # false GREEN). So a builtin matches ONLY an EXACT known export
+        # (``P.<name>`` or ``P.trust.<name>``), and is rejected entirely when its
+        # marker ROOT is shadowed by a project-local top-level module. Custom
+        # (non-builtin) grammar markers keep the documented prefix + canonical-name
+        # rule — a project defining its OWN custom marker package is the intended
+        # extension use, and its root is not a builtin we ship.
         last = fqn.rsplit(".", 1)[-1]
         for bt in self._boundary_types:
-            if last != bt.canonical_name or not fqn.startswith(bt.module_prefix + "."):
+            if bt.builtin:
+                root = bt.module_prefix.split(".")[0]
+                if root in shadowed_roots or not _is_builtin_decorator_fqn(fqn, bt.canonical_name, bt.module_prefix):
+                    continue
+            elif last != bt.canonical_name or not fqn.startswith(bt.module_prefix + "."):
                 continue
             levels: dict[str, TaintState] = {}
             unreadable = False

diff --git a/src/wardline/scanner/taint/provider.py b/src/wardline/scanner/taint/provider.py
@@ -30,13 +30,17 @@ class SeedContext:
 
     ``alias_map`` is the file's ``{local_name: fully_qualified_name}`` import
     map (from ``build_import_alias_map``); a provider uses it to resolve aliased
-    decorator names against the trust vocabulary. Defaults to empty so callers
-    that do not seed from decorators (e.g. the trivial default provider's tests)
-    need not supply it.
+    decorator names against the trust vocabulary. ``project_modules`` is the set of
+    dotted module names discovered in the scanned project; a provider uses it to
+    fail closed for BUILTIN markers when the project shadows a builtin marker root
+    (e.g. ships its own ``wardline``/``loom_markers`` package). Both default to
+    empty so callers that do not seed from decorators (e.g. the trivial default
+    provider's tests) need not supply them.
     """
 
     module: str
     alias_map: Mapping[str, str] = field(default_factory=dict)
+    project_modules: frozenset[str] = field(default_factory=frozenset)
 
 
 @dataclass(frozen=True, slots=True)