kgdunn · kgdunn · Jun 30, 2026 · Jun 30, 2026 · Jun 30, 2026
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -11,6 +11,21 @@ those changes.
 
 ## [Unreleased]
 
+## [1.51.0] - 2026-06-30
+
+### Added
+
+- A reusable analysis-recipe framework (`process_improve.recipes`): frozen
+  `RecipeStep` / `AnalysisRecipe` dataclasses, a `register_recipe` registry with
+  lazy `discover_recipes`, a substring matcher `select_recipe`, and a general
+  `select_analysis_recipe` agent tool that maps a free-text request to a guided,
+  step-by-step workflow chaining existing tools. Any subpackage can register its
+  own recipes.
+- Sensory analysis recipes (`process_improve.sensory.recipes`): guided workflows
+  for data intake, panel consistency / scale-use correction, and relating
+  attributes to product covariates (with the genuine / proxy / coincidence
+  separation), plus a parked placeholder for a future visualisation workflow.
+
 ## [1.50.0] - 2026-06-30
 
 ### Added
@@ -2282,7 +2297,8 @@ this entry records them together.
 - Reworked the README with a sharper value proposition and a
   "Why not scikit-learn?" comparison table.
 
-[Unreleased]: https://github.com/kgdunn/process-improve/compare/v1.50.0...HEAD
+[Unreleased]: https://github.com/kgdunn/process-improve/compare/v1.51.0...HEAD
+[1.51.0]: https://github.com/kgdunn/process-improve/compare/v1.50.0...v1.51.0
 [1.50.0]: https://github.com/kgdunn/process-improve/compare/v1.49.1...v1.50.0
 [1.49.1]: https://github.com/kgdunn/process-improve/compare/v1.49.0...v1.49.1
 [1.49.0]: https://github.com/kgdunn/process-improve/compare/v1.48.0...v1.49.0

diff --git a/CITATION.cff b/CITATION.cff
@@ -12,7 +12,7 @@ authors:
 repository-code: "https://github.com/kgdunn/process-improve"
 url: "https://kgdunn.github.io/process-improve/"
 license: MIT
-version: 1.50.0
+version: 1.51.0
 date-released: "2026-06-30"
 keywords:
   - chemometrics

diff --git a/pyproject.toml b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "process-improve"
-version = "1.50.0"
+version = "1.51.0"
 description = 'Designed Experiments; Latent Variables (PCA, PLS, multivariate methods with missing data); Process Monitoring; Batch data analysis.'
 readme = "README.md"
 license = "MIT"

diff --git a/src/process_improve/recipes.py b/src/process_improve/recipes.py
@@ -0,0 +1,294 @@
+"""(c) Kevin Dunn, 2010-2026. MIT License.
+
+Reusable analysis-recipe framework.
+
+An *analysis recipe* is a predefined, step-by-step workflow an LLM agent can
+follow when a user's request matches a known analytical scenario (intake,
+panel processing, relating to covariates, ...). Recipes reference existing agent
+tools by name so the agent chains calls deterministically instead of improvising
+the order.
+
+The framework is package-wide and domain-agnostic: any subpackage may define its
+own recipes and register them. The sensory subpackage is the first consumer (see
+:mod:`process_improve.sensory.recipes`).
+
+Adding recipes for a subpackage
+-------------------------------
+1. Create ``process_improve/<subpackage>/recipes.py``.
+2. Build :class:`AnalysisRecipe` instances and pass each to
+   :func:`register_recipe`.
+3. Add ``"process_improve.<subpackage>.recipes"`` to ``_RECIPE_MODULES`` below so
+   :func:`discover_recipes` imports it.
+
+No changes to the agent tool layer are required: the single, general
+``select_analysis_recipe`` tool matches across every registered recipe.
+"""
+
+from __future__ import annotations
+
+import importlib
+import logging
+import re
+from dataclasses import dataclass, field
+from typing import Any
+
+from pydantic import BaseModel, ConfigDict, Field
+
+from process_improve.tool_spec import clean, tool_spec
+
+logger = logging.getLogger(__name__)
+
+# ---------------------------------------------------------------------------
+# Data structures
+# ---------------------------------------------------------------------------
+
+
+@dataclass(frozen=True)
+class RecipeStep:
+    """One step in an analysis recipe the agent should execute.
+
+    Attributes
+    ----------
+    order : int
+        1-based position of the step in the recipe.
+    directive : str
+        Natural-language instruction telling the agent what to do.
+    tools : list of str
+        Names of agent tools this step may call (empty for prose-only steps
+        such as interpretation or data assembly).
+    arg_hints : dict
+        Optional ``{parameter: "where the value comes from"}`` hints, for
+        example ``{"score_min": "0", "mode": "observational"}``.
+    """
+
+    order: int
+    directive: str
+    tools: list[str] = field(default_factory=list)
+    arg_hints: dict[str, str] = field(default_factory=dict)
+
+
+@dataclass(frozen=True)
+class AnalysisRecipe:
+    """A reusable, multi-step analysis workflow for the agent.
+
+    Attributes
+    ----------
+    key : str
+        Unique snake_case identifier.
+    title : str
+        Human-readable name.
+    summary : str
+        One-paragraph description of what the recipe does and when to use it.
+    domain : str
+        The subpackage the recipe belongs to (e.g. ``"sensory"``).
+    cue_phrases : list of str
+        Lower-case substrings; each one found in a user's request scores the
+        recipe one point during matching.
+    inputs_needed : list of str
+        What the agent must resolve from the user before running, each with a
+        short example.
+    stages : list of RecipeStep
+        The ordered steps. Empty for a planned (not yet available) recipe.
+    status : str
+        ``"available"`` (default) or ``"planned"`` for parked future work.
+    """
+
+    key: str
+    title: str
+    summary: str
+    domain: str
+    cue_phrases: list[str]
+    inputs_needed: list[str]
+    stages: list[RecipeStep]
+    status: str = "available"
+
+    def to_payload(self) -> dict[str, Any]:
+        """Serialise to a JSON-friendly dict the agent can consume."""
+        payload: dict[str, Any] = {
+            "recipe_key": self.key,
+            "title": self.title,
+            "summary": self.summary,
+            "domain": self.domain,
+            "status": self.status,
+            "inputs_needed": self.inputs_needed,
+            "stages": [
+                {
+                    "step": s.order,
+                    "directive": s.directive,
+                    **({"tools": s.tools} if s.tools else {}),
+                    **({"arg_hints": s.arg_hints} if s.arg_hints else {}),
+                }
+                for s in self.stages
+            ],
+        }
+        if self.status != "available":
+            payload["note"] = (
+                "This recipe is planned and not yet runnable; tell the user the workflow is "
+                "coming rather than attempting it."
+            )
+        return payload
+
+
+# ---------------------------------------------------------------------------
+# Registry and discovery (mirrors process_improve.tool_spec)
+# ---------------------------------------------------------------------------
+
+#: Maps recipe key -> registered recipe. Populated by ``register_recipe``.
+_RECIPE_REGISTRY: dict[str, AnalysisRecipe] = {}
+
+#: Whether ``discover_recipes()`` has already run.
+_recipes_discovered: bool = False
+
+#: Subpackage recipe modules imported by ``discover_recipes``. Append new
+#: ``process_improve.<subpackage>.recipes`` modules here as they are added.
+_RECIPE_MODULES: list[str] = [
+    "process_improve.sensory.recipes",
+]
+
+
+def register_recipe(recipe: AnalysisRecipe) -> AnalysisRecipe:
+    """Register *recipe* in the global catalog and return it.
+
+    Raises
+    ------
+    ValueError
+        If a recipe with the same ``key`` is already registered.
+    """
+    if recipe.key in _RECIPE_REGISTRY:
+        raise ValueError(f"A recipe with key {recipe.key!r} is already registered.")
+    _RECIPE_REGISTRY[recipe.key] = recipe
+    return recipe
+
+
+def _import_recipe_module(module: str) -> None:
+    """Import one subpackage recipe module, tolerating a missing dependency."""
+    try:
+        importlib.import_module(module)
+    except ModuleNotFoundError as exc:
+        logger.warning("Recipe module %r not loaded (missing dependency): %s", module, exc)
+
+
+def discover_recipes() -> None:
+    """Import every subpackage recipe module to populate the registry.
+
+    Called lazily by the public query helpers. Safe to call repeatedly
+    (subsequent calls are no-ops). A genuinely missing module is logged rather
+    than raised, mirroring :func:`process_improve.tool_spec.discover_tools`.
+    """
+    global _recipes_discovered  # noqa: PLW0603
+    if _recipes_discovered:
+        return
+    for module in _RECIPE_MODULES:
+        _import_recipe_module(module)
+    _recipes_discovered = True
+
+
+# ---------------------------------------------------------------------------
+# Matching
+# ---------------------------------------------------------------------------
+
+_WORD_PATTERN = re.compile(r"\w+")
+
+
+def _canonicalise(text: str) -> str:
+    """Lower-case and collapse to single-spaced word tokens."""
+    return " ".join(_WORD_PATTERN.findall(text.lower()))
+
+
+def select_recipe(query: str) -> AnalysisRecipe | None:
+    """Return the best-matching recipe for *query*, or ``None``.
+
+    Scoring is intentionally simple: each cue phrase that appears as a substring
+    of the canonicalised query contributes one point. The highest-scoring recipe
+    wins (ties broken by registration order); a minimum score of one is required
+    to match. Replace with embedding similarity if the catalog grows beyond a few
+    dozen recipes.
+    """
+    discover_recipes()
+    canonical = _canonicalise(query)
+    best: AnalysisRecipe | None = None
+    best_score = 0
+    for recipe in _RECIPE_REGISTRY.values():
+        score = sum(1 for phrase in recipe.cue_phrases if _canonicalise(phrase) in canonical)
+        if score > best_score:
+            best_score = score
+            best = recipe
+    return best
+
+
+def list_recipes() -> list[AnalysisRecipe]:
+    """Return every registered recipe (registration order)."""
+    discover_recipes()
+    return list(_RECIPE_REGISTRY.values())
+
+
+def get_recipe(key: str) -> AnalysisRecipe | None:
+    """Return the registered recipe with *key*, or ``None``."""
+    discover_recipes()
+    return _RECIPE_REGISTRY.get(key)
+
+
+# ---------------------------------------------------------------------------
+# Agent tool
+# ---------------------------------------------------------------------------
+
+
+class _RecipeQuery(BaseModel):
+    """Input contract for ``select_analysis_recipe``."""
+
+    model_config = ConfigDict(extra="forbid")
+
+    query: str = Field(
+        ...,
+        min_length=1,
+        description="The user's request in natural language; the best-matching analysis recipe is returned.",
+    )
+
+
+@tool_spec(
+    name="select_analysis_recipe",
+    description=(
+        "Match a free-text request to a predefined, step-by-step analysis recipe (a guided workflow that "
+        "chains existing process-improve tools in the right order). Use this first when a user asks an "
+        "open-ended 'how do I analyse this' question, then follow the returned stages. "
+        "Returns: {ok: true, matched: bool, recipe, available}. 'recipe' is the matched recipe payload "
+        "(recipe_key, title, summary, domain, status, inputs_needed, and ordered 'stages' each with a "
+        "directive plus optional tools/arg_hints; a planned recipe also carries a 'note') or null when "
+        "nothing matches. 'available' always lists every registered recipe as {recipe_key, title, "
+        "summary, domain, status} so you can offer a choice even when matched is false."
+    ),
+    input_model=_RecipeQuery,
+    category="recipes",
+)
+def select_analysis_recipe(spec: _RecipeQuery) -> dict:
+    """Return the best-matching recipe payload plus the full catalogue."""
+    match = select_recipe(spec.query)
+    available = [
+        {
+            "recipe_key": r.key,
+            "title": r.title,
+            "summary": r.summary,
+            "domain": r.domain,
+            "status": r.status,
+        }
+        for r in list_recipes()
+    ]
+    return clean(
+        {
+            "ok": True,
+            "matched": match is not None,
+            "recipe": match.to_payload() if match is not None else None,
+            "available": available,
+        }
+    )
+
+
+__all__ = [
+    "AnalysisRecipe",
+    "RecipeStep",
+    "get_recipe",
+    "list_recipes",
+    "register_recipe",
+    "select_analysis_recipe",
+    "select_recipe",
+]
diff --git a/src/process_improve/sensory/__init__.py b/src/process_improve/sensory/__init__.py
@@ -27,6 +27,7 @@
 from process_improve.sensory.ingest import reshape_to_long
 from process_improve.sensory.mam import MAMResult, align_scores, mixed_assessor_model
 from process_improve.sensory.panel import PanelScorecard, apply_correction, panel_scorecard
+from process_improve.sensory.recipes import SENSORY_RECIPES
 from process_improve.sensory.validation import (
     DESCRIPTIVE_LONG_COLUMNS,
     ValidationResult,
@@ -35,6 +36,7 @@
 
 __all__ = [
     "DESCRIPTIVE_LONG_COLUMNS",
+    "SENSORY_RECIPES",
     "AnalysisResult",
     "MAMResult",
     "PanelScorecard",