diff --git a/docs/settings.md b/docs/settings.md
index 360ee6ae..0d595a3d 100644
--- a/docs/settings.md
+++ b/docs/settings.md
@@ -2,6 +2,25 @@
 
 CAO stores user configuration in `~/.aws/cli-agent-orchestrator/settings.json`. This file is managed by the settings service and can be edited via the Web UI Settings page or the REST API.
 
+## CAO State Directory
+
+By default, CAO stores its state under `~/.aws/cli-agent-orchestrator`. This
+directory contains the database, logs, installed agent profiles, skills, and
+settings file.
+
+For isolated development, CI, or local smoke tests, set `CAO_HOME_DIR` before
+starting `cao-server` or running `cao` commands:
+
+```bash
+export CAO_HOME_DIR=/tmp/cao-sandbox
+cao-server
+```
+
+When `CAO_HOME_DIR` is set, CAO derives its internal state paths from that
+directory, including `db/`, `logs/`, `agent-store/`, `agent-context/`, and
+`skills/`. The value is expanded with `~` support but is otherwise used as
+provided, so prefer an absolute path for reproducible runs.
+
 ## Agent Profile Directories
 
 CAO discovers agent profiles by scanning multiple directories. When loading or listing profiles, directories are scanned in this order (first match wins):
diff --git a/src/cli_agent_orchestrator/constants.py b/src/cli_agent_orchestrator/constants.py
index 5f5b5c5a..0058d6ca 100644
--- a/src/cli_agent_orchestrator/constants.py
+++ b/src/cli_agent_orchestrator/constants.py
@@ -39,8 +39,11 @@
 # =============================================================================
 # Application Directory Structure
 # =============================================================================
-# Base directory for all CAO data (~/.aws/cli-agent-orchestrator)
-CAO_HOME_DIR = Path.home() / ".aws" / "cli-agent-orchestrator"
+# Base directory for all CAO data (~/.aws/cli-agent-orchestrator).
+# The CAO_HOME_DIR override is useful for isolated/local pilot runs.
+CAO_HOME_DIR = Path(
+    os.environ.get("CAO_HOME_DIR", str(Path.home() / ".aws" / "cli-agent-orchestrator"))
+).expanduser()
 
 # Managed environment variable file
 CAO_ENV_FILE = CAO_HOME_DIR / ".env"
diff --git a/src/cli_agent_orchestrator/providers/codex.py b/src/cli_agent_orchestrator/providers/codex.py
index 0128aff0..dcfa7c42 100644
--- a/src/cli_agent_orchestrator/providers/codex.py
+++ b/src/cli_agent_orchestrator/providers/codex.py
@@ -31,7 +31,7 @@
 IDLE_PROMPT_PATTERN_LOG = r"\? for shortcuts"
 # Match assistant response start: "assistant:/codex:/agent:" (label style from synthetic
 # test fixtures) or "•" bullet point (real Codex interactive output format).
-ASSISTANT_PREFIX_PATTERN = r"^(?:(?:assistant|codex|agent)\s*:|\s*•)"
+ASSISTANT_PREFIX_PATTERN = r"^(?:(?:assistant|codex|agent)\s*:|[^\S\n]*•)"
 # Match user input: "You ..." (label style) or "› text" (Codex interactive prompt).
 # The "›[^\S\n]*\S" alternative requires a non-whitespace character on the same line
 # to distinguish user input ("› what is your role?") from the empty idle prompt ("› ").
@@ -50,7 +50,15 @@
 # Used to detect when the bottom lines contain TUI chrome rather than user input.
 # v0.110 and earlier: "? for shortcuts" and "N% context left"
 # v0.111+: "model · N% left · path" (PR #13202 restored draft footer hints)
-TUI_FOOTER_PATTERN = r"(?:\?\s+for shortcuts|context left|\d+%\s+left)"
+# Current Codex builds may also render "gpt-5.5 xhigh · /path" without a
+# context percentage.
+TUI_FOOTER_PATTERN = (
+    r"^\s*(?:"
+    r"\?\s+for shortcuts(?:.*(?:\d+%\s+)?context left)?"
+    r"|\d+%\s+context left"
+    r"|(?:gpt|o)\S*(?:\s+[\w.-]+)*\s+·\s+(?:(?:\d+%\s+left)\s+·\s+)?(?:~|/).*"
+    r")\s*$"
+)
 # Codex TUI progress spinner: "• Working (0s • esc to interrupt)",
 # "• Thinking (2s ...)", "• Starting script creation (10s • esc to interrupt)".
 # The prefix text varies but the "(Ns • esc to interrupt)" format is consistent.
@@ -59,6 +67,16 @@
 # ASSISTANT_PREFIX_PATTERN and the TUI footer › matches idle prompt).
 TUI_PROGRESS_PATTERN = r"•.*\(\d+s\s*•\s*esc to interrupt\)"
 
+# Codex's TUI also renders tool activity as bullet rows. These are not final
+# assistant responses and must not complete handoff or become extracted output.
+TUI_ACTIVITY_PATTERN = (
+    r"^•\s+(?:"
+    r"Explored|Ran|Read|Edited|Viewed|Searched|Listed|Opened|Calling|Called|"
+    r"Working|Thinking|Updated(?:\s+Plan)?|Applied|Patched|Wrote|Created|"
+    r"Deleted|Moved|Copied"
+    r")\b.*$"
+)
+
 # Workspace trust/approval prompt shown when Codex opens a new directory
 TRUST_PROMPT_PATTERN = r"allow Codex to work in this folder"
 # Codex welcome banner indicating normal startup (no trust prompt)
@@ -104,6 +122,65 @@ def _compute_tui_footer_cutoff(all_lines: list) -> int:
     return len("\n".join(all_lines[:footer_start_idx]))
 
 
+def _assistant_response_matches(text: str) -> list[re.Match]:
+    """Return assistant markers that are response starts, not TUI activity rows."""
+    matches = []
+    for match in re.finditer(ASSISTANT_PREFIX_PATTERN, text, re.IGNORECASE | re.MULTILINE):
+        line_end = text.find("\n", match.start())
+        if line_end == -1:
+            line_end = len(text)
+        line = text[match.start() : line_end]
+        if re.match(TUI_PROGRESS_PATTERN, line):
+            continue
+        if _is_tui_activity_match(text, match.start()):
+            continue
+        matches.append(match)
+    return matches
+
+
+def _is_tui_activity_match(text: str, start_pos: int) -> bool:
+    """Return whether a bullet at start_pos is a Codex TUI activity row.
+
+    Activity rows are top-level bullets such as "• Ran pwd" followed by a
+    Codex-rendered tree/details line ("  └ ..."). Requiring the details line
+    prevents normal answer bullets like "  • Ran tests" or "• Ran tests
+    successfully" from being filtered out.
+    """
+    line_end = text.find("\n", start_pos)
+    if line_end == -1:
+        line_end = len(text)
+    line = text[start_pos:line_end]
+    if not re.match(TUI_ACTIVITY_PATTERN, line):
+        return False
+
+    rest = text[line_end + 1 :]
+    for next_line in rest.splitlines():
+        if not next_line.strip():
+            continue
+        return bool(re.match(r"[^\S\n]+└\s+", next_line))
+
+    return False
+
+
+def _tui_activity_matches(text: str) -> list[re.Match]:
+    """Return TUI activity row matches, excluding normal answer bullets."""
+    return [
+        match
+        for match in re.finditer(TUI_ACTIVITY_PATTERN, text, re.MULTILINE)
+        if _is_tui_activity_match(text, match.start())
+    ]
+
+
+def _last_tui_activity_or_progress_end(text: str) -> int:
+    """Return the end offset of the last Codex TUI activity/progress row."""
+    last_end = 0
+    for match in re.finditer(TUI_PROGRESS_PATTERN, text, re.MULTILINE):
+        last_end = max(last_end, match.end())
+    for match in _tui_activity_matches(text):
+        last_end = max(last_end, match.end())
+    return last_end
+
+
 class ProviderError(Exception):
     """Exception raised for provider-specific errors."""
 
@@ -233,7 +310,13 @@ def _handle_trust_prompt(self, timeout: float = 20.0) -> None:
             if re.search(TRUST_PROMPT_PATTERN, clean_output):
                 logger.info("Codex workspace trust prompt detected, auto-accepting")
                 session = tmux_client.server.sessions.get(session_name=self.session_name)
+                if session is None:
+                    logger.warning("Codex trust prompt detected but tmux session was not found")
+                    return
                 window = session.windows.get(window_name=self.window_name)
+                if window is None:
+                    logger.warning("Codex trust prompt detected but tmux window was not found")
+                    return
                 pane = window.active_pane
                 if pane:
                     pane.send_keys("", enter=True)
@@ -311,13 +394,18 @@ def get_status(self, tail_lines: Optional[int] = None) -> TerminalStatus:
             if match.start() < cutoff_pos:
                 last_user = match
 
-        output_after_last_user = clean_output[last_user.start() :] if last_user else clean_output
+        analysis_output = clean_output[:cutoff_pos]
+        output_after_last_user = (
+            analysis_output[last_user.start() :] if last_user else analysis_output
+        )
+        assistant_matches_after_last_user = (
+            _assistant_response_matches(output_after_last_user) if last_user else []
+        )
+        last_activity_end = _last_tui_activity_or_progress_end(output_after_last_user)
         assistant_after_last_user = bool(
             last_user
-            and re.search(
-                ASSISTANT_PREFIX_PATTERN,
-                output_after_last_user,
-                re.IGNORECASE | re.MULTILINE,
+            and any(
+                match.start() >= last_activity_end for match in assistant_matches_after_last_user
             )
         )
 
@@ -360,17 +448,23 @@ def get_status(self, tail_lines: Optional[int] = None) -> TerminalStatus:
             # With --no-alt-screen, the TUI footer (› hint + status bar) is always
             # rendered at the bottom, even during processing. The • in the progress
             # spinner matches ASSISTANT_PREFIX_PATTERN, causing a false COMPLETED.
-            # Detect the spinner and return PROCESSING before checking for COMPLETED.
-            if re.search(TUI_PROGRESS_PATTERN, tail_output, re.MULTILINE):
-                return TerminalStatus.PROCESSING
+            # Treat the spinner as active only when it is the newest assistant-like
+            # marker after the last user input. Codex can leave stale spinner lines
+            # in scrollback after the final answer is rendered.
+            progress_region = output_after_last_user if last_user is not None else tail_output
+            progress_matches = list(
+                re.finditer(TUI_PROGRESS_PATTERN, progress_region, re.MULTILINE)
+            )
+            if progress_matches:
+                assistant_matches = _assistant_response_matches(progress_region)
+                last_progress_start = progress_matches[-1].start()
+                last_assistant_start = assistant_matches[-1].start() if assistant_matches else -1
+                if last_assistant_start <= last_progress_start:
+                    return TerminalStatus.PROCESSING
 
             # Consider COMPLETED only if we see an assistant marker after the last user message.
             if last_user is not None:
-                if re.search(
-                    ASSISTANT_PREFIX_PATTERN,
-                    clean_output[last_user.start() :],
-                    re.IGNORECASE | re.MULTILINE,
-                ):
+                if assistant_after_last_user:
                     return TerminalStatus.COMPLETED
 
                 return TerminalStatus.IDLE
@@ -417,56 +511,71 @@ def extract_last_message_from_script(self, script_output: str) -> str:
 
         if user_matches:
             last_user = user_matches[-1]
+            response_search_start = last_user.start()
+
+            # If Codex left stale TUI progress spinners in scrollback, begin
+            # searching for the final response after the latest spinner.
+            progress_matches = list(
+                re.finditer(
+                    TUI_PROGRESS_PATTERN,
+                    clean_output[response_search_start:cutoff_pos],
+                    re.MULTILINE,
+                )
+            )
+            activity_matches = list(
+                _tui_activity_matches(clean_output[response_search_start:cutoff_pos])
+            )
+            chrome_matches = progress_matches + activity_matches
+            if chrome_matches:
+                response_search_start += max(match.end() for match in chrome_matches)
 
             # Find the first assistant response marker (• or assistant:) after
             # the user message. This correctly skips multi-line user messages
             # that wrap across several lines in the Codex TUI.
-            asst_after_user = re.search(
-                ASSISTANT_PREFIX_PATTERN,
-                clean_output[last_user.start() :],
-                re.IGNORECASE | re.MULTILINE,
-            )
-            if asst_after_user:
-                response_start = last_user.start() + asst_after_user.start()
-            else:
+            response_region = clean_output[response_search_start:cutoff_pos]
+            asst_matches = _assistant_response_matches(response_region)
+            if asst_matches:
+                response_start = response_search_start + asst_matches[0].start()
+            elif not tui_footer_detected and not _tui_activity_matches(response_region):
                 # No assistant marker found; fall back to skipping one line
                 user_line_end = clean_output.find("\n", last_user.start())
                 if user_line_end == -1:
                     user_line_end = len(clean_output)
                 response_start = user_line_end + 1
-
-            # Find extraction boundary: empty idle prompt or TUI footer area.
-            # With --no-alt-screen, the TUI footer (› hint + status bar) has no
-            # empty idle prompt. Use cutoff_pos as the boundary when TUI is present.
-            idle_after = re.search(
-                IDLE_PROMPT_STRICT_PATTERN,
-                clean_output[response_start:],
-                re.MULTILINE,
-            )
-            if idle_after:
-                end_pos = response_start + idle_after.start()
-            elif tui_footer_detected:
-                end_pos = cutoff_pos
             else:
-                end_pos = len(clean_output)
-
-            response_text = clean_output[response_start:end_pos].strip()
-
-            if response_text:
-                # Strip "assistant:" prefix if present (label format)
-                response_text = re.sub(
-                    r"^(?:assistant|codex|agent)\s*:\s*",
-                    "",
-                    response_text,
-                    count=1,
-                    flags=re.IGNORECASE,
+                response_start = None
+
+            if response_start is not None:
+                # Find extraction boundary: empty idle prompt or TUI footer area.
+                # With --no-alt-screen, the TUI footer (› hint + status bar) has no
+                # empty idle prompt. Use cutoff_pos as the boundary when TUI is present.
+                idle_after = re.search(
+                    IDLE_PROMPT_STRICT_PATTERN,
+                    clean_output[response_start:],
+                    re.MULTILINE,
                 )
-                return response_text.strip()
+                if idle_after:
+                    end_pos = response_start + idle_after.start()
+                elif tui_footer_detected:
+                    end_pos = cutoff_pos
+                else:
+                    end_pos = len(clean_output)
+
+                response_text = clean_output[response_start:end_pos].strip()
+
+                if response_text:
+                    # Strip "assistant:" prefix if present (label format)
+                    response_text = re.sub(
+                        r"^(?:assistant|codex|agent)\s*:\s*",
+                        "",
+                        response_text,
+                        count=1,
+                        flags=re.IGNORECASE,
+                    )
+                    return response_text.strip()
 
         # Fallback: assistant marker based extraction (no user message found).
-        matches = list(
-            re.finditer(ASSISTANT_PREFIX_PATTERN, clean_output, re.IGNORECASE | re.MULTILINE)
-        )
+        matches = _assistant_response_matches(clean_output)
 
         if not matches:
             raise ValueError("No Codex response found - no assistant marker detected")
diff --git a/src/cli_agent_orchestrator/services/settings_service.py b/src/cli_agent_orchestrator/services/settings_service.py
index 61c01a3e..ad398659 100644
--- a/src/cli_agent_orchestrator/services/settings_service.py
+++ b/src/cli_agent_orchestrator/services/settings_service.py
@@ -3,9 +3,9 @@
 import json
 import logging
 from pathlib import Path
-from typing import Any, Dict, List, Optional
+from typing import Any, Dict, List, cast
 
-from cli_agent_orchestrator.constants import CAO_HOME_DIR
+from cli_agent_orchestrator.constants import AGENT_CONTEXT_DIR, CAO_HOME_DIR, LOCAL_AGENT_STORE_DIR
 
 logger = logging.getLogger(__name__)
 
@@ -15,9 +15,9 @@
 _DEFAULTS = {
     "kiro_cli": str(Path.home() / ".kiro" / "agents"),
     "q_cli": str(Path.home() / ".aws" / "amazonq" / "cli-agents"),
-    "claude_code": str(Path.home() / ".aws" / "cli-agent-orchestrator" / "agent-store"),
-    "codex": str(Path.home() / ".aws" / "cli-agent-orchestrator" / "agent-store"),
-    "cao_installed": str(Path.home() / ".aws" / "cli-agent-orchestrator" / "agent-context"),
+    "claude_code": str(LOCAL_AGENT_STORE_DIR),
+    "codex": str(LOCAL_AGENT_STORE_DIR),
+    "cao_installed": str(AGENT_CONTEXT_DIR),
 }
 
 
@@ -25,7 +25,10 @@ def _load() -> Dict[str, Any]:
     """Load settings from disk."""
     if SETTINGS_FILE.exists():
         try:
-            return json.loads(SETTINGS_FILE.read_text())
+            data = json.loads(SETTINGS_FILE.read_text())
+            if isinstance(data, dict):
+                return cast(Dict[str, Any], data)
+            logger.warning("Settings file did not contain a JSON object")
         except Exception as e:
             logger.warning(f"Failed to read settings: {e}")
     return {}
@@ -67,12 +70,16 @@ def set_agent_dirs(dirs: Dict[str, str]) -> Dict[str, str]:
 def get_extra_agent_dirs() -> List[str]:
     """Get extra agent scan directories (user-added custom paths)."""
     settings = _load()
-    return settings.get("extra_agent_dirs", [])
+    extra_dirs = settings.get("extra_agent_dirs", [])
+    if not isinstance(extra_dirs, list):
+        return []
+    return [str(path) for path in extra_dirs]
 
 
 def set_extra_agent_dirs(dirs: List[str]) -> List[str]:
     """Set extra agent scan directories."""
     settings = _load()
-    settings["extra_agent_dirs"] = [d for d in dirs if d.strip()]
+    extra_dirs = [d for d in dirs if d.strip()]
+    settings["extra_agent_dirs"] = extra_dirs
     _save(settings)
-    return settings["extra_agent_dirs"]
+    return extra_dirs
diff --git a/test/providers/test_codex_provider_unit.py b/test/providers/test_codex_provider_unit.py
index aa61746f..db1ae8d7 100644
--- a/test/providers/test_codex_provider_unit.py
+++ b/test/providers/test_codex_provider_unit.py
@@ -775,6 +775,152 @@ def test_get_status_processing_v0111_spinner(self, mock_tmux):
 
         assert status == TerminalStatus.PROCESSING
 
+    @patch("cli_agent_orchestrator.providers.codex.tmux_client")
+    def test_get_status_completed_v0111_with_stale_spinner(self, mock_tmux):
+        """COMPLETED when stale spinner remains before the final answer."""
+        mock_tmux.get_history.return_value = (
+            "› [CAO Handoff] Inspect the workspace.\n"
+            "\n"
+            "• Working (21s • esc to interrupt)\n"
+            "\n"
+            "─────\n"
+            "• Objective: inspect only /tmp/pilot-workspace.\n"
+            "\n"
+            "  Visible top-level files/directories:\n"
+            "\n"
+            "  - SESSION_STATE.md\n"
+            "\n"
+            "  SESSION_STATE.md: exists.\n"
+            "─────\n"
+            "\n"
+            "› Find and fix a bug in @filename\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        status = provider.get_status()
+
+        assert status == TerminalStatus.COMPLETED
+
+    @patch("cli_agent_orchestrator.providers.codex.tmux_client")
+    def test_get_status_completed_when_answer_mentions_footer_like_text(self, mock_tmux):
+        """Footer-like text in an answer bullet is not TUI chrome."""
+        mock_tmux.get_history.return_value = (
+            "› explain the Codex footer\n"
+            "• The footer may show gpt-5.5 xhigh · /tmp/pilot-workspace.\n"
+            "\n"
+            "› \n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        status = provider.get_status()
+
+        assert status == TerminalStatus.COMPLETED
+
+    @patch("cli_agent_orchestrator.providers.codex.tmux_client")
+    def test_get_status_not_completed_for_tool_activity_only(self, mock_tmux):
+        """Tool activity bullets are not final assistant responses."""
+        mock_tmux.get_history.return_value = (
+            "› [CAO Handoff] Inspect the workspace.\n"
+            "\n"
+            "• Explored\n"
+            "  └ Search SESSION_STATE.md in .\n"
+            "\n"
+            "• Ran pwd\n"
+            "  └ /tmp/pilot-workspace\n"
+            "\n"
+            "› Summarize recent commits\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        status = provider.get_status()
+
+        assert status == TerminalStatus.IDLE
+
+    @patch("cli_agent_orchestrator.providers.codex.tmux_client")
+    def test_get_status_not_completed_for_preamble_plus_tool_activity_only(self, mock_tmux):
+        """A pre-tool assistant note is not final completion after tool activity."""
+        mock_tmux.get_history.return_value = (
+            "› Use handoff to inspect the workspace.\n"
+            "\n"
+            "• I’ll route this through the CAO handoff path.\n"
+            "\n"
+            "• Called\n"
+            '  └ cao-mcp-server.handoff({"success": true})\n'
+            "\n"
+            "› Summarize recent commits\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        status = provider.get_status()
+
+        assert status == TerminalStatus.IDLE
+
+    @patch("cli_agent_orchestrator.providers.codex.tmux_client")
+    def test_get_status_completed_for_response_after_tool_activity(self, mock_tmux):
+        """COMPLETED when a final response appears after tool activity."""
+        mock_tmux.get_history.return_value = (
+            "› Use handoff to inspect the workspace.\n"
+            "\n"
+            "• I’ll route this through the CAO handoff path.\n"
+            "\n"
+            "• Called\n"
+            '  └ cao-mcp-server.handoff({"success": true})\n'
+            "\n"
+            "• The handoff succeeded.\n"
+            "\n"
+            "› Summarize recent commits\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        status = provider.get_status()
+
+        assert status == TerminalStatus.COMPLETED
+
+    @patch("cli_agent_orchestrator.providers.codex.tmux_client")
+    def test_get_status_completed_for_answer_bullets_that_look_like_activity(self, mock_tmux):
+        """Answer bullets starting with activity verbs are still responses."""
+        mock_tmux.get_history.return_value = (
+            "› summarize the work\n"
+            "• Done.\n"
+            "  • Ran tests successfully.\n"
+            "  • Updated docs.\n"
+            "  • Created a patch bundle.\n"
+            "\n"
+            "› Summarize recent commits\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        status = provider.get_status()
+
+        assert status == TerminalStatus.COMPLETED
+
+    @patch("cli_agent_orchestrator.providers.codex.tmux_client")
+    def test_get_status_completed_for_top_level_ran_answer_without_tree(self, mock_tmux):
+        """A top-level answer bullet starting with Ran is not TUI activity."""
+        mock_tmux.get_history.return_value = (
+            "› summarize the work\n"
+            "• Ran tests successfully and prepared the patch bundle.\n"
+            "\n"
+            "› Summarize recent commits\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        status = provider.get_status()
+
+        assert status == TerminalStatus.COMPLETED
+
 
 class TestCodexProviderMessageExtraction:
     def test_extract_last_message_success(self):
@@ -956,6 +1102,154 @@ def test_extract_double_blank_between_hint_and_status(self):
         assert "I've fixed the issue" in message
         assert "Find and fix a bug" not in message
 
+    def test_extract_bullet_with_v0111_footer_and_stale_spinner(self):
+        """Extract final answer after stale TUI spinner, excluding footer chrome."""
+        output = (
+            "› [CAO Handoff] Inspect the workspace.\n"
+            "\n"
+            "• Working (21s • esc to interrupt)\n"
+            "\n"
+            "─────\n"
+            "• Objective: inspect only /tmp/pilot-workspace.\n"
+            "\n"
+            "  Visible top-level files/directories:\n"
+            "\n"
+            "  - SESSION_STATE.md\n"
+            "\n"
+            "  SESSION_STATE.md: exists.\n"
+            "─────\n"
+            "\n"
+            "› Find and fix a bug in @filename\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        message = provider.extract_last_message_from_script(output)
+
+        assert "Objective: inspect only" in message
+        assert "SESSION_STATE.md: exists." in message
+        assert "Working (21s" not in message
+        assert "Find and fix a bug" not in message
+        assert "gpt-5.5" not in message
+
+    def test_extract_skips_tool_activity_before_final_answer(self):
+        """Tool activity rows before the answer should not be returned."""
+        output = (
+            "› [CAO Handoff] Inspect the workspace.\n"
+            "\n"
+            "• Explored\n"
+            "  └ Search SESSION_STATE.md in .\n"
+            "\n"
+            "• Ran pwd\n"
+            "  └ /tmp/pilot-workspace\n"
+            "\n"
+            "• Objective: inspect only /tmp/pilot-workspace.\n"
+            "  Visible top-level files/directories:\n"
+            "  - SESSION_STATE.md\n"
+            "  SESSION_STATE.md: exists.\n"
+            "\n"
+            "› Summarize recent commits\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        message = provider.extract_last_message_from_script(output)
+
+        assert "Objective: inspect only" in message
+        assert "SESSION_STATE.md: exists." in message
+        assert "Explored" not in message
+        assert "Ran pwd" not in message
+
+    def test_extract_raises_for_tool_activity_only(self):
+        """Tool activity alone is not a completed Codex response."""
+        output = (
+            "› [CAO Handoff] Inspect the workspace.\n"
+            "\n"
+            "• Explored\n"
+            "  └ Search SESSION_STATE.md in .\n"
+            "\n"
+            "• Ran pwd\n"
+            "  └ /tmp/pilot-workspace\n"
+            "\n"
+            "› Summarize recent commits\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+
+        with pytest.raises(ValueError, match="No Codex response found"):
+            provider.extract_last_message_from_script(output)
+
+    def test_extract_final_answer_after_tool_activity(self):
+        """Extraction should return the final answer after MCP/tool activity."""
+        output = (
+            "› Use handoff to inspect the workspace.\n"
+            "\n"
+            "• I’ll route this through the CAO handoff path.\n"
+            "\n"
+            "• Called\n"
+            '  └ cao-mcp-server.handoff({"success": true})\n'
+            '    {"output": "• RESULT:\\n  SESSION_STATE.md exists: yes."}\n'
+            "\n"
+            "• The handoff succeeded.\n"
+            "  Worker output summary: SESSION_STATE.md exists.\n"
+            "\n"
+            "› Summarize recent commits\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        message = provider.extract_last_message_from_script(output)
+
+        assert "The handoff succeeded" in message
+        assert "SESSION_STATE.md exists" in message
+        assert "I’ll route" not in message
+        assert "cao-mcp-server.handoff" not in message
+
+    def test_extract_answer_bullets_that_look_like_activity(self):
+        """Normal answer bullets that start with activity verbs should remain."""
+        output = (
+            "› summarize the work\n"
+            "• Done.\n"
+            "  • Ran tests successfully.\n"
+            "  • Updated docs.\n"
+            "  • Created a patch bundle.\n"
+            "\n"
+            "› Summarize recent commits\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        message = provider.extract_last_message_from_script(output)
+
+        assert "Done." in message
+        assert "Ran tests successfully" in message
+        assert "Updated docs" in message
+        assert "Created a patch bundle" in message
+        assert "gpt-5.5" not in message
+
+    def test_extract_top_level_ran_answer_without_tree(self):
+        """A top-level Ran answer without a Codex tree line should extract."""
+        output = (
+            "› summarize the work\n"
+            "• Ran tests successfully and prepared the patch bundle.\n"
+            "\n"
+            "› Summarize recent commits\n"
+            "\n"
+            "  gpt-5.5 xhigh · /tmp/pilot-workspace\n"
+        )
+
+        provider = CodexProvider("test1234", "test-session", "window-0")
+        message = provider.extract_last_message_from_script(output)
+
+        assert "Ran tests successfully" in message
+        assert "gpt-5.5" not in message
+
 
 class TestCodexProviderMisc:
     def test_get_idle_pattern_for_log(self):
diff --git a/test/services/test_settings_service.py b/test/services/test_settings_service.py
index a9b81111..24840da3 100644
--- a/test/services/test_settings_service.py
+++ b/test/services/test_settings_service.py
@@ -1,5 +1,6 @@
 """Tests for settings_service module."""
 
+import importlib
 import json
 from pathlib import Path
 from unittest.mock import patch
@@ -118,6 +119,25 @@ def test_returns_all_default_keys(self, settings_file):
         for key in _DEFAULTS:
             assert key in result
 
+    def test_cao_managed_defaults_follow_cao_home_dir_env_override(self, tmp_path):
+        """CAO-managed agent directories stay inside an overridden CAO home."""
+        import cli_agent_orchestrator.constants as constants_module
+        import cli_agent_orchestrator.services.settings_service as settings_module
+
+        custom_home = tmp_path / "cao-home"
+        with patch.dict("os.environ", {"CAO_HOME_DIR": str(custom_home)}, clear=False):
+            importlib.reload(constants_module)
+            importlib.reload(settings_module)
+
+            result = settings_module.get_agent_dirs()
+
+            assert result["claude_code"] == str(custom_home / "agent-store")
+            assert result["codex"] == str(custom_home / "agent-store")
+            assert result["cao_installed"] == str(custom_home / "agent-context")
+
+        importlib.reload(constants_module)
+        importlib.reload(settings_module)
+
 
 class TestSetAgentDirs:
     """Tests for set_agent_dirs function."""
diff --git a/test/test_constants.py b/test/test_constants.py
index 303dd3c5..8b62f1f5 100644
--- a/test/test_constants.py
+++ b/test/test_constants.py
@@ -97,6 +97,23 @@ def test_cao_home_dir_is_pathlib_path(self):
 
         assert isinstance(CAO_HOME_DIR, Path)
 
+    def test_cao_home_dir_honors_env_override(self, tmp_path):
+        """Test that CAO_HOME_DIR can be isolated with an environment override."""
+        import importlib
+
+        import cli_agent_orchestrator.constants as constants_module
+
+        custom_home = tmp_path / "cao-home"
+        with patch.dict("os.environ", {"CAO_HOME_DIR": str(custom_home)}, clear=False):
+            importlib.reload(constants_module)
+
+            assert constants_module.CAO_HOME_DIR == custom_home
+            assert constants_module.DB_DIR == custom_home / "db"
+            assert constants_module.LOCAL_AGENT_STORE_DIR == custom_home / "agent-store"
+            assert constants_module.SKILLS_DIR == custom_home / "skills"
+
+        importlib.reload(constants_module)
+
     def test_db_dir_is_under_cao_home(self):
         """Test that DB_DIR is under CAO_HOME_DIR."""
         from cli_agent_orchestrator.constants import CAO_HOME_DIR, DB_DIR