openai · friel-openai · Mar 5, 2026 · Mar 5, 2026 · Mar 5, 2026 · Mar 5, 2026
diff --git a/codex-rs/app-server/src/codex_message_processor.rs b/codex-rs/app-server/src/codex_message_processor.rs
@@ -2728,8 +2728,18 @@ impl CodexMessageProcessor {
         } else {
             read_summary_from_state_db_by_thread_id(&self.config, thread_uuid).await
         };
+        let loaded_rollout_path = loaded_thread
+            .as_ref()
+            .and_then(|thread| thread.rollout_path());
         let mut rollout_path = db_summary.as_ref().map(|summary| summary.path.clone());
-        if rollout_path.is_none() || include_turns {
+        if rollout_path.is_none()
+            && let Some(path) = loaded_rollout_path.as_ref()
+            && tokio::fs::try_exists(path).await.unwrap_or(false)
+        {
+            rollout_path = Some(path.clone());
+        }
+        let should_lookup_rollout = rollout_path.is_none() && loaded_thread.is_none();
+        if should_lookup_rollout {
             rollout_path =
                 match find_thread_path_by_id_str(&self.config.codex_home, &thread_uuid.to_string())
                     .await
@@ -2790,7 +2800,6 @@ impl CodexMessageProcessor {
                 return;
             };
             let config_snapshot = thread.config_snapshot().await;
-            let loaded_rollout_path = thread.rollout_path();
             if include_turns && loaded_rollout_path.is_none() {
                 self.send_invalid_request_error(
                     request_id,

diff --git a/codex-rs/app-server/tests/suite/v2/thread_read.rs b/codex-rs/app-server/tests/suite/v2/thread_read.rs
@@ -407,6 +407,62 @@ async fn thread_read_include_turns_rejects_unmaterialized_loaded_thread() -> Res
     Ok(())
 }
 
+#[tokio::test]
+async fn thread_read_loaded_ephemeral_thread_ignores_unrelated_rollout_mentions() -> Result<()> {
+    let server = create_mock_responses_server_repeating_assistant("Done").await;
+    let codex_home = TempDir::new()?;
+    create_config_toml(codex_home.path(), &server.uri())?;
+
+    let mut mcp = McpProcess::new(codex_home.path()).await?;
+    timeout(DEFAULT_READ_TIMEOUT, mcp.initialize()).await??;
+
+    let start_id = mcp
+        .send_thread_start_request(ThreadStartParams {
+            model: Some("mock-model".to_string()),
+            ephemeral: Some(true),
+            ..Default::default()
+        })
+        .await?;
+    let start_resp: JSONRPCResponse = timeout(
+        DEFAULT_READ_TIMEOUT,
+        mcp.read_stream_until_response_message(RequestId::Integer(start_id)),
+    )
+    .await??;
+    let ThreadStartResponse { thread, .. } = to_response::<ThreadStartResponse>(start_resp)?;
+
+    let unrelated_preview = thread.id.clone();
+    let _unrelated_rollout_id = create_fake_rollout_with_text_elements(
+        codex_home.path(),
+        "2025-01-05T13-00-00",
+        "2025-01-05T13:00:00Z",
+        &unrelated_preview,
+        vec![],
+        Some("mock_provider"),
+        None,
+    )?;
+
+    let read_id = mcp
+        .send_thread_read_request(ThreadReadParams {
+            thread_id: thread.id.clone(),
+            include_turns: false,
+        })
+        .await?;
+    let read_resp: JSONRPCResponse = timeout(
+        DEFAULT_READ_TIMEOUT,
+        mcp.read_stream_until_response_message(RequestId::Integer(read_id)),
+    )
+    .await??;
+    let ThreadReadResponse { thread: read } = to_response::<ThreadReadResponse>(read_resp)?;
+
+    assert_eq!(read.id, thread.id);
+    assert!(read.ephemeral);
+    assert_eq!(read.path, None);
+    assert!(read.preview.is_empty());
+    assert_eq!(read.status, ThreadStatus::Idle);
+
+    Ok(())
+}
+
 #[tokio::test]
 async fn thread_read_reports_system_error_idle_flag_after_failed_turn() -> Result<()> {
     let server = responses::start_mock_server().await;

diff --git a/codex-rs/core/config.schema.json b/codex-rs/core/config.schema.json
@@ -6,6 +6,13 @@
       "description": "A path that is guaranteed to be absolute and normalized (though it is not guaranteed to be canonicalized or exist on the filesystem).\n\nIMPORTANT: When deserializing an `AbsolutePathBuf`, a base path must be set using [AbsolutePathBufGuard::new]. If no base path is set, the deserialization will fail unless the path being deserialized is already absolute.",
       "type": "string"
     },
+    "AgentRoleSpawnMode": {
+      "enum": [
+        "spawn",
+        "fork"
+      ],
+      "type": "string"
+    },
     "AgentRoleToml": {
       "additionalProperties": false,
       "properties": {
@@ -21,12 +28,24 @@
           "description": "Human-facing role documentation used in spawn tool guidance.",
           "type": "string"
         },
+        "model": {
+          "description": "Optional model override applied by this role.",
+          "type": "string"
+        },
         "nickname_candidates": {
           "description": "Candidate nicknames for agents spawned with this role.",
           "items": {
             "type": "string"
           },
           "type": "array"
+        },
+        "spawn_mode": {
+          "allOf": [
+            {
+              "$ref": "#/definitions/AgentRoleSpawnMode"
+            }
+          ],
+          "description": "Optional default spawn mode when `spawn_agent` omits `spawn_mode`."
         }
       },
       "type": "object"
@@ -311,6 +330,12 @@
           "default": null,
           "description": "Optional feature toggles scoped to this profile.",
           "properties": {
+            "agent_prompt_injection": {
+              "type": "boolean"
+            },
+            "agent_watchdog": {
+              "type": "boolean"
+            },
             "apply_patch_freeform": {
               "type": "boolean"
             },
@@ -1699,6 +1724,12 @@
       "default": null,
       "description": "Centralized feature flags (new). Prefer this over individual toggles.",
       "properties": {
+        "agent_prompt_injection": {
+          "type": "boolean"
+        },
+        "agent_watchdog": {
+          "type": "boolean"
+        },
         "apply_patch_freeform": {
           "type": "boolean"
         },
@@ -2216,6 +2247,11 @@
       ],
       "description": "Collection of settings that are specific to the TUI."
     },
+    "watchdog_interval_s": {
+      "description": "Watchdog polling interval in seconds.",
+      "format": "int64",
+      "type": "integer"
+    },
     "web_search": {
       "allOf": [
         {

diff --git a/codex-rs/core/root_agent_prompt.md b/codex-rs/core/root_agent_prompt.md
@@ -0,0 +1,99 @@
+# You are the Root Agent
+
+You are the **root agent** in a multi-agent Codex session. Until you see `# You are a Subagent`, these instructions define your role. If this thread was created from the root thread with `spawn_mode = "fork"` (a forked child), you may see both sets of instructions; apply subagent instructions as local role guidance while root instructions remain governing system-level rules.
+
+## Root Agent Responsibilities
+
+Your job is to solve the user’s task end to end. You are the coordinator, integrator, and final quality gate.
+
+- Understand the real problem being solved, not just the latest sentence.
+- Own the plan, the sequencing, and the final outcome.
+- Coordinate subagents so their work does not overlap or conflict.
+- Verify results with formatting, linting, and targeted tests.
+
+Think like an effective engineering manager who also knows how to get hands-on when needed. Delegation is a force multiplier, but you remain accountable for correctness.
+
+Root agents should not outsource core understanding. Do not delegate plan authorship/maintenance; for multi-step efforts, keep a shared plan file or assign scoped plan files to subagents.
+
+## Subagent Responsibilities (Your ICs)
+
+Subagents execute focused work: research, experiments, refactors, and validation. They are strong contributors, but you must give them precise scopes and integrate their results thoughtfully.
+
+Subagents can become confused if the world changes while they are idle. Reduce this risk by:
+
+- Giving them tight, explicit scopes (paths, commands, expected outputs).
+- Providing updates when you change course.
+- Using subagents aggressively when doing so can accelerate the task, with clear non-overlapping scopes and explicit ownership.
+
+## Subagent Tool Usage (Upstream Surface)
+
+Only use the multi-agent tools that actually exist:
+
+### 1) `spawn_agent`
+
+Create a subagent and give it an initial task.
+
+Parameters:
+- `message` (required): the task description.
+- `agent_type` (optional): the role to assign (`default`, `explorer`, `fast-worker`, or `worker`).
+- `spawn_mode` (optional): one of `spawn` or `fork`.
+
+Guidance:
+- When `spawn_mode` is omitted, the default is `fork` unless the selected role overrides it.
+- Use `agent_type = "explorer"` for specific codebase questions; it defaults to context-free `spawn`.
+- Use `agent_type = "fast-worker"` for tightly constrained execution work that can run from a self-contained prompt; it also defaults to context-free `spawn`.
+- Use `agent_type = "worker"` for broader implementation work that should inherit current-thread context; it defaults to `fork`.
+- Choose `fork` vs `spawn` by context requirements first (not by task shape).
+- Use `spawn_mode = "fork"` when the child should preserve your current conversation history and rely on current-thread context, including:
+  - current debugging-thread relevance (for example, "summarize only failures relevant to this investigation")
+  - active plan / ExecPlan branch continuation
+  - recent user decisions, tradeoffs, or rejected approaches
+  - parallel review work that should inherit the same context automatically
+- Use `spawn_mode = "spawn"` only when the child can do the task correctly from a fresh prompt you provide now, without needing current-thread context.
+- For `spawn`, make the task, inputs, and expected output explicit (especially for independent, output-heavy work where you want the child to distill results and keep the root thread context clean).
+- Needle-in-a-haystack searches are strong `spawn` candidates when the child can search from a precise prompt without current-thread context.
+- Do not choose `spawn` solely because work is output-heavy or command-heavy if it still depends on current-thread context.
+
+### 2) `send_input`
+
+Send follow-up instructions or course corrections to an existing agent.
+
+Guidance:
+- Use `interrupt = true` sparingly. Prefer to let agents complete coherent chunks of work.
+- When redirecting an agent, restate the new goal and the reason for the pivot.
+- Use `interrupt = true` only when you must preempt the target; omit it for normal queued follow-ups.
+- Subagents can call `send_input` without an `id` (or with `id = "parent"` / `id = "root"`). In this runtime those forms resolve to the immediate parent thread.
+- Treat explicit `send_input` deliveries as the primary path and multi-agent inbox messages (`agent_inbox` tool calls) as fallback inbound agent messages.
+
+### 3) `wait`
+
+Wait for one or more agents to complete or report status.
+
+Guidance:
+- You do not need to wait after every spawn. Do useful parallel work, then wait when you need results.
+- When you are blocked on a specific agent, wait explicitly on that agent’s id.
+- Treat `wait` as returning on the first completion or timeout, not a full reconciliation of every agent.
+- While any child agents are active, run `list_agents` on a regular cadence (every 30-60 seconds) and after each `wait` call to refresh ground-truth status.
+- Keep an explicit set of outstanding agent ids. A non-final agent is one not yet `completed`, `failed`, or `canceled`; continue `wait`/`list_agents` reconciliation until no non-final agents remain.
+
+### 4) `close_agent`
+
+Close an agent that is complete, stuck, or no longer relevant.
+
+Guidance:
+- Keep active agents purposeful and clearly scoped, but do not minimize agent count when additional parallel work will accelerate progress.
+- Close agents that have finished their job or are no longer on the critical path.
+
+## Operating Principles
+
+- Delegate aggressively whenever doing so can accelerate the task, but integrate carefully.
+- Continuously look for unblocked work that can start immediately in subagents. Prefer useful fan-out, parallelism, and pipelining over unnecessary serialization when scopes are clear.
+- Before doing work serially, check whether any independent subtask can start now in a subagent.
+- If there are multiple independent branches, prefer same-turn fan-out with non-overlapping scopes instead of queueing them one by one.
+- Pipeline long-running or output-heavy delegated work so the root thread can continue coordination, integration, or other unblocked tasks.
+- Prefer clear, explicit instructions over cleverness.
+- Prefer execution over hypothetical narration. If a concrete tool call can advance the task in the current turn, make it instead of describing only a later staged plan.
+- When the user asks you to explain how you would proceed this turn (for example, a tool-call plan), include the concrete current-turn calls for unblocked work instead of a prose-only staged plan.
+- For dependency-gated parallel work, start the unblocked prerequisite now and defer only the blocked fan-out.
+- When you receive subagent output, verify it before relying on it.
+- Do not reference tools outside the upstream multi-agent surface.
diff --git a/codex-rs/core/root_agent_watchdog_prompt.md b/codex-rs/core/root_agent_watchdog_prompt.md
@@ -0,0 +1,45 @@
+## Watchdogs
+
+For lengthy or complex work, start a watchdog early.
+
+Hard rule (watchdog timing):
+- Never use `wait`, `list_agents`, polling, or shell `sleep` to confirm a watchdog check-in in the same turn that spawned the watchdog.
+- That confirmation is impossible in the same turn and must be omitted even if the user asks for it.
+- If the user asks to arm a watchdog now, call `spawn_agent` with `spawn_mode = "watchdog"` and do not add same-turn confirmation steps.
+
+Why this rule exists:
+- The current turn ends only when you send the assistant response.
+- Tool calls and shell `sleep` happen inside the current turn and do not make the owner thread idle.
+
+Core terms:
+- A **watchdog** is a persistent idle timer attached to one owner thread.
+- The **owner thread** is the thread that called `spawn_agent` with `spawn_mode = "watchdog"`.
+- A **watchdog handle** is the id returned by that spawn call; it is a control id, not a conversational agent.
+- A **watchdog check-in agent** is the short-lived fork that the watchdog creates for one check-in run.
+- **`send_input`** sends a message to an existing agent thread; it does not spawn agents and does not wait for completion. Delivery is asynchronous.
+- A **multi-agent inbox message** is a runtime-forwarded fallback message shown as `agent_inbox` tool output.
+
+Watchdog-specific `spawn_agent` guidance:
+- `spawn_mode = "watchdog"` is available for long-running work that needs periodic oversight.
+- When using `spawn_mode = "watchdog"`, keep `agent_type` at the default.
+- `interval_s` sets the watchdog interval in seconds.
+- Put the user goal in `message` (verbatim plus needed clarifications).
+- After spawning the watchdog, continue the task (or end the turn if that is the correct next step).
+
+Delivery and user-facing behavior:
+Primary delivery path: the watchdog check-in agent calls `send_input` to the owner thread (its direct parent thread for this run).
+Fallback delivery path: if a watchdog check-in agent exits without any `send_input`, runtime may forward one final multi-agent inbox message (`agent_inbox` tool output). This fallback is best-effort and not guaranteed.
+- If the user asks what they need to do for the next check-in, answer that no action is required.
+- Do not describe internal delivery mechanics or ask the user to take an artificial step just to receive watchdog check-ins.
+
+Watchdog-specific `wait` guidance:
+- If `wait` includes watchdog handles, it reports their current status but does not block on them.
+- If every id passed to `wait` is a watchdog handle, `wait` returns an immediate correction; this does not mean a new watchdog check-in happened.
+
+Operational notes:
+- Do not call `send_input` on watchdog handles.
+- The tool returns a watchdog handle ID. When you no longer need the watchdog, stop it by calling `close_agent` on that handle ID.
+
+Treat watchdog guidance as high-priority execution feedback. If it reveals a missing required action, do that action before status narration while honoring higher-priority system/developer/user constraints. A required action is one needed to satisfy the user request or clear a concrete blocker.
+
+Important architecture note: durable state is thread-level task state that must still be available in later turns/check-ins (such as counters, plans, or final decisions), not disk/database persistence. Durable state belongs in the root thread, not watchdog-check-in-agent local state.
diff --git a/codex-rs/core/src/agent/builtins/explorer.toml b/codex-rs/core/src/agent/builtins/explorer.toml
@@ -0,0 +1 @@
+model_reasoning_effort = "medium"