fix(parser): harden Agent subagent state machine, file matching, query performance and streaming child grouping

- Codex: decouple active_agent_count decrement from close_agent target parsing and reset counter on turn_context to prevent main assistant messages from being swallowed when close_agent events are malformed - Codex: use exact filename match with separator-aware fallback and sorted candidates for deterministic subagent session file resolution - Codex/OpenCode: truncate subagent tool call previews to 500 chars - OpenCode: batch-load all subagent tool calls in a single SQL query instead of per-task N+1 queries to avoid slow detail page loads - Streaming: restrict positional child grouping fallback to in-progress agents only, preventing top-level tool calls from being incorrectly folded into completed Agent cards - Tests: update Claude context window assertions to match 1M default
2026-04-17 09:38:52 +08:00
parent 73a910bb62
commit 3e30ab7d60
4 changed files with 143 additions and 66 deletions
--- a/src-tauri/src/parsers/claude.rs
+++ b/src-tauri/src/parsers/claude.rs
@@ -1369,7 +1369,7 @@ mod tests {
    fn defaults_context_limit_for_claude_models() {
        assert_eq!(
            claude_context_window_max_tokens_for_model(Some("claude-sonnet-4-6")),
-            Some(200_000)
+            Some(1_000_000)
        );
        assert_eq!(
            claude_context_window_max_tokens_for_model(Some("custom-model-x")),
@@ -1472,11 +1472,11 @@ mod tests {
        let stats = detail.session_stats.expect("session stats");
        assert_eq!(stats.context_window_used_tokens, Some(1700));
-        assert_eq!(stats.context_window_max_tokens, Some(200_000));
+        assert_eq!(stats.context_window_max_tokens, Some(1_000_000));
        let percent = stats
            .context_window_usage_percent
            .expect("context window usage percent");
-        assert!((percent - 0.85).abs() < f64::EPSILON);
+        assert!((percent - 0.17).abs() < 0.01);
    }
    #[test]
@@ -1586,7 +1586,7 @@ mod tests {
        // Stats should reflect only the real assistant usage
        let stats = detail.session_stats.expect("session stats");
        assert_eq!(stats.context_window_used_tokens, Some(1700));
-        assert_eq!(stats.context_window_max_tokens, Some(200_000));
+        assert_eq!(stats.context_window_max_tokens, Some(1_000_000));
        let total = stats.total_tokens.expect("total tokens");
        assert_eq!(total, 1900); // 1000 + 200 + 300 + 400
    }
--- a/src-tauri/src/parsers/codex.rs
+++ b/src-tauri/src/parsers/codex.rs
@@ -482,20 +482,37 @@ fn parse_codex_subagent_stats(
        return None;
    }
-    let session_file = fs::read_dir(session_dir).ok()?.find_map(|entry| {
+    // Try exact filename first (e.g., "agent-{agent_id}.jsonl"), then fall
-        let path = entry.ok()?.path();
+    // back to files whose stem ends with the agent_id. Collect and sort
-        if path.extension().and_then(|e| e.to_str()) == Some("jsonl")
+    // candidates to ensure deterministic selection across platforms.
-            && path
+    let exact_path = session_dir.join(format!("agent-{}.jsonl", agent_id));
-                .file_name()
+    let session_file = if exact_path.is_file() {
-                .unwrap_or_default()
+        exact_path
-                .to_string_lossy()
+    } else {
-                .contains(agent_id)
+        let mut candidates: Vec<_> = fs::read_dir(session_dir)
-        {
+            .ok()?
-            Some(path)
+            .filter_map(|entry| {
-        } else {
+                let path = entry.ok()?.path();
-            None
+                if path.extension().and_then(|e| e.to_str()) != Some("jsonl") {
-        }
+                    return None;
-    })?;
+                }
                let stem = path.file_stem()?.to_string_lossy().into_owned();
                // Match only if the stem ends with the agent_id after a separator
                // (e.g., "session-abc123" matches agent_id "abc123")
                if stem == agent_id
                    || stem
                        .strip_suffix(agent_id)
                        .is_some_and(|prefix| prefix.ends_with('-') || prefix.ends_with('_'))
                {
                    Some(path)
                } else {
                    None
                }
            })
            .collect();
        candidates.sort();
        candidates.into_iter().next()?
    };
    let file = fs::File::open(&session_file).ok()?;
    let reader = BufReader::new(file);
@@ -569,7 +586,7 @@ fn parse_codex_subagent_stats(
                let tc = AgentToolCall {
                    tool_name,
-                    input_preview,
+                    input_preview: input_preview.map(|s| truncate_str(&s, 500)),
                    output_preview: None,
                    is_error: false,
                };
@@ -592,9 +609,9 @@ fn parse_codex_subagent_stats(
                        let raw_output = value_to_preview(output_value);
                        if tc.tool_name == "exec_command" {
                            tc.output_preview =
-                                raw_output.map(|s| clean_codex_exec_output(&s));
+                                raw_output.map(|s| truncate_str(&clean_codex_exec_output(&s), 500));
                        } else {
-                            tc.output_preview = raw_output;
+                            tc.output_preview = raw_output.map(|s| truncate_str(&s, 500));
                        }
                        tc.is_error = infer_tool_call_output_is_error(
                            payload,
@@ -669,6 +686,7 @@ impl CodexParser {
        let mut agent_id_to_spawn_call_id: HashMap<String, String> = HashMap::new();
        let mut agent_final_results: HashMap<String, String> = HashMap::new();
        let mut wait_agent_call_ids: HashSet<String> = HashSet::new();
        let mut close_agent_call_ids: HashSet<String> = HashSet::new();
        let mut close_agent_targets: HashMap<String, String> = HashMap::new();
        let mut active_agent_count: u32 = 0;
        let mut call_id_tool_names: HashMap<String, String> = HashMap::new();
@@ -713,6 +731,8 @@ impl CodexParser {
                    }
                }
                "turn_context" => {
                    // A new API turn means any prior agent lifecycle is complete.
                    active_agent_count = 0;
                    if model.is_none() {
                        model = value
                            .get("payload")
@@ -972,6 +992,7 @@ impl CodexParser {
                                    }
                                    "close_agent" => {
                                        if let Some(ref id) = tool_use_id {
                                            close_agent_call_ids.insert(id.clone());
                                            let target = parse_codex_json_arg(payload)
                                                .and_then(|a| {
                                                    a.get("target")
@@ -1045,7 +1066,7 @@ impl CodexParser {
                                    .is_some_and(|id| wait_agent_call_ids.contains(id));
                                let is_close = tool_use_id
                                    .as_ref()
-                                    .is_some_and(|id| close_agent_targets.contains_key(id));
+                                    .is_some_and(|id| close_agent_call_ids.contains(id));
                                if is_spawn {
                                    if let Some(output_obj) = parse_codex_json_output(payload) {
--- a/src-tauri/src/parsers/opencode.rs
+++ b/src-tauri/src/parsers/opencode.rs
@@ -1,3 +1,4 @@
 use std::collections::HashMap;
 use std::future::Future;
 use std::path::PathBuf;
 use std::time::Duration;
@@ -9,7 +10,7 @@ use sea_orm::{
 };
 use crate::models::*;
-use crate::parsers::{folder_name_from_path, AgentParser, ParseError};
+use crate::parsers::{folder_name_from_path, truncate_str, AgentParser, ParseError};
 pub struct OpenCodeParser {
    base_dir: PathBuf,
@@ -225,6 +226,13 @@ impl OpenCodeParser {
            ))
            .await?;
        // Pre-scan: collect all subagent session IDs from task tool parts so we
        // can batch-load their tool calls in a single query instead of N queries.
        let subagent_session_ids = self
            .scan_subagent_session_ids(conn, conversation_id)
            .await;
        let subagent_tools = batch_load_subagent_tool_calls(conn, &subagent_session_ids).await;
        let mut messages = Vec::with_capacity(rows.len());
        for row in rows {
@@ -263,7 +271,7 @@ impl OpenCodeParser {
            };
            let (content_blocks, usage_from_step_finish) =
-                self.load_sqlite_parts(conn, &msg_id).await?;
+                self.load_sqlite_parts(conn, &msg_id, &subagent_tools).await?;
            let usage = if is_assistant {
                extract_opencode_usage(&value).or(usage_from_step_finish)
@@ -298,10 +306,43 @@ impl OpenCodeParser {
        Ok(messages)
    }
    /// Scan all tool parts in this conversation to extract subagent session IDs.
    async fn scan_subagent_session_ids(
        &self,
        conn: &DatabaseConnection,
        conversation_id: &str,
    ) -> Vec<String> {
        let rows = match conn
            .query_all(Statement::from_sql_and_values(
                DbBackend::Sqlite,
                r#"
                SELECT DISTINCT json_extract(p.data, '$.state.metadata.sessionId') AS sid
                FROM part p
                INNER JOIN message m ON m.id = p.message_id
                WHERE m.session_id = ?
                  AND json_extract(p.data, '$.type') = 'tool'
                  AND json_extract(p.data, '$.tool') = 'task'
                  AND json_extract(p.data, '$.state.input.subagent_type') IS NOT NULL
                  AND sid IS NOT NULL
                "#,
                [conversation_id.into()],
            ))
            .await
        {
            Ok(r) => r,
            Err(_) => return Vec::new(),
        };
        rows.iter()
            .filter_map(|row| row.try_get::<String>("", "sid").ok())
            .collect()
    }
    async fn load_sqlite_parts(
        &self,
        conn: &DatabaseConnection,
        message_id: &str,
        subagent_tools: &HashMap<String, Vec<AgentToolCall>>,
    ) -> Result<(Vec<ContentBlock>, Option<TurnUsage>), ParseError> {
        let rows = conn
            .query_all(Statement::from_sql_and_values(
@@ -435,12 +476,11 @@ impl OpenCodeParser {
                            _ => None,
                        };
-                        // Load sub-agent tool calls from the sub-agent session
+                        // Look up pre-fetched sub-agent tool calls
-                        let tool_calls = if let Some(sid) = session_id {
+                        let tool_calls = session_id
-                            load_subagent_tool_calls(conn, sid).await
+                            .and_then(|sid| subagent_tools.get(sid))
-                        } else {
+                            .cloned()
-                            Vec::new()
+                            .unwrap_or_default();
                        };
                        let tool_count = tool_calls.len() as u32;
                        let agent_stats = Some(AgentExecutionStats {
@@ -820,36 +860,47 @@ fn extract_task_result_content(raw: &str) -> String {
    raw.to_string()
 }
-/// Load tool calls from a sub-agent's session in the OpenCode SQLite database.
+/// Batch-load tool calls from multiple sub-agent sessions in a single query.
 ///
-/// Queries all messages and their parts in the given session, extracts tool-type
+/// Returns a map from session_id to its list of `AgentToolCall` records.
-/// parts, and returns a compact list of `AgentToolCall` records for display
+/// This avoids N+1 queries when a conversation has many agent tasks.
-/// inside the parent Agent card.
+async fn batch_load_subagent_tool_calls(
 async fn load_subagent_tool_calls(
    conn: &DatabaseConnection,
-    session_id: &str,
+    session_ids: &[String],
-) -> Vec<AgentToolCall> {
+) -> HashMap<String, Vec<AgentToolCall>> {
    if session_ids.is_empty() {
        return HashMap::new();
    }
    // Build parameterized IN clause
    let placeholders: Vec<&str> = session_ids.iter().map(|_| "?").collect();
    let sql = format!(
        r#"
        SELECT m.session_id, p.data
        FROM part p
        INNER JOIN message m ON m.id = p.message_id
        WHERE m.session_id IN ({})
          AND json_extract(p.data, '$.type') = 'tool'
        ORDER BY m.session_id, p.time_created ASC, p.id ASC
        "#,
        placeholders.join(", ")
    );
    let values: Vec<sea_orm::Value> = session_ids.iter().map(|s| s.as_str().into()).collect();
    let rows = match conn
-        .query_all(Statement::from_sql_and_values(
+        .query_all(Statement::from_sql_and_values(DbBackend::Sqlite, &sql, values))
            DbBackend::Sqlite,
            r#"
            SELECT p.data
            FROM part p
            INNER JOIN message m ON m.id = p.message_id
            WHERE m.session_id = ?
              AND json_extract(p.data, '$.type') = 'tool'
            ORDER BY p.time_created ASC, p.id ASC
            "#,
            [session_id.into()],
        ))
        .await
    {
        Ok(r) => r,
-        Err(_) => return Vec::new(),
+        Err(_) => return HashMap::new(),
    };
-    let mut tool_calls = Vec::new();
+    let mut result: HashMap<String, Vec<AgentToolCall>> = HashMap::new();
    for row in rows {
        let sid: String = match row.try_get("", "session_id") {
            Ok(s) => s,
            Err(_) => continue,
        };
        let data_raw: String = match row.try_get("", "data") {
            Ok(d) => d,
            Err(_) => continue,
@@ -879,17 +930,19 @@ async fn load_subagent_tool_calls(
        let state = value.get("state");
        let input_preview = state
            .and_then(|s| s.get("input"))
-            .and_then(|v| value_to_preview(Some(v)));
+            .and_then(|v| value_to_preview(Some(v)))
            .map(|s| truncate_str(&s, 500));
        let output_preview = state
            .and_then(|s| s.get("output"))
-            .and_then(|v| value_to_preview(Some(v)));
+            .and_then(|v| value_to_preview(Some(v)))
            .map(|s| truncate_str(&s, 500));
        let status = state
            .and_then(|s| s.get("status"))
            .and_then(|s| s.as_str())
            .unwrap_or("");
        let has_error_field = state.and_then(|s| s.get("error")).is_some();
-        tool_calls.push(AgentToolCall {
+        result.entry(sid).or_default().push(AgentToolCall {
            tool_name,
            input_preview,
            output_preview,
@@ -897,7 +950,7 @@ async fn load_subagent_tool_calls(
        });
    }
-    tool_calls
+    result
 }
 #[cfg(test)]
--- a/src/contexts/conversation-runtime-context.tsx
+++ b/src/contexts/conversation-runtime-context.tsx
@@ -295,18 +295,20 @@ function buildStreamingTurnsFromLiveMessage(
    }
  }
-  // Second pass: assign children using parentToolUseId or position fallback
+  // Second pass: assign children using parentToolUseId or position fallback.
  // Positional fallback only captures while the agent is still in-progress;
  // once it completes/fails, subsequent tool calls are treated as top-level.
  let positionalAgentId: string | null = null
  let positionalAgentCompleted = false
  for (const block of liveMessage.content) {
    if (block.type === "tool_call") {
      const toolName = getToolName(block.info)
      if (toolName === "agent") {
-        positionalAgentId = block.info.tool_call_id
+        const isFinal =
        positionalAgentCompleted =
          block.info.status === "completed" || block.info.status === "failed"
        // Only capture children while the agent is still running
        positionalAgentId = isFinal ? null : block.info.tool_call_id
      } else {
        // Extract parentToolUseId from ACP meta (Claude Code embeds this
        // under meta.claudeCode.parentToolUseId). Guard each access level
@@ -321,21 +323,22 @@ function buildStreamingTurnsFromLiveMessage(
          }
        }
        // Use explicit parentToolUseId when available, positional fallback
        // only for in-progress agents
        const resolvedParent =
-          parentId && agentIds.has(parentId) ? parentId : positionalAgentId // fallback
+          parentId && agentIds.has(parentId) ? parentId : positionalAgentId
        if (resolvedParent) {
          childToolCallIds.add(block.info.tool_call_id)
          agentChildren
-            .get(resolvedParent)!
+            .get(resolvedParent)
-            .push({ info: block.info, toolName })
+            ?.push({ info: block.info, toolName })
        }
      }
-    } else if (positionalAgentId && positionalAgentCompleted) {
+    } else if (positionalAgentId) {
-      // A text/thinking/plan block after a completed agent means the main
+      // A non-tool block (text/thinking/plan) means the main agent is
-      // agent is producing new content — stop position-based capture.
+      // producing new content — stop position-based capture.
      positionalAgentId = null
      positionalAgentCompleted = false
    }
  }