fix(agent): retry malformed tool_call payloads in tool loop

2026-02-17 21:51:00 +08:00 · 2026-02-17 21:51:00 +08:00 · 3522d51f98
commit 3522d51f98
parent 4b89e91a5a
1 changed files with 136 additions and 1 deletions
--- a/src/agent/loop_.rs
+++ b/src/agent/loop_.rs
@ -660,13 +660,26 @@ pub(crate) async fn run_tool_call_loop(
                }
            };
-        let display_text = if parsed_text.is_empty() {
+        let parsed_text_is_empty = parsed_text.trim().is_empty();
        let display_text = if parsed_text_is_empty {
            response_text.clone()
        } else {
            parsed_text
        };
        let has_tool_call_markup =
            response_text.contains("<tool_call>") && response_text.contains("</tool_call>");
        if tool_calls.is_empty() {
            // Recovery path: the model attempted tool use but emitted malformed JSON.
            // Ask it to re-send valid tool-call payload instead of leaking raw markup to users.
            if has_tool_call_markup && parsed_text_is_empty {
                history.push(ChatMessage::assistant(response_text.clone()));
                history.push(ChatMessage::user(
                    "[Tool parser error]\nYour previous <tool_call> payload was invalid JSON and was NOT executed. Re-send the same tool call using strict valid JSON only. Escape inner double quotes inside string values.",
                ));
                continue;
            }
            // No tool calls — this is the final response
            history.push(ChatMessage::assistant(response_text.clone()));
            return Ok(display_text);
@ -1382,6 +1395,12 @@ mod tests {
        assert!(scrubbed.contains("public"));
    }
    use crate::memory::{Memory, MemoryCategory, SqliteMemory};
    use crate::observability::NoopObserver;
    use crate::providers::Provider;
    use crate::tools::{Tool, ToolResult};
    use async_trait::async_trait;
    use std::sync::Arc;
    use std::sync::atomic::{AtomicUsize, Ordering};
    use tempfile::TempDir;
    #[test]
@ -1923,4 +1942,120 @@ Done."#;
        let result = parse_tool_calls_from_json_value(&value);
        assert_eq!(result.len(), 2);
    }
    struct MalformedThenValidToolProvider;
    #[async_trait]
    impl Provider for MalformedThenValidToolProvider {
        async fn chat_with_system(
            &self,
            _system_prompt: Option<&str>,
            _message: &str,
            _model: &str,
            _temperature: f64,
        ) -> anyhow::Result<String> {
            anyhow::bail!("chat_with_system should not be called in this test");
        }
        async fn chat_with_history(
            &self,
            messages: &[ChatMessage],
            _model: &str,
            _temperature: f64,
        ) -> anyhow::Result<String> {
            if messages
                .iter()
                .any(|m| m.role == "user" && m.content.contains("[Tool results]"))
            {
                return Ok("Top memory users parsed successfully.".to_string());
            }
            if messages
                .iter()
                .any(|m| m.role == "user" && m.content.contains("[Tool parser error]"))
            {
                return Ok(
                    r#"<tool_call>
 {"name":"shell","arguments":{"command":"echo fixed"}}
 </tool_call>"#
                        .to_string(),
                );
            }
            Ok(
                r#"<tool_call>
 {"name":"shell","arguments":{"command":"echo "$rss $name ($pid)""}}
 </tool_call>"#
                    .to_string(),
            )
        }
    }
    struct CountingShellTool {
        runs: Arc<AtomicUsize>,
    }
    #[async_trait]
    impl Tool for CountingShellTool {
        fn name(&self) -> &str {
            "shell"
        }
        fn description(&self) -> &str {
            "Count shell executions"
        }
        fn parameters_schema(&self) -> serde_json::Value {
            serde_json::json!({
                "type": "object",
                "properties": {
                    "command": { "type": "string" }
                },
                "required": ["command"]
            })
        }
        async fn execute(&self, args: serde_json::Value) -> anyhow::Result<ToolResult> {
            self.runs.fetch_add(1, Ordering::SeqCst);
            Ok(ToolResult {
                success: true,
                output: args
                    .get("command")
                    .and_then(serde_json::Value::as_str)
                    .unwrap_or_default()
                    .to_string(),
                error: None,
            })
        }
    }
    #[tokio::test]
    async fn run_tool_call_loop_retries_invalid_tool_call_markup() {
        let runs = Arc::new(AtomicUsize::new(0));
        let tools_registry: Vec<Box<dyn Tool>> = vec![Box::new(CountingShellTool {
            runs: Arc::clone(&runs),
        })];
        let mut history = vec![ChatMessage::system("sys"), ChatMessage::user("check memory")];
        let response = run_tool_call_loop(
            &MalformedThenValidToolProvider,
            &mut history,
            &tools_registry,
            &NoopObserver,
            "test-provider",
            "test-model",
            0.0,
            true,
        )
        .await
        .unwrap();
        assert_eq!(response, "Top memory users parsed successfully.");
        assert_eq!(runs.load(Ordering::SeqCst), 1);
        assert!(!response.contains("<tool_call>"));
        assert!(history
            .iter()
            .any(|m| m.role == "user" && m.content.contains("[Tool parser error]")));
    }
 }