Reuse conversation cache when streaming edits (#30245)

Release Notes: - Improved latency when the agent applies edits.
2025-05-08 14:36:34 +02:00 · 2025-05-08 14:36:34 +02:00 · 9f6809a28d
commit 9f6809a28d
parent 032022e37b
50 changed files with 847 additions and 21557 deletions
--- a/crates/agent/src/active_thread.rs
+++ b/crates/agent/src/active_thread.rs
@@ -1411,6 +1411,7 @@ impl ActiveThread {
                        mode: None,
                        messages: vec![request_message],
                        tools: vec![],
+                        tool_choice: None,
                        stop: vec![],
                        temperature: AssistantSettings::temperature_for_model(
                            &configured_model.model,
@@ -3256,7 +3257,7 @@ impl ActiveThread {
                        c.tool_use_id.clone(),
                        c.ui_text.clone(),
                        c.input.clone(),
-                        &c.messages,
+                        c.request.clone(),
                        c.tool.clone(),
                        configured.model,
                        Some(window.window_handle()),