config: default agent settings and provider override
@@ -1,24 +1,30 @@
 # g3 Configuration Example
 #
-# This file demonstrates the new provider configuration format.
-# Provider references use the format: "<provider_type>.<config_name>"
+# Most settings have sensible defaults. A minimal config only needs:
+#
+# [providers]
+# default_provider = "anthropic.default"
+#
+# [providers.anthropic.default]
+# api_key = "your-api-key"
+# model = "claude-sonnet-4-5"
+#
+# Everything else below is optional.

 [providers]
-# Default provider used when no specific provider is specified
 default_provider = "anthropic.default"

 # Optional: Specify different providers for each mode
 # If not specified, these fall back to default_provider
 # planner = "anthropic.planner" # Provider for planning mode
-# coach = "anthropic.default" # Provider for coach (code reviewer) in autonomous mode
-# player = "anthropic.default" # Provider for player (code implementer) in autonomous mode
+# coach = "anthropic.default" # Provider for coach in autonomous mode
+# player = "anthropic.default" # Provider for player in autonomous mode

-# Named Anthropic configurations
 [providers.anthropic.default]
 api_key = "your-anthropic-api-key"
 model = "claude-sonnet-4-5"
-max_tokens = 64000
-temperature = 0.3
+# max_tokens = 64000 # Optional (default: provider's max)
+# temperature = 0.3 # Optional
 # cache_config = "ephemeral" # Optional: Enable prompt caching
 # enable_1m_context = true # Optional: Enable 1M context (costs extra)
 # thinking_budget_tokens = 10000 # Optional: Enable extended thinking mode
@@ -27,99 +33,50 @@ temperature = 0.3
 # [providers.anthropic.planner]
 # api_key = "your-anthropic-api-key"
 # model = "claude-opus-4-5"
-# max_tokens = 64000
 # thinking_budget_tokens = 16000

-# Named Databricks configurations
-[providers.databricks.default]
-host = "https://your-workspace.cloud.databricks.com"
-# token = "your-databricks-token" # Optional - will use OAuth if not provided
-model = "databricks-claude-sonnet-4"
-max_tokens = 4096
-temperature = 0.1
-use_oauth = true
+# Databricks provider example
+# [providers.databricks.default]
+# host = "https://your-workspace.cloud.databricks.com"
+# model = "databricks-claude-sonnet-4"
+# use_oauth = true

-# Named OpenAI configurations
+# OpenAI provider example
 # [providers.openai.default]
 # api_key = "your-openai-api-key"
 # model = "gpt-4-turbo"
-# max_tokens = 4096
-# temperature = 0.1

-# Multiple OpenAI-compatible providers can be configured
+# OpenAI-compatible providers (OpenRouter, Groq, etc.)
 # [providers.openai_compatible.openrouter]
 # api_key = "your-openrouter-api-key"
 # model = "anthropic/claude-3.5-sonnet"
 # base_url = "https://openrouter.ai/api/v1"
-# max_tokens = 4096
-# temperature = 0.1

-# [providers.openai_compatible.groq]
-# api_key = "your-groq-api-key"
-# model = "llama-3.3-70b-versatile"
-# base_url = "https://api.groq.com/openai/v1"
-# max_tokens = 4096
-# temperature = 0.1
+# =============================================================================
+# Agent settings (all optional - these are the defaults)
+# =============================================================================
+# [agent]
+# fallback_default_max_tokens = 8192
+# enable_streaming = true
+# timeout_seconds = 120
+# auto_compact = true
+# max_retry_attempts = 3
+# autonomous_max_retry_attempts = 6
+# max_context_length = 200000 # Override context window size

-[agent]
-fallback_default_max_tokens = 8192
-# max_context_length: Override the context window size for all providers
-# This is the total size of conversation history, not per-request output limit
-# max_context_length = 200000
-enable_streaming = true
-timeout_seconds = 60
-max_retry_attempts = 3
-autonomous_max_retry_attempts = 6
-allow_multiple_tool_calls = true
+# =============================================================================
+# Computer control (all optional - enabled by default)
+# =============================================================================
+# [computer_control]
+# enabled = true # Requires OS accessibility permissions
+# require_confirmation = true
+# max_actions_per_second = 5

-# Retry Configuration for Planning/Autonomous Mode
-#
-# The retry infrastructure handles transient errors during LLM API calls:
-# - Rate limits (HTTP 429)
-# - Network errors (connection failures)
-# - Server errors (HTTP 5xx)
-# - Request timeouts
-# - Model capacity issues (model busy)
-#
-# Default retry behavior:
-# - max_retry_attempts: Used by default interactive mode (3 retries)
-# - autonomous_max_retry_attempts: Used by planning/autonomous mode (6 retries)
-#
-# Note: The retry logic uses exponential backoff with longer delays in
-# autonomous mode to handle rate limits gracefully.
-#
-# Example player retry config (in code):
-# RetryConfig::planning("player") # Creates: max_retries=3, is_autonomous=true
-# RetryConfig::planning("player").with_max_retries(6) # Override max retries
-#
-# Example coach retry config (in code):
-# RetryConfig::planning("coach") # Creates: max_retries=3, is_autonomous=true
-# RetryConfig::planning("coach").with_max_retries(6) # Override max retries
-#
-
-[computer_control]
-enabled = false # Set to true to enable computer control (requires OS permissions)
-require_confirmation = true
-max_actions_per_second = 5
-
-[webdriver]
-enabled = false
-safari_port = 4444
-chrome_port = 9515
-# Browser to use: "safari" (default) or "chrome-headless"
-# Safari opens a visible browser window
-# Chrome headless runs in the background without a visible window
-browser = "safari"
-# Optional: Path to Chrome binary (e.g., Chrome for Testing)
-# If not set, ChromeDriver will use the default Chrome installation
-# Use this to avoid version mismatch issues between Chrome and ChromeDriver
-# Run: ./scripts/setup-chrome-for-testing.sh to install matching versions
-# chrome_binary = "/Users/yourname/.chrome-for-testing/chrome-mac-arm64/Google Chrome for Testing.app/Contents/MacOS/Google Chrome for Testing"
-# chrome_binary = "/Users/yourname/.chrome-for-testing/chrome-mac-x64/Google Chrome for Testing.app/Contents/MacOS/Google Chrome for Testing"
-# Optional: Path to ChromeDriver binary
-# If not set, looks for 'chromedriver' in PATH
-# The setup script creates a symlink at ~/.local/bin/chromedriver
-# chromedriver_binary = "/Users/yourname/.local/bin/chromedriver"
-
-[macax]
-enabled = false
+# =============================================================================
+# WebDriver browser automation (all optional)
+# =============================================================================
+# [webdriver]
+# enabled = true
+# browser = "chrome-headless" # Default. Alternative: "safari"
+# chrome_binary = "/path/to/chrome" # Optional: custom Chrome path
+# chromedriver_binary = "/path/to/driver" # Optional: custom ChromeDriver path
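The rewritten example reduces the required configuration to the two tables listed in its header comment. A minimal sketch of why the `[agent]`, `[computer_control]`, and `[webdriver]` tables can be omitted entirely — using simplified stand-in structs, not the real g3 types, with field names taken from the example above and the `#[serde(default)]` attributes this commit adds below:

```rust
// Hedged sketch: simplified mirror of the config structs, not g3's actual definitions.
use serde::Deserialize;
use std::collections::HashMap;

#[derive(Debug, Deserialize)]
struct AnthropicConfig {
    api_key: String,
    model: String,
}

#[derive(Debug, Deserialize)]
struct ProvidersConfig {
    default_provider: String,
    #[serde(default)]
    anthropic: HashMap<String, AnthropicConfig>,
}

// Stand-in for an optional section; deriving Default lets #[serde(default)] fill it in.
#[derive(Debug, Deserialize, Default)]
struct AgentConfig {
    #[serde(default)]
    max_context_length: Option<u32>,
}

#[derive(Debug, Deserialize)]
struct Config {
    providers: ProvidersConfig,
    #[serde(default)]
    agent: AgentConfig,
}

fn main() {
    // The "minimal config" from the example header: no [agent] table at all.
    let minimal = r#"
        [providers]
        default_provider = "anthropic.default"

        [providers.anthropic.default]
        api_key = "your-api-key"
        model = "claude-sonnet-4-5"
    "#;
    let cfg: Config = toml::from_str(minimal).expect("minimal config should parse");
    assert_eq!(cfg.providers.default_provider, "anthropic.default");
    assert!(cfg.agent.max_context_length.is_none());
}
```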
@@ -55,7 +55,7 @@ pub struct Cli {
 #[arg(long)]
 pub chat: bool,

-/// Override the configured provider (anthropic, databricks, embedded, openai)
+/// Override the configured provider (e.g., 'openai' or 'openai.default')
 #[arg(long, value_name = "PROVIDER")]
 pub provider: Option<String>,

@@ -7,8 +7,11 @@ use std::path::Path;
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct Config {
 pub providers: ProvidersConfig,
+#[serde(default)]
 pub agent: AgentConfig,
+#[serde(default)]
 pub computer_control: ComputerControlConfig,
+#[serde(default)]
 pub webdriver: WebDriverConfig,
 }

@@ -92,24 +95,59 @@ pub struct EmbeddedConfig {
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct AgentConfig {
 pub max_context_length: Option<u32>,
+#[serde(default = "default_fallback_max_tokens")]
 pub fallback_default_max_tokens: usize,
+#[serde(default = "default_true")]
 pub enable_streaming: bool,
+#[serde(default = "default_timeout_seconds")]
 pub timeout_seconds: u64,
+#[serde(default = "default_true")]
 pub auto_compact: bool,
+#[serde(default = "default_max_retry_attempts")]
 pub max_retry_attempts: u32,
+#[serde(default = "default_autonomous_max_retry_attempts")]
 pub autonomous_max_retry_attempts: u32,
 #[serde(default = "default_check_todo_staleness")]
 pub check_todo_staleness: bool,
 }

+fn default_fallback_max_tokens() -> usize {
+8192
+}
+fn default_true() -> bool {
+true
+}
+fn default_false() -> bool {
+false
+}
+fn default_timeout_seconds() -> u64 {
+120
+}
+fn default_max_retry_attempts() -> u32 {
+3
+}
+fn default_autonomous_max_retry_attempts() -> u32 {
+6
+}
+fn default_max_actions_per_second() -> u32 {
+5
+}
 fn default_check_todo_staleness() -> bool {
 true
 }
+fn default_safari_port() -> u16 {
+4444
+}
+fn default_chrome_port() -> u16 {
+9515
+}
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct ComputerControlConfig {
+#[serde(default = "default_true")]
 pub enabled: bool,
+#[serde(default = "default_false")]
 pub require_confirmation: bool,
+#[serde(default = "default_max_actions_per_second")]
 pub max_actions_per_second: u32,
 }

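A compact sketch of the named-default-function pattern the hunk above applies to every field. The struct here is illustrative, not the real AgentConfig; the 120-second timeout, 3 retries, and streaming-on values mirror the `default_*` functions in the diff:

```rust
use serde::Deserialize;

fn default_true() -> bool {
    true
}
fn default_timeout_seconds() -> u64 {
    120
}
fn default_max_retry_attempts() -> u32 {
    3
}

// Illustrative struct, not the real AgentConfig.
#[derive(Debug, Deserialize)]
struct AgentDefaults {
    #[serde(default = "default_true")]
    enable_streaming: bool,
    #[serde(default = "default_timeout_seconds")]
    timeout_seconds: u64,
    #[serde(default = "default_max_retry_attempts")]
    max_retry_attempts: u32,
}

fn main() {
    // An empty TOML table still deserializes; every missing field takes its default fn.
    let empty: AgentDefaults = toml::from_str("").unwrap();
    assert!(empty.enable_streaming);
    assert_eq!(empty.timeout_seconds, 120);
    assert_eq!(empty.max_retry_attempts, 3);

    // A partial table only overrides what it names.
    let partial: AgentDefaults = toml::from_str("timeout_seconds = 30").unwrap();
    assert_eq!(partial.timeout_seconds, 30);
    assert!(partial.enable_streaming);
}
```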
@@ -117,17 +155,19 @@ pub struct ComputerControlConfig {
 #[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Default)]
 #[serde(rename_all = "lowercase")]
 pub enum WebDriverBrowser {
-#[default]
 Safari,
+#[default]
 #[serde(rename = "chrome-headless")]
 ChromeHeadless,
 }

-#[derive(Debug, Clone, Serialize, Deserialize)]
+#[derive(Debug, Clone, Serialize, Deserialize, Default)]
 pub struct WebDriverConfig {
+#[serde(default = "default_true")]
 pub enabled: bool,
+#[serde(default = "default_safari_port")]
 pub safari_port: u16,
-#[serde(default)]
+#[serde(default = "default_chrome_port")]
 pub chrome_port: u16,
 #[serde(default)]
 /// Optional path to Chrome binary (e.g., Chrome for Testing)
@@ -141,24 +181,25 @@ pub struct WebDriverConfig {
 pub browser: WebDriverBrowser,
 }

-impl Default for WebDriverConfig {
+impl Default for AgentConfig {
 fn default() -> Self {
 Self {
-enabled: true,
-safari_port: 4444,
-chrome_port: 9515,
-chrome_binary: None,
-chromedriver_binary: None,
-browser: WebDriverBrowser::Safari,
+max_context_length: None,
+fallback_default_max_tokens: 8192,
+enable_streaming: true,
+timeout_seconds: 120,
+auto_compact: true,
+max_retry_attempts: 3,
+autonomous_max_retry_attempts: 6,
+check_todo_staleness: true,
 }
 }
 }

 impl Default for ComputerControlConfig {
 fn default() -> Self {
 Self {
-enabled: false,
-require_confirmation: true,
+enabled: true,
+require_confirmation: false,
 max_actions_per_second: 5,
 }
 }
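These Default impls change the out-of-the-box behavior: AgentConfig gains an explicit default (120-second timeout, 3 interactive and 6 autonomous retries), computer control now starts enabled without confirmation prompts, and WebDriverConfig derives Default, which makes chrome-headless the default browser via the relocated `#[default]` attribute. A small hedged sketch of the enum half of that, on a simplified copy rather than the real type:

```rust
use serde::Deserialize;

// Simplified copy of WebDriverBrowser for illustration.
#[derive(Debug, Deserialize, PartialEq, Default)]
#[serde(rename_all = "lowercase")]
enum Browser {
    Safari,
    #[default]
    #[serde(rename = "chrome-headless")]
    ChromeHeadless,
}

#[derive(Debug, Deserialize)]
struct WebDriverish {
    #[serde(default)]
    browser: Browser,
}

fn main() {
    // Derived Default now picks the headless variant...
    assert_eq!(Browser::default(), Browser::ChromeHeadless);
    // ...and the kebab-case value from the example config maps to the same variant.
    let w: WebDriverish = toml::from_str(r#"browser = "chrome-headless""#).unwrap();
    assert_eq!(w.browser, Browser::ChromeHeadless);
    // Omitting the key falls back to the default.
    let w: WebDriverish = toml::from_str("").unwrap();
    assert_eq!(w.browser, Browser::ChromeHeadless);
}
```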
@@ -445,20 +486,26 @@ impl Config {

 // Apply provider override
 if let Some(provider) = provider_override {
-// Validate the override
+// If provider doesn't contain '.', assume '.default'
+let provider = if provider.contains('.') {
+provider
+} else {
+format!("{}.default", provider)
+};
 config.validate_provider_reference(&provider)?;
 config.providers.default_provider = provider;
 }

 // Apply model override to the active provider
 if let Some(model) = model_override {
-let (provider_type, config_name) = Self::parse_provider_reference(
-&config.providers.default_provider
-)?;
+let (provider_type, config_name) =
+Self::parse_provider_reference(&config.providers.default_provider)?;

 match provider_type.as_str() {
 "anthropic" => {
-if let Some(ref mut anthropic_config) = config.providers.anthropic.get_mut(&config_name) {
+if let Some(ref mut anthropic_config) =
+config.providers.anthropic.get_mut(&config_name)
+{
 anthropic_config.model = model;
 } else {
 return Err(anyhow::anyhow!(
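A free-standing sketch of the shorthand handling introduced above (the same logic extracted for illustration; the function name is hypothetical): a bare provider type from `--provider` is expanded to its `.default` configuration, while an explicit `type.name` reference passes through before validation.

```rust
// Mirrors the normalization added in the hunk above.
fn normalize_provider_ref(provider: &str) -> String {
    if provider.contains('.') {
        provider.to_string()
    } else {
        format!("{}.default", provider)
    }
}

fn main() {
    assert_eq!(normalize_provider_ref("openai"), "openai.default");
    assert_eq!(normalize_provider_ref("anthropic.planner"), "anthropic.planner");
    // The normalized reference is then checked by validate_provider_reference,
    // so a typo still fails fast instead of silently misrouting requests.
}
```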
@@ -468,7 +515,9 @@ impl Config {
 }
 }
 "databricks" => {
-if let Some(ref mut databricks_config) = config.providers.databricks.get_mut(&config_name) {
+if let Some(ref mut databricks_config) =
+config.providers.databricks.get_mut(&config_name)
+{
 databricks_config.model = model;
 } else {
 return Err(anyhow::anyhow!(
@@ -478,7 +527,9 @@ impl Config {
 }
 }
 "embedded" => {
-if let Some(ref mut embedded_config) = config.providers.embedded.get_mut(&config_name) {
+if let Some(ref mut embedded_config) =
+config.providers.embedded.get_mut(&config_name)
+{
 embedded_config.model_path = model;
 } else {
 return Err(anyhow::anyhow!(
@@ -488,7 +539,9 @@ impl Config {
 }
 }
 "openai" => {
-if let Some(ref mut openai_config) = config.providers.openai.get_mut(&config_name) {
+if let Some(ref mut openai_config) =
+config.providers.openai.get_mut(&config_name)
+{
 openai_config.model = model;
 } else {
 return Err(anyhow::anyhow!(
@@ -499,13 +552,12 @@ impl Config {
 }
 _ => {
 // Check openai_compatible
-if let Some(ref mut compat_config) = config.providers.openai_compatible.get_mut(&provider_type) {
+if let Some(ref mut compat_config) =
+config.providers.openai_compatible.get_mut(&provider_type)
+{
 compat_config.model = model;
 } else {
-return Err(anyhow::anyhow!(
-"Unknown provider type: {}",
-provider_type
-));
+return Err(anyhow::anyhow!("Unknown provider type: {}", provider_type));
 }
 }
 }
@@ -585,36 +637,42 @@ impl Config {

 /// Get the current default provider's config
 pub fn get_default_provider_config(&self) -> Result<ProviderConfigRef<'_>> {
-let (provider_type, config_name) = Self::parse_provider_reference(
-&self.providers.default_provider
-)?;
+let (provider_type, config_name) =
+Self::parse_provider_reference(&self.providers.default_provider)?;

 match provider_type.as_str() {
-"anthropic" => {
-self.providers.anthropic.get(&config_name)
+"anthropic" => self
+.providers
+.anthropic
+.get(&config_name)
 .map(ProviderConfigRef::Anthropic)
-.ok_or_else(|| anyhow::anyhow!("Anthropic config '{}' not found", config_name))
-}
-"openai" => {
-self.providers.openai.get(&config_name)
+.ok_or_else(|| anyhow::anyhow!("Anthropic config '{}' not found", config_name)),
+"openai" => self
+.providers
+.openai
+.get(&config_name)
 .map(ProviderConfigRef::OpenAI)
-.ok_or_else(|| anyhow::anyhow!("OpenAI config '{}' not found", config_name))
-}
-"databricks" => {
-self.providers.databricks.get(&config_name)
+.ok_or_else(|| anyhow::anyhow!("OpenAI config '{}' not found", config_name)),
+"databricks" => self
+.providers
+.databricks
+.get(&config_name)
 .map(ProviderConfigRef::Databricks)
-.ok_or_else(|| anyhow::anyhow!("Databricks config '{}' not found", config_name))
-}
-"embedded" => {
-self.providers.embedded.get(&config_name)
+.ok_or_else(|| anyhow::anyhow!("Databricks config '{}' not found", config_name)),
+"embedded" => self
+.providers
+.embedded
+.get(&config_name)
 .map(ProviderConfigRef::Embedded)
-.ok_or_else(|| anyhow::anyhow!("Embedded config '{}' not found", config_name))
-}
-_ => {
-self.providers.openai_compatible.get(&provider_type)
+.ok_or_else(|| anyhow::anyhow!("Embedded config '{}' not found", config_name)),
+_ => self
+.providers
+.openai_compatible
+.get(&provider_type)
 .map(ProviderConfigRef::OpenAICompatible)
-.ok_or_else(|| anyhow::anyhow!("OpenAI compatible config '{}' not found", provider_type))
-}
+.ok_or_else(|| {
+anyhow::anyhow!("OpenAI compatible config '{}' not found", provider_type)
+}),
 }
 }
 }
@@ -1,32 +1,38 @@
 pub mod acd;
-pub mod context_window;
 pub mod background_process;
-pub mod compaction;
 pub mod code_search;
+pub mod compaction;
+pub mod context_window;
 pub mod error_handling;
 pub mod feedback_extraction;
 pub mod paths;
 pub mod project;
-pub mod provider_registration;
 pub mod provider_config;
+pub mod provider_registration;
 pub mod retry;
 pub mod session;
 pub mod session_continuation;
+pub mod stats;
+pub mod streaming;
 pub mod streaming_parser;
 pub mod task_result;
-pub mod tool_dispatch;
 pub mod tool_definitions;
+pub mod tool_dispatch;
 pub mod tools;
 pub mod ui_writer;
-pub mod streaming;
 pub mod utils;
 pub mod webdriver_session;
-pub mod stats;

+pub use feedback_extraction::{
+extract_coach_feedback, ExtractedFeedback, FeedbackExtractionConfig, FeedbackSource,
+};
+pub use retry::{execute_with_retry, retry_operation, RetryConfig, RetryResult};
+pub use session_continuation::{
+clear_continuation, find_incomplete_agent_session, format_session_time, get_session_dir,
+has_valid_continuation, list_sessions_for_directory, load_context_from_session_log,
+load_continuation, save_continuation, SessionContinuation,
+};
 pub use task_result::TaskResult;
-pub use retry::{RetryConfig, RetryResult, execute_with_retry, retry_operation};
-pub use feedback_extraction::{ExtractedFeedback, FeedbackSource, FeedbackExtractionConfig, extract_coach_feedback};
-pub use session_continuation::{SessionContinuation, load_continuation, save_continuation, clear_continuation, has_valid_continuation, get_session_dir, load_context_from_session_log, find_incomplete_agent_session, list_sessions_for_directory, format_session_time};

 // Re-export context window types
 pub use context_window::{ContextWindow, ThinScope};
@@ -55,12 +61,12 @@ use tokio_util::sync::CancellationToken;
 use tracing::{debug, error, warn};

 // Re-export path utilities
-pub use paths::{
-G3_WORKSPACE_PATH_ENV, ensure_session_dir, get_context_summary_file, get_g3_dir,
-get_session_file, get_session_logs_dir, get_session_todo_path, get_thinned_dir,
-get_errors_dir, get_background_processes_dir, get_discovery_dir,
-};
 use paths::get_todo_path;
+pub use paths::{
+ensure_session_dir, get_background_processes_dir, get_context_summary_file, get_discovery_dir,
+get_errors_dir, get_g3_dir, get_session_file, get_session_logs_dir, get_session_todo_path,
+get_thinned_dir, G3_WORKSPACE_PATH_ENV,
+};

 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct ToolCall {
@@ -68,7 +74,6 @@ pub struct ToolCall {
 pub args: serde_json::Value, // Should be a JSON object with tool-specific arguments
 }

-
 // Re-export WebDriverSession from its own module
 pub use webdriver_session::WebDriverSession;

@@ -87,9 +92,8 @@ pub enum StreamState {
 Resuming,
 }

-
 // Re-export StreamingToolParser from its own module
-pub use streaming_parser::{StreamingToolParser, sanitize_inline_tool_patterns, LBRACE_HOMOGLYPH};
+pub use streaming_parser::{sanitize_inline_tool_patterns, StreamingToolParser, LBRACE_HOMOGLYPH};

 pub struct Agent<W: UiWriter> {
 providers: ProviderRegistry,
@@ -108,9 +112,7 @@ pub struct Agent<W: UiWriter> {
 computer_controller: Option<Box<dyn g3_computer_control::ComputerController>>,
 todo_content: std::sync::Arc<tokio::sync::RwLock<String>>,
 webdriver_session: std::sync::Arc<
-tokio::sync::RwLock<
-Option<std::sync::Arc<tokio::sync::Mutex<WebDriverSession>>>,
->,
+tokio::sync::RwLock<Option<std::sync::Arc<tokio::sync::Mutex<WebDriverSession>>>>,
 >,
 webdriver_process: std::sync::Arc<tokio::sync::RwLock<Option<tokio::process::Child>>>,
 tool_call_count: usize,
@@ -167,7 +169,15 @@ impl<W: UiWriter> Agent<W> {
 custom_system_prompt: String,
 readme_content: Option<String>,
 ) -> Result<Self> {
-Self::new_with_mode_and_readme(config, ui_writer, false, readme_content, false, Some(custom_system_prompt)).await
+Self::new_with_mode_and_readme(
+config,
+ui_writer,
+false,
+readme_content,
+false,
+Some(custom_system_prompt),
+)
+.await
 }

 async fn new_with_mode(
@@ -188,8 +198,10 @@ impl<W: UiWriter> Agent<W> {
 custom_system_prompt: Option<String>,
 ) -> Result<Self> {
 // Register providers using the extracted module
-let providers_to_register = provider_registration::determine_providers_to_register(&config, is_autonomous);
-let providers = provider_registration::register_providers(&config, &providers_to_register).await?;
+let providers_to_register =
+provider_registration::determine_providers_to_register(&config, is_autonomous);
+let providers =
+provider_registration::register_providers(&config, &providers_to_register).await?;

 // Determine context window size based on active provider
 let mut context_warnings = Vec::new();
@@ -273,8 +285,9 @@ impl<W: UiWriter> Agent<W> {
 working_dir: None,
 background_process_manager: std::sync::Arc::new(
 background_process::BackgroundProcessManager::new(
-paths::get_background_processes_dir()
-)),
+paths::get_background_processes_dir(),
+),
+),
 pending_images: Vec::new(),
 is_agent_mode: false,
 agent_name: None,
@@ -309,7 +322,9 @@ impl<W: UiWriter> Agent<W> {

 // Check for system prompt markers that are present in both standard and agent mode
 // Agent mode replaces the identity line but keeps all other instructions
-let has_tool_instructions = first_message.content.contains("IMPORTANT: You must call tools to achieve goals");
+let has_tool_instructions = first_message
+.content
+.contains("IMPORTANT: You must call tools to achieve goals");
 if !has_tool_instructions {
 panic!("FATAL: First system message does not contain the system prompt. This likely means the README was added before the system prompt.");
 }
@@ -347,7 +362,10 @@ impl<W: UiWriter> Agent<W> {
 let (provider_type, config_name) = provider_config::parse_provider_ref(provider_name);

 match provider_type {
-"anthropic" => self.config.providers.anthropic
+"anthropic" => self
+.config
+.providers
+.anthropic
 .get(config_name)
 .and_then(|c| c.cache_config.as_ref())
 .and_then(|config| Self::parse_cache_control(config)),
@@ -362,8 +380,16 @@

 /// Get the thinking budget tokens for Anthropic provider, if configured.
 /// Pre-flight check to validate max_tokens for thinking.budget_tokens constraint.
-fn preflight_validate_max_tokens(&self, provider_name: &str, proposed_max_tokens: u32) -> (u32, bool) {
-provider_config::preflight_validate_max_tokens(&self.config, provider_name, proposed_max_tokens)
+fn preflight_validate_max_tokens(
+&self,
+provider_name: &str,
+proposed_max_tokens: u32,
+) -> (u32, bool) {
+provider_config::preflight_validate_max_tokens(
+&self.config,
+provider_name,
+proposed_max_tokens,
+)
 }

 /// Calculate max_tokens for a summary request.
@@ -377,8 +403,17 @@
 }

 /// Apply the fallback sequence to free up context space for thinking budget.
-fn apply_max_tokens_fallback_sequence(&mut self, provider_name: &str, initial_max_tokens: u32, hard_coded_minimum: u32) -> u32 {
-self.apply_fallback_sequence_impl(provider_name, Some(initial_max_tokens), hard_coded_minimum)
+fn apply_max_tokens_fallback_sequence(
+&mut self,
+provider_name: &str,
+initial_max_tokens: u32,
+hard_coded_minimum: u32,
+) -> u32 {
+self.apply_fallback_sequence_impl(
+provider_name,
+Some(initial_max_tokens),
+hard_coded_minimum,
+)
 }

 /// Unified implementation of the fallback sequence for freeing context space.
@@ -405,27 +440,33 @@
 );

 // Step 1: Try thinnify (first third of context)
-self.ui_writer.print_context_status("🥒 Step 1: Trying thinnify...\n");
+self.ui_writer
+.print_context_status("🥒 Step 1: Trying thinnify...\n");
 let thin_msg = self.do_thin_context();
 self.ui_writer.print_context_thinning(&thin_msg);

 // Recalculate after thinnify
-let (new_max, still_needs_reduction) = self.recalculate_max_tokens(provider_name, initial_max_tokens.is_some());
+let (new_max, still_needs_reduction) =
+self.recalculate_max_tokens(provider_name, initial_max_tokens.is_some());
 max_tokens = new_max;
 if !still_needs_reduction {
-self.ui_writer.print_context_status("✅ Thinnify resolved capacity issue. Continuing...\n");
+self.ui_writer
+.print_context_status("✅ Thinnify resolved capacity issue. Continuing...\n");
 return max_tokens;
 }

 // Step 2: Try skinnify (entire context)
-self.ui_writer.print_context_status("🦴 Step 2: Trying skinnify...\n");
+self.ui_writer
+.print_context_status("🦴 Step 2: Trying skinnify...\n");
 let skinny_msg = self.do_thin_context_all();
 self.ui_writer.print_context_thinning(&skinny_msg);

 // Recalculate after skinnify
-let (final_max, final_needs_reduction) = self.recalculate_max_tokens(provider_name, initial_max_tokens.is_some());
+let (final_max, final_needs_reduction) =
+self.recalculate_max_tokens(provider_name, initial_max_tokens.is_some());
 if !final_needs_reduction {
-self.ui_writer.print_context_status("✅ Skinnify resolved capacity issue. Continuing...\n");
+self.ui_writer
+.print_context_status("✅ Skinnify resolved capacity issue. Continuing...\n");
 return final_max;
 }

@@ -937,7 +978,7 @@
 /// Manually trigger context compaction regardless of context window size
 /// Returns Ok(true) if compaction was successful, Ok(false) if it failed
 pub async fn force_compact(&mut self) -> Result<bool> {
-use crate::compaction::{CompactionConfig, perform_compaction};
+use crate::compaction::{perform_compaction, CompactionConfig};

 debug!("Manual compaction triggered");

@@ -971,10 +1012,12 @@
 compaction_config,
 &self.ui_writer,
 &mut self.thinning_events,
-).await?;
+)
+.await?;

 if result.success {
-self.ui_writer.print_context_status("✅ Context compacted successfully.\n");
+self.ui_writer
+.print_context_status("✅ Context compacted successfully.\n");
 self.compaction_events.push(result.chars_saved);
 Ok(true)
 } else {
@@ -1006,7 +1049,9 @@

 /// Internal helper: thin all context and track the event
 fn do_thin_context_all(&mut self) -> String {
-let (message, chars_saved) = self.context_window.thin_context_all(self.session_id.as_deref());
+let (message, chars_saved) = self
+.context_window
+.thin_context_all(self.session_id.as_deref());
 self.thinning_events.push(chars_saved);
 message
 }
@@ -1030,10 +1075,12 @@
 self.ui_writer.print_context_thinning(&thin_summary);

 if !self.context_window.should_compact() {
-self.ui_writer.print_context_status("✅ Thinning resolved capacity issue. Continuing...\n");
+self.ui_writer
+.print_context_status("✅ Thinning resolved capacity issue. Continuing...\n");
 return Ok(false);
 }
-self.ui_writer.print_context_status("⚠️ Thinning insufficient. Proceeding with compaction...\n");
+self.ui_writer
+.print_context_status("⚠️ Thinning insufficient. Proceeding with compaction...\n");
 }

 // Compaction still needed
@@ -1041,7 +1088,7 @@
 return Ok(false);
 }

-use crate::compaction::{CompactionConfig, perform_compaction};
+use crate::compaction::{perform_compaction, CompactionConfig};

 self.ui_writer.print_context_status(&format!(
 "\n🗜️ Context window reaching capacity ({}%). Compacting...",
@@ -1049,7 +1096,10 @@
 ));

 let provider_name = self.providers.get(None)?.name().to_string();
-let latest_user_msg = request.messages.iter().rev()
+let latest_user_msg = request
+.messages
+.iter()
+.rev()
 .find(|m| matches!(m.role, MessageRole::User))
 .map(|m| m.content.clone());

@@ -1065,17 +1115,21 @@
 compaction_config,
 &self.ui_writer,
 &mut self.thinning_events,
-).await?;
+)
+.await?;

 if result.success {
-self.ui_writer.print_context_status("✅ Context compacted successfully. Continuing...\n");
+self.ui_writer
+.print_context_status("✅ Context compacted successfully. Continuing...\n");
 self.compaction_events.push(result.chars_saved);
 request.messages = self.context_window.conversation_history.clone();
 return Ok(true);
 }

 self.ui_writer.print_context_status("⚠️ Unable to compact context. Consider starting a new session if you continue to see errors.\n");
-Err(anyhow::anyhow!("Context window at capacity and compaction failed. Please start a new session."))
+Err(anyhow::anyhow!(
+"Context window at capacity and compaction failed. Please start a new session."
+))
 }

 /// Check if a tool call is a duplicate of the last tool call in the previous assistant message.
@@ -1090,11 +1144,13 @@
 let content = &msg.content;

 // Look for the last occurrence of a tool call pattern
-let last_tool_start = content.rfind(r#"{"tool""#)
+let last_tool_start = content
+.rfind(r#"{"tool""#)
 .or_else(|| content.rfind(r#"{ "tool""#))?;

 // Find the end of this JSON object
-let end_offset = StreamingToolParser::find_complete_json_object_end(&content[last_tool_start..])?;
+let end_offset =
+StreamingToolParser::find_complete_json_object_end(&content[last_tool_start..])?;
 let end_idx = last_tool_start + end_offset + 1;
 let tool_json = &content[last_tool_start..end_idx];

@@ -1234,7 +1290,10 @@
 .unwrap_or_else(|_| ".".to_string());

 // Get description from first user message (strip "Task: " prefix if present)
-let description = self.context_window.conversation_history.iter()
+let description = self
+.context_window
+.conversation_history
+.iter()
 .find(|m| matches!(m.role, g3_providers::MessageRole::User))
 .map(|m| {
 let content = m.content.strip_prefix("Task: ").unwrap_or(&m.content);
@@ -1272,13 +1331,19 @@
 /// Enable auto-memory reminders after turns with tool calls
 pub fn set_auto_memory(&mut self, enabled: bool) {
 self.auto_memory = enabled;
-debug!("Auto-memory reminders: {}", if enabled { "enabled" } else { "disabled" });
+debug!(
+"Auto-memory reminders: {}",
+if enabled { "enabled" } else { "disabled" }
+);
 }

 /// Enable or disable aggressive context dehydration (ACD)
 pub fn set_acd_enabled(&mut self, enabled: bool) {
 self.acd_enabled = enabled;
-debug!("ACD (aggressive context dehydration): {}", if enabled { "enabled" } else { "disabled" });
+debug!(
+"ACD (aggressive context dehydration): {}",
+if enabled { "enabled" } else { "disabled" }
+);
 }

 /// Build the final response and prepare for return.
@@ -1342,7 +1407,8 @@

 // Find the index of the last dehydration stub (marks the end of previously dehydrated content)
 // We only want to dehydrate messages AFTER the last stub+summary pair
-let last_stub_index = self.context_window
+let last_stub_index = self
+.context_window
 .conversation_history
 .iter()
 .rposition(|m| m.is_dehydrated_stub());
@@ -1356,14 +1422,19 @@
 };

 // Get the preceding fragment ID (if any)
-let preceding_id = crate::acd::get_latest_fragment_id(&session_id).ok().flatten();
+let preceding_id = crate::acd::get_latest_fragment_id(&session_id)
+.ok()
+.flatten();

 // Extract only NEW non-system messages to dehydrate (after the last stub+summary)
-let messages_to_dehydrate: Vec<_> = self.context_window
+let messages_to_dehydrate: Vec<_> = self
+.context_window
 .conversation_history
 .iter()
 .enumerate()
-.filter(|(idx, m)| *idx >= dehydrate_start && !matches!(m.role, g3_providers::MessageRole::System))
+.filter(|(idx, m)| {
+*idx >= dehydrate_start && !matches!(m.role, g3_providers::MessageRole::System)
+})
 .map(|(_, m)| m.clone())
 .collect();

@@ -1393,7 +1464,8 @@

 // Now replace the context: keep system messages + previous stubs/summaries, add new stub, add new summary
 // Extract messages to keep: system messages + everything up to (but not including) dehydrate_start
-let messages_to_keep: Vec<_> = self.context_window
+let messages_to_keep: Vec<_> = self
+.context_window
 .conversation_history
 .iter()
 .enumerate()
@@ -1445,14 +1517,18 @@
 // Check if any tools were called this turn
 if self.tool_calls_this_turn.is_empty() {
 debug!("Auto-memory: No tools called, skipping reminder");
-self.ui_writer.print_context_status("📝 Auto-memory: No tools called this turn, skipping reminder.\n");
+self.ui_writer.print_context_status(
+"📝 Auto-memory: No tools called this turn, skipping reminder.\n",
+);
 return Ok(false);
 }

 // Check if remember was already called this turn - no need to remind
 if self.tool_calls_this_turn.iter().any(|t| t == "remember") {
 debug!("Auto-memory: 'remember' was already called this turn, skipping reminder");
-self.ui_writer.print_context_status("\n📝 Auto-memory: 'remember' already called, skipping reminder.\n");
+self.ui_writer.print_context_status(
+"\n📝 Auto-memory: 'remember' already called, skipping reminder.\n",
+);
 self.tool_calls_this_turn.clear();
 return Ok(false);
 }
@@ -1460,7 +1536,11 @@
 // Take the tools list and reset for next turn
 let tools_called = std::mem::take(&mut self.tool_calls_this_turn);

-debug!("Auto-memory: Sending reminder to LLM ({} tools called this turn: {:?})", tools_called.len(), tools_called);
+debug!(
+"Auto-memory: Sending reminder to LLM ({} tools called this turn: {:?})",
+tools_called.len(),
+tools_called
+);
 self.ui_writer.print_context_status("\nMemory checkpoint: ");

 let reminder = r#"MEMORY CHECKPOINT: If you discovered code locations worth remembering, call `remember` now.
@@ -1496,10 +1576,8 @@ Skip if nothing new. Be brief."#;
 Skip if nothing new. Be brief."#;

 // Add the reminder as a user message and get a response
-self.context_window.add_message(Message::new(
-MessageRole::User,
-reminder.to_string(),
-));
+self.context_window
+.add_message(Message::new(MessageRole::User, reminder.to_string()));

 // Build the completion request
 let messages = self.context_window.conversation_history.clone();
@@ -1584,7 +1662,8 @@ Skip if nothing new. Be brief."#;

 // Restore messages from session log (skip system messages as they're preserved)
 for msg in messages {
-let role_str = msg.get("role").and_then(|r| r.as_str()).unwrap_or("user");
+let role_str =
+msg.get("role").and_then(|r| r.as_str()).unwrap_or("user");
 let content = msg.get("content").and_then(|c| c.as_str()).unwrap_or("");

 let role = match role_str {
@@ -1918,10 +1997,10 @@ Skip if nothing new. Be brief."#;
 // Always process all tool calls - they will be executed after stream ends

 // De-duplicate tool calls (sequential duplicates in chunk + duplicates from previous message)
-let deduplicated_tools = streaming::deduplicate_tool_calls(
-completed_tools,
-|tc| self.check_duplicate_in_previous_message(tc),
-);
+let deduplicated_tools =
+streaming::deduplicate_tool_calls(completed_tools, |tc| {
+self.check_duplicate_in_previous_message(tc)
+});

 // Process each tool call
 for (tool_call, duplicate_type) in deduplicated_tools {
@@ -1933,7 +2012,8 @@
 "Skipping duplicate tool call ({}): {} with args {}",
 dup_type,
 tool_call.tool,
-serde_json::to_string(&tool_call.args).unwrap_or_else(|_| "<unserializable>".to_string())
+serde_json::to_string(&tool_call.args)
+.unwrap_or_else(|_| "<unserializable>".to_string())
 );
 continue;
 }
@@ -1954,11 +2034,13 @@
 let text_content = parser.get_text_content();
 let clean_content = streaming::clean_llm_tokens(&text_content);
 let raw_content_for_log = clean_content.clone();
-let filtered_content = self.ui_writer.filter_json_tool_calls(&clean_content);
+let filtered_content =
+self.ui_writer.filter_json_tool_calls(&clean_content);
 let final_display_content = filtered_content.trim();

 // Extract only the new (undisplayed) portion
-let new_content = if current_response.len() <= final_display_content.len() {
+let new_content =
+if current_response.len() <= final_display_content.len() {
 final_display_content
 .chars()
 .skip(already_displayed_chars)
@@ -1981,11 +2063,13 @@

 self.ui_writer.finish_streaming_markdown();

-let is_todo_tool = tool_call.tool == "todo_read" || tool_call.tool == "todo_write";
+let is_todo_tool =
+tool_call.tool == "todo_read" || tool_call.tool == "todo_write";

 // Tool call header (TODO tools print their own)
 if !is_todo_tool {
-self.ui_writer.print_tool_header(&tool_call.tool, Some(&tool_call.args));
+self.ui_writer
+.print_tool_header(&tool_call.tool, Some(&tool_call.args));
 if let Some(args_obj) = tool_call.args.as_object() {
 for (key, value) in args_obj {
 let value_str = streaming::format_tool_arg_value(
@@ -1999,7 +2083,17 @@
 }

 // Check if this is a compact tool (file operations)
-let is_compact_tool = matches!(tool_call.tool.as_str(), "read_file" | "write_file" | "str_replace" | "remember" | "screenshot" | "coverage" | "rehydrate" | "code_search");
+let is_compact_tool = matches!(
+tool_call.tool.as_str(),
+"read_file"
+| "write_file"
+| "str_replace"
+| "remember"
+| "screenshot"
+| "coverage"
+| "rehydrate"
+| "code_search"
+);

 // Only print output header for non-compact tools
 if !is_compact_tool && !is_todo_tool {
@@ -2051,29 +2145,53 @@
 Some(streaming::truncate_for_display(&tool_result, 60))
 } else {
 match tool_call.tool.as_str() {
-"read_file" => Some(streaming::format_read_file_summary(output_len, tool_result.len())),
-"write_file" => Some(streaming::format_write_file_result(&tool_result)),
+"read_file" => {
+Some(streaming::format_read_file_summary(
+output_len,
+tool_result.len(),
+))
+}
+"write_file" => Some(
+streaming::format_write_file_result(&tool_result),
+),
 "str_replace" => {
 let (ins, del) = parse_diff_stats(&tool_result);
-Some(streaming::format_str_replace_summary(ins, del))
+Some(streaming::format_str_replace_summary(
+ins, del,
+))
 }
-"remember" => Some(streaming::format_remember_summary(&tool_result)),
-"screenshot" => Some(streaming::format_screenshot_summary(&tool_result)),
-"coverage" => Some(streaming::format_coverage_summary(&tool_result)),
-"rehydrate" => Some(streaming::format_rehydrate_summary(&tool_result)),
-"code_search" => Some(streaming::format_code_search_summary(&tool_result)),
+"remember" => Some(streaming::format_remember_summary(
+&tool_result,
+)),
+"screenshot" => Some(
+streaming::format_screenshot_summary(&tool_result),
+),
+"coverage" => Some(streaming::format_coverage_summary(
+&tool_result,
+)),
+"rehydrate" => Some(
+streaming::format_rehydrate_summary(&tool_result),
+),
+"code_search" => Some(
+streaming::format_code_search_summary(&tool_result),
+),
 _ => Some("✅ completed".to_string()),
 }
 }
 } else {
 // Regular tools: show truncated output lines
-let max_lines_to_show = if wants_full { output_len } else { MAX_LINES };
+let max_lines_to_show =
+if wants_full { output_len } else { MAX_LINES };
 for (idx, line) in output_lines.iter().enumerate() {
 if !wants_full && idx >= max_lines_to_show {
 break;
 }
 self.ui_writer.update_tool_output_line(
-&streaming::truncate_line(line, MAX_LINE_WIDTH, !wants_full)
+&streaming::truncate_line(
+line,
+MAX_LINE_WIDTH,
+!wants_full,
+),
 );
 }
 if !wants_full && output_len > MAX_LINES {
@@ -2143,7 +2261,10 @@ Skip if nothing new. Be brief."#;
 self.context_window.add_message(result_message);

 // Closure marker with timing
-let tokens_delta = self.context_window.used_tokens.saturating_sub(tokens_before);
+let tokens_delta = self
+.context_window
+.used_tokens
+.saturating_sub(tokens_before);

 // TODO tools handle their own output via print_todo_compact, skip timing
 if !is_todo_tool {
@@ -2157,10 +2278,11 @@ Skip if nothing new. Be brief."#;
 self.context_window.percentage_used(),
 );
 } else {
-self.ui_writer
-.print_tool_timing(&streaming::format_duration(exec_duration),
+self.ui_writer.print_tool_timing(
+&streaming::format_duration(exec_duration),
 tokens_delta,
-self.context_window.percentage_used());
+self.context_window.percentage_used(),
+);
 }
 }
 self.ui_writer.print_agent_prompt();
@@ -2179,7 +2301,8 @@ Skip if nothing new. Be brief."#;
 if self.agent_name.as_deref() == Some("scout") {
 tool_config = tool_config.with_research_excluded();
 }
-request.tools = Some(tool_definitions::create_tool_definitions(tool_config));
+request.tools =
+Some(tool_definitions::create_tool_definitions(tool_config));
 }

 // DO NOT add final_display_content to full_response here!
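The tokens_delta computation in the first hunk above uses saturating_sub, so the per-tool delta clamps to zero instead of underflowing if the context window's token count ends up lower than the snapshot taken before the tool ran (why that could happen is not shown in this hunk). A tiny illustration with made-up numbers:

```rust
fn main() {
    let tokens_before: usize = 12_000;

    // Counter shrank since the snapshot: plain subtraction on an unsigned
    // integer would underflow, saturating_sub clamps the delta to 0.
    let used_tokens: usize = 9_500;
    assert_eq!(used_tokens.saturating_sub(tokens_before), 0);

    // Normal case: the delta is just the growth since the snapshot.
    let used_tokens: usize = 12_750;
    assert_eq!(used_tokens.saturating_sub(tokens_before), 750);

    println!("tokens_delta examples ok");
}
```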
@@ -2196,7 +2319,6 @@ Skip if nothing new. Be brief."#;
 // This gives the LLM fresh attempts since it's making progress
 auto_summary_attempts = 0;

-
 // Reset the JSON tool call filter state after each tool execution
 // This ensures the filter doesn't stay in suppression mode for subsequent streaming content
 self.ui_writer.reset_json_filter();
@@ -2204,7 +2326,9 @@ Skip if nothing new. Be brief."#;
 // Only reset parser if there are no more unexecuted tool calls in the buffer
 // This handles the case where the LLM emits multiple tool calls in one response
 if parser.has_unexecuted_tool_call() {
-debug!("Parser still has unexecuted tool calls, not resetting buffer");
+debug!(
+"Parser still has unexecuted tool calls, not resetting buffer"
+);
 // Mark current tool as consumed so we don't re-detect it
 parser.mark_tool_calls_consumed();
 } else {
@@ -2366,7 +2490,6 @@ Skip if nothing new. Be brief."#;
 error!("Parser state at error: text_buffer_len={}, has_incomplete={}, message_stopped={}",
 parser.text_buffer_len(), parser.has_incomplete_tool_call(), parser.is_message_stopped());

-
 // Check if this is a recoverable connection error
 let is_connection_error = streaming::is_connection_error(&error_msg);

@@ -2452,7 +2575,8 @@ Skip if nothing new. Be brief."#;
 }

 // Check if the response was truncated due to max_tokens
-let was_truncated_by_max_tokens = stream_stop_reason.as_deref() == Some("max_tokens");
+let was_truncated_by_max_tokens =
+stream_stop_reason.as_deref() == Some("max_tokens");
 if was_truncated_by_max_tokens {
 debug!("Response was truncated due to max_tokens limit");
 warn!("LLM response was cut off due to max_tokens limit - will auto-continue");
@@ -2491,8 +2615,13 @@ Skip if nothing new. Be brief."#;
 "\n🔄 Model stopped without providing summary. Auto-continuing...\n",
 ),
 };
-warn!("{} ({} iterations, auto-continue attempt {}/{})",
-log_msg, iteration_count, auto_summary_attempts, MAX_AUTO_SUMMARY_ATTEMPTS);
+warn!(
+"{} ({} iterations, auto-continue attempt {}/{})",
+log_msg,
+iteration_count,
+auto_summary_attempts,
+MAX_AUTO_SUMMARY_ATTEMPTS
+);
 self.ui_writer.print_context_status(ui_msg);

 // Add any text response to context before prompting for continuation
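The first hunk above reflows the check that the stream stopped because of the max_tokens limit, which is what triggers the auto-continue path. A small sketch of that check, assuming the stop reason arrives as an Option<String> as it does in the surrounding code:

```rust
// True when the provider reported that generation was cut off by the token limit.
fn was_truncated(stream_stop_reason: &Option<String>) -> bool {
    stream_stop_reason.as_deref() == Some("max_tokens")
}

fn main() {
    assert!(was_truncated(&Some("max_tokens".to_string())));
    assert!(!was_truncated(&Some("end_turn".to_string())));
    assert!(!was_truncated(&None));
    println!("truncation check ok");
}
```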
@@ -2613,11 +2742,14 @@ Skip if nothing new. Be brief."#;
 Ok(s) => s.clone(),
 Err(e) => format!("ERROR: {}", e),
 };
-debug!("Tool {} completed: {}", tool_call.tool, &log_str.chars().take(100).collect::<String>());
+debug!(
+"Tool {} completed: {}",
+tool_call.tool,
+&log_str.chars().take(100).collect::<String>()
+);
 result
 }

-
 async fn execute_tool_inner_in_dir(
 &mut self,
 tool_call: &ToolCall,
@@ -2660,11 +2792,8 @@ Skip if nothing new. Be brief."#;
-
 Ok(result)
 }
-

 }
-

 // Re-export utility functions
 pub use utils::apply_unified_diff_to_string;
 use utils::truncate_to_word_boundary;
@@ -2678,12 +2807,20 @@ fn parse_diff_stats(result: &str) -> (i32, i32) {
 // Look for "+N insertions" pattern
 if let Some(pos) = result.find("+") {
 let after_plus = &result[pos + 1..];
-insertions = after_plus.split_whitespace().next().and_then(|s| s.parse().ok()).unwrap_or(0);
+insertions = after_plus
+.split_whitespace()
+.next()
+.and_then(|s| s.parse().ok())
+.unwrap_or(0);
 }
 // Look for "-M deletions" pattern
 if let Some(pos) = result.find("-") {
 let after_minus = &result[pos + 1..];
-deletions = after_minus.split_whitespace().next().and_then(|s| s.parse().ok()).unwrap_or(0);
+deletions = after_minus
+.split_whitespace()
+.next()
+.and_then(|s| s.parse().ok())
+.unwrap_or(0);
 }
 (insertions, deletions)
 }
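For illustration, a self-contained copy of the parse_diff_stats logic reconstructed from the hunk above; the exact shape of the input string is an assumption based on the "+N insertions" / "-M deletions" comments:

```rust
fn parse_diff_stats(result: &str) -> (i32, i32) {
    let mut insertions = 0;
    let mut deletions = 0;
    // Take the first whitespace-separated token after '+' and after '-'.
    if let Some(pos) = result.find('+') {
        insertions = result[pos + 1..]
            .split_whitespace()
            .next()
            .and_then(|s| s.parse().ok())
            .unwrap_or(0);
    }
    if let Some(pos) = result.find('-') {
        deletions = result[pos + 1..]
            .split_whitespace()
            .next()
            .and_then(|s| s.parse().ok())
            .unwrap_or(0);
    }
    (insertions, deletions)
}

fn main() {
    // Assumed result-string format, for illustration only.
    assert_eq!(parse_diff_stats("+12 insertions, -4 deletions"), (12, 4));
    assert_eq!(parse_diff_stats("no stats here"), (0, 0));
    println!("parse_diff_stats ok");
}
```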
@@ -110,9 +110,12 @@ use tokio_stream::wrappers::ReceiverStream;
 use tracing::{debug, error};

 use crate::{
+streaming::{
+decode_utf8_streaming, make_final_chunk, make_final_chunk_with_reason, make_text_chunk,
+make_tool_chunk,
+},
 CompletionChunk, CompletionRequest, CompletionResponse, CompletionStream, LLMProvider, Message,
 MessageRole, Tool, ToolCall, Usage,
-streaming::{decode_utf8_streaming, make_final_chunk, make_final_chunk_with_reason, make_text_chunk, make_tool_chunk},
 };

 const ANTHROPIC_API_URL: &str = "https://api.anthropic.com/v1/messages";
@@ -156,7 +159,7 @@ impl AnthropicProvider {
 name: "anthropic".to_string(),
 api_key,
 model,
-max_tokens: max_tokens.unwrap_or(4096),
+max_tokens: max_tokens.unwrap_or(32768),
 temperature: temperature.unwrap_or(0.1),
 cache_config,
 enable_1m_context: enable_1m_context.unwrap_or(false),
@@ -182,14 +185,17 @@ impl AnthropicProvider {

 let model = model.unwrap_or_else(|| "claude-3-5-sonnet-20241022".to_string());

-debug!("Initialized Anthropic provider '{}' with model: {}", name, model);
+debug!(
+"Initialized Anthropic provider '{}' with model: {}",
+name, model
+);

 Ok(Self {
 client,
 name,
 api_key,
 model,
-max_tokens: max_tokens.unwrap_or(4096),
+max_tokens: max_tokens.unwrap_or(32768),
 temperature: temperature.unwrap_or(0.1),
 cache_config,
 enable_1m_context: enable_1m_context.unwrap_or(false),
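Both constructors in the hunks above raise the fallback for max_tokens from 4096 to 32768 when the configuration leaves it unset. A minimal sketch of the unwrap_or fallback these lines rely on, with illustrative values:

```rust
fn main() {
    // No max_tokens in the config: fall back to the new default of 32768.
    let configured: Option<u32> = None;
    assert_eq!(configured.unwrap_or(32_768), 32_768);

    // Explicit value in the config: the default is ignored.
    let overridden: Option<u32> = Some(64_000);
    assert_eq!(overridden.unwrap_or(32_768), 64_000);

    println!("max_tokens defaults ok");
}
```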
@@ -292,7 +298,10 @@ impl AnthropicProvider {
 // Add text content
 content_blocks.push(AnthropicContent::Text {
 text: message.content.clone(),
-cache_control: message.cache_control.as_ref().map(Self::convert_cache_control),
+cache_control: message
+.cache_control
+.as_ref()
+.map(Self::convert_cache_control),
 });

 anthropic_messages.push(AnthropicMessage {
@@ -427,7 +436,10 @@ impl AnthropicProvider {
 if let Some(data) = line.strip_prefix("data: ") {
 if data == "[DONE]" {
 debug!("Received stream completion marker");
-let final_chunk = make_final_chunk(current_tool_calls.clone(), accumulated_usage.clone());
+let final_chunk = make_final_chunk(
+current_tool_calls.clone(),
+accumulated_usage.clone(),
+);
 if tx.send(Ok(final_chunk)).await.is_err() {
 debug!("Receiver dropped, stopping stream");
 }
@@ -491,7 +503,8 @@ impl AnthropicProvider {
 {
 // We have complete arguments, send the tool call immediately
 debug!("Tool call has complete args, sending immediately: {:?}", tool_call);
-let chunk = make_tool_chunk(vec![tool_call]);
+let chunk =
+make_tool_chunk(vec![tool_call]);
 if tx.send(Ok(chunk)).await.is_err() {
 debug!("Receiver dropped, stopping stream");
 return accumulated_usage;
@@ -575,7 +588,8 @@ impl AnthropicProvider {

 // Send the complete tool call
 if !current_tool_calls.is_empty() {
-let chunk = make_tool_chunk(current_tool_calls.clone());
+let chunk =
+make_tool_chunk(current_tool_calls.clone());
 if tx.send(Ok(chunk)).await.is_err() {
 debug!("Receiver dropped, stopping stream");
 return accumulated_usage;
@@ -597,7 +611,11 @@ impl AnthropicProvider {
 "message_stop" => {
 debug!("Received message stop event");
 message_stopped = true;
-let final_chunk = make_final_chunk_with_reason(current_tool_calls.clone(), accumulated_usage.clone(), stop_reason.clone());
+let final_chunk = make_final_chunk_with_reason(
+current_tool_calls.clone(),
+accumulated_usage.clone(),
+stop_reason.clone(),
+);
 if tx.send(Ok(final_chunk)).await.is_err() {
 debug!("Receiver dropped, stopping stream");
 }
@@ -826,7 +844,10 @@ struct ThinkingConfig {

 impl ThinkingConfig {
 fn enabled(budget_tokens: u32) -> Self {
-Self { thinking_type: "enabled".to_string(), budget_tokens }
+Self {
+thinking_type: "enabled".to_string(),
+budget_tokens,
+}
 }
 }

@@ -889,9 +910,7 @@ enum AnthropicContent {
 input: serde_json::Value,
 },
 #[serde(rename = "image")]
-Image {
-source: AnthropicImageSource,
-},
+Image { source: AnthropicImageSource },
 }

 /// Image source for Anthropic API
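The ThinkingConfig::enabled constructor reflowed above pairs with the tests later in this diff that expect "type":"enabled" and "budget_tokens":10000 in the serialized request. A stand-alone sketch of that serialization, assuming serde and serde_json are available and that the struct carries a #[serde(rename = "type")] attribute, which this hunk does not show:

```rust
use serde::Serialize;

// Stand-in for the struct above; field names follow the diff, the rename is inferred
// from the tests asserting on "type":"enabled".
#[derive(Serialize)]
struct ThinkingConfig {
    #[serde(rename = "type")]
    thinking_type: String,
    budget_tokens: u32,
}

fn main() {
    let cfg = ThinkingConfig {
        thinking_type: "enabled".to_string(),
        budget_tokens: 10_000,
    };
    let json = serde_json::to_string(&cfg).unwrap();
    assert_eq!(json, r#"{"type":"enabled","budget_tokens":10000}"#);
    println!("{json}");
}
```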
@@ -962,7 +981,8 @@ mod tests {
 #[test]
 fn test_message_conversion() {
 let provider =
-AnthropicProvider::new("test-key".to_string(), None, None, None, None, None, None).unwrap();
+AnthropicProvider::new("test-key".to_string(), None, None, None, None, None, None)
+.unwrap();

 let messages = vec![
 Message::new(
@@ -1011,7 +1031,8 @@ mod tests {
 #[test]
 fn test_tool_conversion() {
 let provider =
-AnthropicProvider::new("test-key".to_string(), None, None, None, None, None, None).unwrap();
+AnthropicProvider::new("test-key".to_string(), None, None, None, None, None, None)
+.unwrap();

 let tools = vec![Tool {
 name: "get_weather".to_string(),
@@ -1044,7 +1065,8 @@ mod tests {
 #[test]
 fn test_cache_control_serialization() {
 let provider =
-AnthropicProvider::new("test-key".to_string(), None, None, None, None, None, None).unwrap();
+AnthropicProvider::new("test-key".to_string(), None, None, None, None, None, None)
+.unwrap();

 // Test message WITHOUT cache_control
 let messages_without = vec![Message::new(MessageRole::User, "Hello".to_string())];
@@ -1106,7 +1128,10 @@ mod tests {
 .create_request_body(&messages, None, false, 1000, 0.5, false)
 .unwrap();
 let json_without = serde_json::to_string(&request_without).unwrap();
-assert!(!json_without.contains("thinking"), "JSON should not contain 'thinking' field when not configured");
+assert!(
+!json_without.contains("thinking"),
+"JSON should not contain 'thinking' field when not configured"
+);

 // Test WITH thinking parameter - max_tokens must be > budget_tokens + 1024
 // Using budget=10000 requires max_tokens > 11024
@@ -1125,16 +1150,28 @@ mod tests {
 .create_request_body(&messages, None, false, 20000, 0.5, false)
 .unwrap();
 let json_with = serde_json::to_string(&request_with).unwrap();
-assert!(json_with.contains("thinking"), "JSON should contain 'thinking' field when configured");
-assert!(json_with.contains("\"type\":\"enabled\""), "JSON should contain type: enabled");
-assert!(json_with.contains("\"budget_tokens\":10000"), "JSON should contain budget_tokens: 10000");
+assert!(
+json_with.contains("thinking"),
+"JSON should contain 'thinking' field when configured"
+);
+assert!(
+json_with.contains("\"type\":\"enabled\""),
+"JSON should contain type: enabled"
+);
+assert!(
+json_with.contains("\"budget_tokens\":10000"),
+"JSON should contain budget_tokens: 10000"
+);

 // Test WITH thinking parameter but INSUFFICIENT max_tokens - thinking should be disabled
 let request_insufficient = provider_with
 .create_request_body(&messages, None, false, 5000, 0.5, false) // Less than budget + 1024
 .unwrap();
 let json_insufficient = serde_json::to_string(&request_insufficient).unwrap();
-assert!(!json_insufficient.contains("thinking"), "JSON should NOT contain 'thinking' field when max_tokens is insufficient");
+assert!(
+!json_insufficient.contains("thinking"),
+"JSON should NOT contain 'thinking' field when max_tokens is insufficient"
+);
 }

 #[test]
@@ -1158,14 +1195,20 @@ mod tests {
 .create_request_body(&messages, None, false, 20000, 0.5, false)
 .unwrap();
 let json_with = serde_json::to_string(&request_with_thinking).unwrap();
-assert!(json_with.contains("thinking"), "JSON should contain 'thinking' field when not disabled");
+assert!(
+json_with.contains("thinking"),
+"JSON should contain 'thinking' field when not disabled"
+);

 // With disable_thinking=true, thinking should be disabled even with sufficient max_tokens
 let request_without_thinking = provider
 .create_request_body(&messages, None, false, 20000, 0.5, true)
 .unwrap();
 let json_without = serde_json::to_string(&request_without_thinking).unwrap();
-assert!(!json_without.contains("thinking"), "JSON should NOT contain 'thinking' field when explicitly disabled");
+assert!(
+!json_without.contains("thinking"),
+"JSON should NOT contain 'thinking' field when explicitly disabled"
+);
 }

 #[test]
@@ -1188,10 +1231,14 @@ mod tests {
 assert_eq!(response.model, "claude-sonnet-4-5");

 // Extract only text content (thinking should be filtered out)
-let text_content: Vec<_> = response.content.iter().filter_map(|c| match c {
+let text_content: Vec<_> = response
+.content
+.iter()
+.filter_map(|c| match c {
 AnthropicContent::Text { text, .. } => Some(text.as_str()),
 _ => None,
-}).collect();
+})
+.collect();

 assert_eq!(text_content.len(), 1);
 assert_eq!(text_content[0], "Here is my response.");
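The test comments above state that thinking is only attached when max_tokens exceeds budget_tokens + 1024; with a 10000-token budget, 20000 max_tokens qualifies and 5000 does not. A minimal sketch of that guard (the real implementation is not shown in this diff):

```rust
// Thinking is only enabled when max_tokens leaves room for the budget
// plus a 1024-token floor for the visible response.
fn thinking_allowed(max_tokens: u32, budget_tokens: u32) -> bool {
    max_tokens > budget_tokens + 1024
}

fn main() {
    assert!(thinking_allowed(20_000, 10_000)); // 20000 > 11024, thinking kept
    assert!(!thinking_allowed(5_000, 10_000)); // 5000 <= 11024, thinking dropped
    println!("thinking guard ok");
}
```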