nearai · ilblackdragon · May 7, 2026 · May 7, 2026 · May 7, 2026 · May 7, 2026
diff --git a/providers.json b/providers.json
@@ -124,13 +124,13 @@
     "aliases": [
       "open_router"
     ],
-    "protocol": "open_ai_completions",
-    "default_base_url": "https://openrouter.ai/api/v1",
+    "protocol": "open_router",
+    "default_base_url": "",
     "api_key_env": "OPENROUTER_API_KEY",
     "api_key_required": true,
     "model_env": "OPENROUTER_MODEL",
     "default_model": "openai/gpt-4o",
-    "description": "OpenRouter multi-provider gateway (200+ models)",
+    "description": "OpenRouter multi-provider gateway (200+ models, preserves reasoning across turns)",
     "setup": {
       "kind": "api_key",
       "secret_name": "llm_openrouter_api_key",
@@ -246,13 +246,13 @@
     "aliases": [
       "deep_seek"
     ],
-    "protocol": "open_ai_completions",
-    "default_base_url": "https://api.deepseek.com/v1",
+    "protocol": "deep_seek",
+    "default_base_url": "",
     "api_key_env": "DEEPSEEK_API_KEY",
     "api_key_required": true,
     "model_env": "DEEPSEEK_MODEL",
     "default_model": "deepseek-chat",
-    "description": "DeepSeek inference API",
+    "description": "DeepSeek inference API (preserves reasoning_content for thinking-mode models)",
     "setup": {
       "kind": "api_key",
       "secret_name": "llm_deepseek_api_key",
@@ -325,13 +325,13 @@
       "google_gemini",
       "google"
     ],
-    "protocol": "open_ai_completions",
-    "default_base_url": "https://generativelanguage.googleapis.com/v1beta/openai",
+    "protocol": "gemini",
+    "default_base_url": "",
     "api_key_env": "GEMINI_API_KEY",
     "api_key_required": true,
     "model_env": "GEMINI_MODEL",
     "default_model": "gemini-2.5-flash",
-    "description": "Google Gemini (via OpenAI-compatible endpoint)",
+    "description": "Google Gemini native API (preserves thought_signature on tool calls)",
     "setup": {
       "kind": "api_key",
       "secret_name": "llm_gemini_api_key",

diff --git a/src/llm/mod.rs b/src/llm/mod.rs
@@ -187,6 +187,9 @@ fn create_registry_provider(
         ProviderProtocol::OpenAiCompletions => create_openai_compat_from_registry(config),
         ProviderProtocol::Anthropic => create_anthropic_from_registry(config),
         ProviderProtocol::Ollama => create_ollama_from_registry(config),
+        ProviderProtocol::DeepSeek => create_deepseek_from_registry(config),
+        ProviderProtocol::Gemini => create_gemini_from_registry(config),
+        ProviderProtocol::OpenRouter => create_openrouter_from_registry(config),
         ProviderProtocol::GithubCopilot => {
             let provider =
                 github_copilot::GithubCopilotProvider::new(config, request_timeout_secs)?;
@@ -424,6 +427,179 @@ fn create_ollama_from_registry(
     Ok(Arc::new(adapter))
 }
 
+/// Build a DeepSeek provider via rig-core's dedicated DeepSeek client.
+///
+/// Routing through this client (rather than the generic OpenAI-compat path)
+/// is what makes thinking-mode tool calling work: rig-core's DeepSeek
+/// implementation captures `reasoning_content` from each response and writes
+/// it back onto the assistant message in the next request. Without that
+/// round-trip the API rejects the second turn with HTTP 400 ("The
+/// reasoning_content in the thinking mode must be passed back to the API").
+/// See #3201.
+fn create_deepseek_from_registry(
+    config: &RegistryProviderConfig,
+) -> Result<Arc<dyn LlmProvider>, LlmError> {
+    use rig::providers::deepseek;
+
+    let api_key = config
+        .api_key
+        .as_ref()
+        .map(|k| k.expose_secret().to_string())
+        .ok_or_else(|| LlmError::AuthFailed {
+            provider: config.provider_id.clone(),
+        })?;
+
+    let client: deepseek::Client = if config.base_url.is_empty() {
+        deepseek::Client::new(&api_key)
+    } else {
+        deepseek::Client::builder()
+            .api_key(&api_key)
+            .base_url(&config.base_url)
+            .build()
+    }
+    .map_err(|e| LlmError::RequestFailed {
+        provider: config.provider_id.clone(),
+        reason: format!("Failed to create DeepSeek client: {e}"),
+    })?;
+
+    let model = client.completion_model(&config.model);
+
+    tracing::debug!(
+        provider = %config.provider_id,
+        model = %config.model,
+        base_url = if config.base_url.is_empty() { "default" } else { &config.base_url },
+        "Using DeepSeek provider (preserves reasoning_content across turns)"
+    );
+
+    Ok(Arc::new(
+        RigAdapter::new(model, &config.model)
+            .with_unsupported_params(config.unsupported_params.clone()),
+    ))
+}
+
+/// Build an OpenRouter provider via rig-core's dedicated OpenRouter client.
+///
+/// Routing through this client (rather than the generic OpenAI-compat path)
+/// preserves OpenRouter's `reasoning`, `reasoning_details`, and per-tool-call
+/// signatures across turns. The generic OpenAI client strips all of them, so
+/// any thinking-mode model accessed via OpenRouter (Claude with thinking,
+/// OpenAI o-series, DeepSeek-R1, Gemini 2.5+, Qwen QwQ, …) loses its
+/// reasoning artifacts on the assistant message and the next request fails
+/// the same way as #3201 / #3225.
+fn create_openrouter_from_registry(
+    config: &RegistryProviderConfig,
+) -> Result<Arc<dyn LlmProvider>, LlmError> {
+    use rig::providers::openrouter;
+
+    let api_key = config
+        .api_key
+        .as_ref()
+        .map(|k| k.expose_secret().to_string())
+        .ok_or_else(|| LlmError::AuthFailed {
+            provider: config.provider_id.clone(),
+        })?;
+
+    // OpenRouter attribution headers (`HTTP-Referer`, `X-Title`) and any other
+    // user-configured extras must follow the request through.
+    let mut extra_headers = reqwest::header::HeaderMap::new();
+    for (key, value) in &config.extra_headers {
+        let name = match reqwest::header::HeaderName::from_bytes(key.as_bytes()) {
+            Ok(n) => n,
+            Err(e) => {
+                tracing::warn!(header = %key, error = %e, "Skipping extra header: invalid name");
+                continue;
+            }
+        };
+        let val = match reqwest::header::HeaderValue::from_str(value) {
+            Ok(v) => v,
+            Err(e) => {
+                tracing::warn!(header = %key, error = %e, "Skipping extra header: invalid value");
+                continue;
+            }
+        };
+        extra_headers.insert(name, val);
+    }
+
+    let mut builder = openrouter::Client::builder().api_key(&api_key);
+    if !config.base_url.is_empty() {
+        builder = builder.base_url(&config.base_url);
+    }
+    if !extra_headers.is_empty() {
+        builder = builder.http_headers(extra_headers);
+    }
+
+    let client: openrouter::Client = builder.build().map_err(|e| LlmError::RequestFailed {
+        provider: config.provider_id.clone(),
+        reason: format!("Failed to create OpenRouter client: {e}"),
+    })?;
+
+    let model = client.completion_model(&config.model);
+
+    tracing::debug!(
+        provider = %config.provider_id,
+        model = %config.model,
+        base_url = if config.base_url.is_empty() { "default" } else { &config.base_url },
+        "Using OpenRouter provider (preserves reasoning + signatures across turns)"
+    );
+
+    Ok(Arc::new(
+        RigAdapter::new(model, &config.model)
+            .with_unsupported_params(config.unsupported_params.clone()),
+    ))
+}
+
+/// Build a Gemini provider via rig-core's dedicated Gemini client.
+///
+/// Routing through this client (rather than the generic OpenAI-compat path
+/// at `/v1beta/openai`) is what makes Gemini thinking-mode tool calling
+/// work: rig-core's Gemini implementation round-trips `thought_signature`
+/// on each `functionCall`. Without that round-trip the API rejects the
+/// next turn with HTTP 400 ("Function call is missing a thought_signature
+/// in functionCall parts"). See #3225.
+///
+/// This is API-key auth only (`GEMINI_API_KEY`). Users on Gemini OAuth go
+/// through the separate `gemini_oauth` backend.
+fn create_gemini_from_registry(
+    config: &RegistryProviderConfig,
+) -> Result<Arc<dyn LlmProvider>, LlmError> {
+    use rig::providers::gemini;
+
+    let api_key = config
+        .api_key
+        .as_ref()
+        .map(|k| k.expose_secret().to_string())
+        .ok_or_else(|| LlmError::AuthFailed {
+            provider: config.provider_id.clone(),
+        })?;
+
+    let client: gemini::Client = if config.base_url.is_empty() {
+        gemini::Client::new(&api_key)
+    } else {
+        gemini::Client::builder()
+            .api_key(&api_key)
+            .base_url(&config.base_url)
+            .build()
+    }
+    .map_err(|e| LlmError::RequestFailed {
+        provider: config.provider_id.clone(),
+        reason: format!("Failed to create Gemini client: {e}"),
+    })?;
+
+    let model = client.completion_model(&config.model);
+
+    tracing::debug!(
+        provider = %config.provider_id,
+        model = %config.model,
+        base_url = if config.base_url.is_empty() { "default" } else { &config.base_url },
+        "Using Gemini provider (preserves thought_signature across turns)"
+    );
+
+    Ok(Arc::new(
+        RigAdapter::new(model, &config.model)
+            .with_unsupported_params(config.unsupported_params.clone()),
+    ))
+}
+
 /// Create an OpenAI Codex provider with OAuth authentication.
 ///
 /// This is async because it needs to ensure authentication before

diff --git a/src/llm/registry.rs b/src/llm/registry.rs
@@ -39,6 +39,21 @@ pub enum ProviderProtocol {
     Ollama,
     /// GitHub Copilot API (OpenAI-compatible with token exchange).
     GithubCopilot,
+    /// DeepSeek API. Routes through rig-core's dedicated DeepSeek client,
+    /// which round-trips `reasoning_content` for thinking-mode models —
+    /// the generic OpenAI client strips it. (#3201)
+    DeepSeek,
+    /// Google Gemini native API. Routes through rig-core's dedicated Gemini
+    /// client, which round-trips `thought_signature` on tool calls —
+    /// the OpenAI-compat shim strips it. (#3225)
+    Gemini,
+    /// OpenRouter (multi-model gateway). Routes through rig-core's dedicated
+    /// OpenRouter client, which round-trips `reasoning`, `reasoning_details`
+    /// (Summary / Encrypted / Text), and per-tool-call signatures —
+    /// the generic OpenAI client strips all of them, breaking thinking-mode
+    /// tool calling on every reasoning model OpenRouter exposes (Claude with
+    /// thinking, OpenAI o-series, DeepSeek-R1, Gemini 2.5+, Qwen QwQ, …).
+    OpenRouter,
 }
 
 /// How the setup wizard should collect credentials for this provider.
@@ -478,6 +493,48 @@ mod tests {
         }
     }
 
+    /// Regression for #3201 / #3225 and the OpenRouter generalisation:
+    /// providers whose APIs return reasoning artifacts (DeepSeek's
+    /// `reasoning_content`, Gemini's `thought_signature`, OpenRouter's
+    /// `reasoning_details` + signatures) must NOT use the generic
+    /// `OpenAiCompletions` protocol. The OpenAI-compat path goes through
+    /// rig-core's OpenAI client, which strips those fields, breaking
+    /// multi-turn tool calling for every thinking-mode model these
+    /// providers expose. They must route through the dedicated rig-core
+    /// clients which round-trip the artifacts on the next request.
+    #[test]
+    fn reasoning_aware_providers_use_dedicated_protocol_not_openai_compat() {
+        let providers: Vec<ProviderDefinition> =
+            serde_json::from_str(include_str!("../../providers.json")).unwrap();
+        let by_id = |id: &str| providers.iter().find(|p| p.id == id).cloned();
+
+        let deepseek = by_id("deepseek").expect("deepseek entry must exist");
+        assert_eq!(
+            deepseek.protocol,
+            ProviderProtocol::DeepSeek,
+            "deepseek must use DeepSeek protocol — OpenAiCompletions strips \
+             reasoning_content and breaks thinking-mode tool calling (#3201)",
+        );
+
+        let gemini = by_id("gemini").expect("gemini entry must exist");
+        assert_eq!(
+            gemini.protocol,
+            ProviderProtocol::Gemini,
+            "gemini must use Gemini protocol — OpenAiCompletions strips \
+             thought_signature and breaks tool calling on thinking models (#3225)",
+        );
+
+        let openrouter = by_id("openrouter").expect("openrouter entry must exist");
+        assert_eq!(
+            openrouter.protocol,
+            ProviderProtocol::OpenRouter,
+            "openrouter must use OpenRouter protocol — OpenAiCompletions \
+             strips reasoning_details and tool-call signatures, breaking \
+             every thinking-mode model OpenRouter exposes (Claude with \
+             thinking, OpenAI o-series, DeepSeek-R1, Gemini 2.5+, Qwen QwQ)",
+        );
+    }
+
     #[test]
     fn test_openai_compatible_providers_have_base_url() {
         let providers: Vec<ProviderDefinition> =