From a5e7aa1342f9b0f51dce1a42f698038f7383e872 Mon Sep 17 00:00:00 2001 From: suyao Date: Thu, 27 Nov 2025 15:30:19 +0800 Subject: [PATCH 01/53] feat: Implement shared provider utilities and API host formatting - Added provider API host formatting utilities to handle differences between Cherry Studio and AI SDK. - Introduced functions for formatting provider API hosts, including support for Azure OpenAI and Vertex AI. - Created a simple API key rotator for managing API key rotation. - Developed shared provider initialization and mapping utilities for resolving provider IDs. - Implemented AI SDK configuration utilities for converting Cherry Studio providers to AI SDK configurations. - Added support for various providers including OpenRouter, Google Vertex AI, and Amazon Bedrock. - Enhanced error handling and logging in the unified messages service for better debugging. - Introduced functions for streaming and generating unified messages using AI SDK. --- .../shared/adapters/AiSdkToAnthropicSSE.ts | 593 ++++++++++++++++++ packages/shared/adapters/index.ts | 13 + packages/shared/api/index.ts | 173 +++++ .../shared}/provider/config/aihubmix.ts | 29 +- .../shared/provider/config/azure-anthropic.ts | 22 + packages/shared/provider/config/helper.ts | 32 + packages/shared/provider/config/index.ts | 6 + .../shared}/provider/config/newApi.ts | 24 +- packages/shared/provider/config/types.ts | 9 + .../provider/config/vertex-anthropic.ts | 19 + packages/shared/provider/detection.ts | 100 +++ packages/shared/provider/format.ts | 136 ++++ packages/shared/provider/index.ts | 48 ++ packages/shared/provider/initialization.ts | 107 ++++ packages/shared/provider/mapping.ts | 95 +++ packages/shared/provider/resolve.ts | 44 ++ packages/shared/provider/sdk-config.ts | 240 +++++++ packages/shared/provider/types.ts | 174 +++++ packages/shared/utils/index.ts | 1 + packages/shared/utils/naming.ts | 31 + src/main/apiServer/routes/messages.ts | 241 ++++++- src/main/apiServer/services/models.ts | 27 +- .../apiServer/services/unified-messages.ts | 455 ++++++++++++++ .../agents/services/claudecode/index.ts | 29 +- .../legacy/clients/gemini/VertexAPIClient.ts | 2 +- .../aiCore/provider/config/azure-anthropic.ts | 22 - .../src/aiCore/provider/config/helper.ts | 22 - .../src/aiCore/provider/config/index.ts | 10 +- .../src/aiCore/provider/config/types.ts | 9 - .../provider/config/vertext-anthropic.ts | 19 - src/renderer/src/aiCore/provider/factory.ts | 63 +- .../src/aiCore/provider/providerConfig.ts | 227 ++----- .../aiCore/provider/providerInitialization.ts | 112 +--- src/renderer/src/types/index.ts | 4 +- src/renderer/src/types/provider.ts | 158 +---- src/renderer/src/utils/api.ts | 178 +----- src/renderer/src/utils/naming.ts | 34 +- src/renderer/src/utils/provider.ts | 69 +- 38 files changed, 2681 insertions(+), 896 deletions(-) create mode 100644 packages/shared/adapters/AiSdkToAnthropicSSE.ts create mode 100644 packages/shared/adapters/index.ts create mode 100644 packages/shared/api/index.ts rename {src/renderer/src/aiCore => packages/shared}/provider/config/aihubmix.ts (53%) create mode 100644 packages/shared/provider/config/azure-anthropic.ts create mode 100644 packages/shared/provider/config/helper.ts create mode 100644 packages/shared/provider/config/index.ts rename {src/renderer/src/aiCore => packages/shared}/provider/config/newApi.ts (52%) create mode 100644 packages/shared/provider/config/types.ts create mode 100644 packages/shared/provider/config/vertex-anthropic.ts create mode 100644 
packages/shared/provider/detection.ts create mode 100644 packages/shared/provider/format.ts create mode 100644 packages/shared/provider/index.ts create mode 100644 packages/shared/provider/initialization.ts create mode 100644 packages/shared/provider/mapping.ts create mode 100644 packages/shared/provider/resolve.ts create mode 100644 packages/shared/provider/sdk-config.ts create mode 100644 packages/shared/provider/types.ts create mode 100644 packages/shared/utils/index.ts create mode 100644 packages/shared/utils/naming.ts create mode 100644 src/main/apiServer/services/unified-messages.ts delete mode 100644 src/renderer/src/aiCore/provider/config/azure-anthropic.ts delete mode 100644 src/renderer/src/aiCore/provider/config/helper.ts delete mode 100644 src/renderer/src/aiCore/provider/config/types.ts delete mode 100644 src/renderer/src/aiCore/provider/config/vertext-anthropic.ts
diff --git a/packages/shared/adapters/AiSdkToAnthropicSSE.ts b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
new file mode 100644
index 0000000000..38fab703ac
--- /dev/null
+++ b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
@@ -0,0 +1,593 @@
+/**
+ * AI SDK to Anthropic SSE Adapter
+ *
+ * Converts AI SDK's fullStream (TextStreamPart) events to Anthropic Messages API SSE format.
+ * This enables any AI provider supported by AI SDK to be exposed via Anthropic-compatible API.
+ *
+ * Anthropic SSE Event Flow:
+ * 1. message_start - Initial message with metadata
+ * 2. content_block_start - Begin a content block (text, tool_use, thinking)
+ * 3. content_block_delta - Incremental content updates
+ * 4. content_block_stop - End a content block
+ * 5. message_delta - Updates to overall message (stop_reason, usage)
+ * 6. message_stop - Stream complete
+ *
+ * @see https://docs.anthropic.com/en/api/messages-streaming
+ */
+
+import type {
+  ContentBlock,
+  InputJSONDelta,
+  Message,
+  MessageDeltaUsage,
+  RawContentBlockDeltaEvent,
+  RawContentBlockStartEvent,
+  RawContentBlockStopEvent,
+  RawMessageDeltaEvent,
+  RawMessageStartEvent,
+  RawMessageStopEvent,
+  RawMessageStreamEvent,
+  StopReason,
+  TextBlock,
+  TextDelta,
+  ThinkingBlock,
+  ThinkingDelta,
+  ToolUseBlock,
+  Usage
+} from '@anthropic-ai/sdk/resources/messages'
+import { loggerService } from '@logger'
+import type { TextStreamPart, ToolSet } from 'ai'
+
+const logger = loggerService.withContext('AiSdkToAnthropicSSE')
+
+interface ContentBlockState {
+  type: 'text' | 'tool_use' | 'thinking'
+  index: number
+  started: boolean
+  content: string
+  // For tool_use blocks
+  toolId?: string
+  toolName?: string
+  toolInput?: string
+}
+
+interface AdapterState {
+  messageId: string
+  model: string
+  inputTokens: number
+  outputTokens: number
+  currentBlockIndex: number
+  blocks: Map<number, ContentBlockState>
+  textBlockIndex: number | null
+  thinkingBlockIndex: number | null
+  toolBlocks: Map<string, number> // toolCallId -> blockIndex
+  stopReason: StopReason | null
+  hasEmittedMessageStart: boolean
+}
+
+// ============================================================================
+// Adapter Class
+// ============================================================================
+
+export type SSEEventCallback = (event: RawMessageStreamEvent) => void
+
+export interface AiSdkToAnthropicSSEOptions {
+  model: string
+  messageId?: string
+  inputTokens?: number
+  onEvent: SSEEventCallback
+}
+
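+// Illustrative usage sketch (assumes an AI SDK `streamText` result and an
+// Express-style `res`; neither is defined in this file):
+//
+//   const adapter = new AiSdkToAnthropicSSE({
+//     model: 'claude-sonnet',
+//     onEvent: (event) => res.write(formatSSEEvent(event))
+//   })
+//   await adapter.processStream(result.fullStream)
+//   res.write(formatSSEDone())
+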
+/**
+ * Adapter that converts AI SDK fullStream events to Anthropic SSE events
+ */
+export class AiSdkToAnthropicSSE {
+  private state: AdapterState
+  private onEvent: SSEEventCallback
+
+  constructor(options: AiSdkToAnthropicSSEOptions) {
+    this.onEvent = options.onEvent
+    this.state = {
+      messageId: options.messageId || `msg_${Date.now()}_${Math.random().toString(36).substring(2, 11)}`,
+      model: options.model,
+      inputTokens: options.inputTokens || 0,
+      outputTokens: 0,
+      currentBlockIndex: 0,
+      blocks: new Map(),
+      textBlockIndex: null,
+      thinkingBlockIndex: null,
+      toolBlocks: new Map(),
+      stopReason: null,
+      hasEmittedMessageStart: false
+    }
+  }
+
+  /**
+   * Process the AI SDK stream and emit Anthropic SSE events
+   */
+  async processStream(fullStream: ReadableStream<TextStreamPart<ToolSet>>): Promise<void> {
+    const reader = fullStream.getReader()
+
+    try {
+      // Emit message_start at the beginning
+      this.emitMessageStart()
+
+      while (true) {
+        const { done, value } = await reader.read()
+
+        if (done) {
+          break
+        }
+
+        this.processChunk(value)
+      }
+
+      // Ensure all blocks are closed and emit final events
+      this.finalize()
+    } finally {
+      reader.releaseLock()
+    }
+  }
+
+  /**
+   * Process a single AI SDK chunk and emit corresponding Anthropic events
+   */
+  private processChunk(chunk: TextStreamPart<ToolSet>): void {
+    logger.silly('AiSdkToAnthropicSSE - Processing chunk:', chunk)
+    switch (chunk.type) {
+      // === Text Events ===
+      case 'text-start':
+        this.startTextBlock()
+        break
+
+      case 'text-delta':
+        this.emitTextDelta(chunk.text || '')
+        break
+
+      case 'text-end':
+        this.stopTextBlock()
+        break
+
+      // === Reasoning/Thinking Events ===
+      case 'reasoning-start':
+        this.startThinkingBlock()
+        break
+
+      case 'reasoning-delta':
+        this.emitThinkingDelta(chunk.text || '')
+        break
+
+      case 'reasoning-end':
+        this.stopThinkingBlock()
+        break
+
+      // === Tool Events ===
+      case 'tool-call':
+        this.handleToolCall({
+          type: 'tool-call',
+          toolCallId: chunk.toolCallId,
+          toolName: chunk.toolName,
+          // AI SDK uses 'args' in some versions and 'input' in others
+          args: 'args' in chunk ? 
chunk.args : (chunk as any).input + }) + break + + case 'tool-result': + // Tool results are handled separately in Anthropic API + // They come from user messages, not assistant stream + break + + // === Completion Events === + case 'finish-step': + if (chunk.finishReason === 'tool-calls') { + this.state.stopReason = 'tool_use' + } + break + + case 'finish': + this.handleFinish(chunk) + break + + // === Error Events === + case 'error': + // Anthropic doesn't have a standard error event in the stream + // Errors are typically sent as separate HTTP responses + // For now, we'll just log and continue + break + + // Ignore other event types + default: + break + } + } + + private emitMessageStart(): void { + if (this.state.hasEmittedMessageStart) return + + this.state.hasEmittedMessageStart = true + + const usage: Usage = { + input_tokens: this.state.inputTokens, + output_tokens: 0, + cache_creation_input_tokens: 0, + cache_read_input_tokens: 0, + server_tool_use: null + } + + const message: Message = { + id: this.state.messageId, + type: 'message', + role: 'assistant', + content: [], + model: this.state.model, + stop_reason: null, + stop_sequence: null, + usage + } + + const event: RawMessageStartEvent = { + type: 'message_start', + message + } + + this.onEvent(event) + } + + private startTextBlock(): void { + // If we already have a text block, don't create another + if (this.state.textBlockIndex !== null) return + + const index = this.state.currentBlockIndex++ + this.state.textBlockIndex = index + this.state.blocks.set(index, { + type: 'text', + index, + started: true, + content: '' + }) + + const contentBlock: TextBlock = { + type: 'text', + text: '', + citations: null + } + + const event: RawContentBlockStartEvent = { + type: 'content_block_start', + index, + content_block: contentBlock + } + + this.onEvent(event) + } + + private emitTextDelta(text: string): void { + if (!text) return + + // Auto-start text block if not started + if (this.state.textBlockIndex === null) { + this.startTextBlock() + } + + const index = this.state.textBlockIndex! + const block = this.state.blocks.get(index) + if (block) { + block.content += text + } + + const delta: TextDelta = { + type: 'text_delta', + text + } + + const event: RawContentBlockDeltaEvent = { + type: 'content_block_delta', + index, + delta + } + + this.onEvent(event) + } + + private stopTextBlock(): void { + if (this.state.textBlockIndex === null) return + + const index = this.state.textBlockIndex + + const event: RawContentBlockStopEvent = { + type: 'content_block_stop', + index + } + + this.onEvent(event) + this.state.textBlockIndex = null + } + + private startThinkingBlock(): void { + if (this.state.thinkingBlockIndex !== null) return + + const index = this.state.currentBlockIndex++ + this.state.thinkingBlockIndex = index + this.state.blocks.set(index, { + type: 'thinking', + index, + started: true, + content: '' + }) + + const contentBlock: ThinkingBlock = { + type: 'thinking', + thinking: '', + signature: '' + } + + const event: RawContentBlockStartEvent = { + type: 'content_block_start', + index, + content_block: contentBlock + } + + this.onEvent(event) + } + + private emitThinkingDelta(text: string): void { + if (!text) return + + // Auto-start thinking block if not started + if (this.state.thinkingBlockIndex === null) { + this.startThinkingBlock() + } + + const index = this.state.thinkingBlockIndex! 
+ const block = this.state.blocks.get(index) + if (block) { + block.content += text + } + + const delta: ThinkingDelta = { + type: 'thinking_delta', + thinking: text + } + + const event: RawContentBlockDeltaEvent = { + type: 'content_block_delta', + index, + delta + } + + this.onEvent(event) + } + + private stopThinkingBlock(): void { + if (this.state.thinkingBlockIndex === null) return + + const index = this.state.thinkingBlockIndex + + const event: RawContentBlockStopEvent = { + type: 'content_block_stop', + index + } + + this.onEvent(event) + this.state.thinkingBlockIndex = null + } + + private handleToolCall(chunk: { type: 'tool-call'; toolCallId: string; toolName: string; args: unknown }): void { + const { toolCallId, toolName, args } = chunk + + // Check if we already have this tool call + if (this.state.toolBlocks.has(toolCallId)) { + return + } + + const index = this.state.currentBlockIndex++ + this.state.toolBlocks.set(toolCallId, index) + + const inputJson = JSON.stringify(args) + + this.state.blocks.set(index, { + type: 'tool_use', + index, + started: true, + content: inputJson, + toolId: toolCallId, + toolName, + toolInput: inputJson + }) + + // Emit content_block_start for tool_use + const contentBlock: ToolUseBlock = { + type: 'tool_use', + id: toolCallId, + name: toolName, + input: {} + } + + const startEvent: RawContentBlockStartEvent = { + type: 'content_block_start', + index, + content_block: contentBlock + } + + this.onEvent(startEvent) + + // Emit the full input as a delta (Anthropic streams JSON incrementally) + const delta: InputJSONDelta = { + type: 'input_json_delta', + partial_json: inputJson + } + + const deltaEvent: RawContentBlockDeltaEvent = { + type: 'content_block_delta', + index, + delta + } + + this.onEvent(deltaEvent) + + // Emit content_block_stop + const stopEvent: RawContentBlockStopEvent = { + type: 'content_block_stop', + index + } + + this.onEvent(stopEvent) + + // Mark that we have tool use + this.state.stopReason = 'tool_use' + } + + private handleFinish(chunk: { + type: 'finish' + finishReason?: string + totalUsage?: { + inputTokens?: number + outputTokens?: number + } + }): void { + // Update usage + if (chunk.totalUsage) { + this.state.inputTokens = chunk.totalUsage.inputTokens || 0 + this.state.outputTokens = chunk.totalUsage.outputTokens || 0 + } + + // Determine finish reason + if (!this.state.stopReason) { + switch (chunk.finishReason) { + case 'stop': + case 'end_turn': + this.state.stopReason = 'end_turn' + break + case 'length': + case 'max_tokens': + this.state.stopReason = 'max_tokens' + break + case 'tool-calls': + this.state.stopReason = 'tool_use' + break + default: + this.state.stopReason = 'end_turn' + } + } + } + + private finalize(): void { + // Close any open blocks + if (this.state.textBlockIndex !== null) { + this.stopTextBlock() + } + if (this.state.thinkingBlockIndex !== null) { + this.stopThinkingBlock() + } + + // Emit message_delta with final stop reason and usage + const usage: MessageDeltaUsage = { + output_tokens: this.state.outputTokens, + input_tokens: null, + cache_creation_input_tokens: null, + cache_read_input_tokens: null, + server_tool_use: null + } + + const messageDeltaEvent: RawMessageDeltaEvent = { + type: 'message_delta', + delta: { + stop_reason: this.state.stopReason || 'end_turn', + stop_sequence: null + }, + usage + } + + this.onEvent(messageDeltaEvent) + + // Emit message_stop + const messageStopEvent: RawMessageStopEvent = { + type: 'message_stop' + } + + this.onEvent(messageStopEvent) + } + + /** + * 
Set input token count (typically from prompt)
+   */
+  setInputTokens(count: number): void {
+    this.state.inputTokens = count
+  }
+
+  /**
+   * Get the current message ID
+   */
+  getMessageId(): string {
+    return this.state.messageId
+  }
+
+  /**
+   * Build a complete Message object for non-streaming responses
+   */
+  buildNonStreamingResponse(): Message {
+    const content: ContentBlock[] = []
+
+    // Collect all content blocks in order
+    const sortedBlocks = Array.from(this.state.blocks.values()).sort((a, b) => a.index - b.index)
+
+    for (const block of sortedBlocks) {
+      switch (block.type) {
+        case 'text':
+          content.push({
+            type: 'text',
+            text: block.content,
+            citations: null
+          } as TextBlock)
+          break
+        case 'thinking':
+          content.push({
+            type: 'thinking',
+            thinking: block.content
+          } as ThinkingBlock)
+          break
+        case 'tool_use':
+          content.push({
+            type: 'tool_use',
+            id: block.toolId!,
+            name: block.toolName!,
+            input: JSON.parse(block.toolInput || '{}')
+          } as ToolUseBlock)
+          break
+      }
+    }
+
+    return {
+      id: this.state.messageId,
+      type: 'message',
+      role: 'assistant',
+      content,
+      model: this.state.model,
+      stop_reason: this.state.stopReason || 'end_turn',
+      stop_sequence: null,
+      usage: {
+        input_tokens: this.state.inputTokens,
+        output_tokens: this.state.outputTokens,
+        cache_creation_input_tokens: 0,
+        cache_read_input_tokens: 0,
+        server_tool_use: null
+      }
+    }
+  }
+}
+
+/**
+ * Format an Anthropic SSE event for HTTP streaming
+ */
+export function formatSSEEvent(event: RawMessageStreamEvent): string {
+  return `event: ${event.type}\ndata: ${JSON.stringify(event)}\n\n`
+}
+
+/**
+ * Create a done marker for SSE stream
+ */
+export function formatSSEDone(): string {
+  return 'data: [DONE]\n\n'
+}
+
+export default AiSdkToAnthropicSSE
diff --git a/packages/shared/adapters/index.ts b/packages/shared/adapters/index.ts
new file mode 100644
index 0000000000..a19db9594e
--- /dev/null
+++ b/packages/shared/adapters/index.ts
@@ -0,0 +1,13 @@
+/**
+ * Shared Adapters
+ *
+ * This module exports adapters for converting between different AI API formats.
+ */
+
+export {
+  AiSdkToAnthropicSSE,
+  type AiSdkToAnthropicSSEOptions,
+  formatSSEDone,
+  formatSSEEvent,
+  type SSEEventCallback
+} from './AiSdkToAnthropicSSE'
diff --git a/packages/shared/api/index.ts b/packages/shared/api/index.ts
new file mode 100644
index 0000000000..0cf652b427
--- /dev/null
+++ b/packages/shared/api/index.ts
@@ -0,0 +1,173 @@
+/**
+ * Shared API Utilities
+ *
+ * Common utilities for API URL formatting and validation.
+ * Used by both main process (API Server) and renderer.
+ */
+
+import type { MinimalProvider } from '@shared/provider'
+import { trim } from 'lodash'
+
+// Supported endpoints for routing
+export const SUPPORTED_IMAGE_ENDPOINT_LIST = ['images/generations', 'images/edits', 'predict'] as const
+export const SUPPORTED_ENDPOINT_LIST = [
+  'chat/completions',
+  'responses',
+  'messages',
+  'generateContent',
+  'streamGenerateContent',
+  ...SUPPORTED_IMAGE_ENDPOINT_LIST
+] as const
+
+/**
+ * Removes the trailing slash from a URL string if it exists.
+ */
+export function withoutTrailingSlash<T extends string>(url: T): T {
+  return url.replace(/\/$/, '') as T
+}
+
+/**
+ * Checks if the host path contains a version string (e.g., /v1, /v2beta).
+ */
+export function hasAPIVersion(host?: string): boolean {
+  if (!host) return false
+
+  const versionRegex = /\/v\d+(?:alpha|beta)?(?=\/|$)/i
+
+  try {
+    const url = new URL(host)
+    return versionRegex.test(url.pathname)
+  } catch {
+    return versionRegex.test(host)
+  }
+}
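+
+// Illustrative examples (based on the version regex above):
+//   hasAPIVersion('https://api.openai.com/v1')         // true
+//   hasAPIVersion('https://example.com/v2beta/models') // true
+//   hasAPIVersion('https://api.openai.com')            // false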
+
+/**
+ * Formats the Azure OpenAI API host address.
+ */
+export function formatAzureOpenAIApiHost(host: string): string {
+  const normalizedHost = withoutTrailingSlash(host)
+    ?.replace(/\/v1$/, '')
+    .replace(/\/openai$/, '')
+  // NOTE: the AI SDK will append `v1` itself
+  return formatApiHost(normalizedHost + '/openai', false)
+}
+
+export function formatVertexApiHost(provider: MinimalProvider, project: string, location: string): string {
+  const { apiHost } = provider
+  const trimmedHost = withoutTrailingSlash(trim(apiHost))
+  if (!trimmedHost || trimmedHost.endsWith('aiplatform.googleapis.com')) {
+    const host =
+      location == 'global' ? 'https://aiplatform.googleapis.com' : `https://${location}-aiplatform.googleapis.com`
+    return `${formatApiHost(host)}/projects/${project}/locations/${location}`
+  }
+  return formatApiHost(trimmedHost)
+}
+
+/**
+ * Formats an API host URL by normalizing it and optionally appending an API version.
+ *
+ * @param host - The API host URL to format
+ * @param isSupportedAPIVersion - Whether the API version is supported. Defaults to `true`.
+ * @param apiVersion - The API version to append if needed. Defaults to `'v1'`.
+ *
+ * @example
+ * formatApiHost('https://api.example.com/') // Returns 'https://api.example.com/v1'
+ * formatApiHost('https://api.example.com#') // Returns 'https://api.example.com#'
+ * formatApiHost('https://api.example.com/v2', true, 'v1') // Returns 'https://api.example.com/v2'
+ */
+export function formatApiHost(host?: string, isSupportedAPIVersion: boolean = true, apiVersion: string = 'v1'): string {
+  const normalizedHost = withoutTrailingSlash((host || '').trim())
+  if (!normalizedHost) {
+    return ''
+  }
+
+  if (normalizedHost.endsWith('#') || !isSupportedAPIVersion || hasAPIVersion(normalizedHost)) {
+    return normalizedHost
+  }
+  return `${normalizedHost}/${apiVersion}`
+}
+
+/**
+ * Converts an API host URL into separate base URL and endpoint components.
+ *
+ * This function extracts endpoint information from a composite API host string.
+ * If the host ends with '#', it attempts to match the preceding part against the supported endpoint list.
+ * + * @param apiHost - The API host string to parse + * @returns An object containing: + * - `baseURL`: The base URL without the endpoint suffix + * - `endpoint`: The matched endpoint identifier, or empty string if no match found + * + * @example + * routeToEndpoint('https://api.example.com/openai/chat/completions#') + * // Returns: { baseURL: 'https://api.example.com/v1', endpoint: 'chat/completions' } + * + * @example + * routeToEndpoint('https://api.example.com/v1') + * // Returns: { baseURL: 'https://api.example.com/v1', endpoint: '' } + */ +export function routeToEndpoint(apiHost: string): { baseURL: string; endpoint: string } { + const trimmedHost = (apiHost || '').trim() + if (!trimmedHost.endsWith('#')) { + return { baseURL: trimmedHost, endpoint: '' } + } + // Remove trailing # + const host = trimmedHost.slice(0, -1) + const endpointMatch = SUPPORTED_ENDPOINT_LIST.find((endpoint) => host.endsWith(endpoint)) + if (!endpointMatch) { + const baseURL = withoutTrailingSlash(host) + return { baseURL, endpoint: '' } + } + const baseSegment = host.slice(0, host.length - endpointMatch.length) + const baseURL = withoutTrailingSlash(baseSegment).replace(/:$/, '') // Remove trailing colon (gemini special case) + return { baseURL, endpoint: endpointMatch } +} + +/** + * Gets the AI SDK compatible base URL from a provider's apiHost. + * + * AI SDK expects baseURL WITH version suffix (e.g., /v1). + * This function: + * 1. Handles '#' endpoint routing format + * 2. Ensures the URL has a version suffix (adds /v1 if missing) + * + * @param apiHost - The provider's apiHost value (may or may not have /v1) + * @param apiVersion - The API version to use if missing. Defaults to 'v1'. + * @returns The baseURL suitable for AI SDK (with version suffix) + * + * @example + * getAiSdkBaseUrl('https://api.openai.com') // 'https://api.openai.com/v1' + * getAiSdkBaseUrl('https://api.openai.com/v1') // 'https://api.openai.com/v1' + * getAiSdkBaseUrl('https://api.example.com/chat/completions#') // 'https://api.example.com' + */ +export function getAiSdkBaseUrl(apiHost: string, apiVersion: string = 'v1'): string { + // First handle '#' endpoint routing format + const { baseURL } = routeToEndpoint(apiHost) + + // If already has version, return as-is + if (hasAPIVersion(baseURL)) { + return withoutTrailingSlash(baseURL) + } + + // Add version suffix + return `${withoutTrailingSlash(baseURL)}/${apiVersion}` +} + +/** + * Validates an API host address. 
+ *
+ * @param apiHost - The API host address to validate
+ * @returns true if valid URL with http/https protocol, false otherwise
+ */
+export function validateApiHost(apiHost: string): boolean {
+  if (!apiHost || !apiHost.trim()) {
+    return true // Allow empty
+  }
+  try {
+    const url = new URL(apiHost.trim())
+    return url.protocol === 'http:' || url.protocol === 'https:'
+  } catch {
+    return false
+  }
+}
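+
+// Illustrative examples:
+//   validateApiHost('https://api.example.com') // true
+//   validateApiHost('')                        // true (empty is allowed)
+//   validateApiHost('not a url')               // false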
diff --git a/src/renderer/src/aiCore/provider/config/aihubmix.ts b/packages/shared/provider/config/aihubmix.ts
similarity index 53%
rename from src/renderer/src/aiCore/provider/config/aihubmix.ts
rename to packages/shared/provider/config/aihubmix.ts
index 8feed89909..5214e8d06a 100644
--- a/src/renderer/src/aiCore/provider/config/aihubmix.ts
+++ b/packages/shared/provider/config/aihubmix.ts
@@ -1,13 +1,13 @@
 /**
  * AiHubMix rule set
  */
-import { isOpenAILLMModel } from '@renderer/config/models'
-import type { Provider } from '@renderer/types'
+import { getLowerBaseModelName } from '@shared/utils/naming'
+import type { MinimalModel, MinimalProvider } from '../types'
 import { provider2Provider, startsWith } from './helper'
 import type { RuleSet } from './types'
 
-const extraProviderConfig = (provider: Provider) => {
+const extraProviderConfig = <P extends MinimalProvider>(provider: P) => {
+  return {
+    ...provider,
+    extra_headers: {
@@ -17,11 +17,23 @@ const extraProviderConfig = (provider: Provider) => {
   }
 }
+
+function isOpenAILLMModel<M extends MinimalModel>(model: M): boolean {
+  const modelId = getLowerBaseModelName(model.id)
+  const reasonings = ['o1', 'o3', 'o4', 'gpt-oss']
+  if (reasonings.some((r) => modelId.includes(r))) {
+    return true
+  }
+  if (modelId.includes('gpt')) {
+    return true
+  }
+  return false
+}
+
 const AIHUBMIX_RULES: RuleSet = {
   rules: [
     {
       match: startsWith('claude'),
-      provider: (provider: Provider) => {
+      provider: (provider) => {
         return extraProviderConfig({
           ...provider,
           type: 'anthropic'
@@ -34,7 +46,7 @@ const AIHUBMIX_RULES: RuleSet = {
         !model.id.endsWith('-nothink') &&
         !model.id.endsWith('-search') &&
         !model.id.includes('embedding'),
-      provider: (provider: Provider) => {
+      provider: (provider) => {
         return extraProviderConfig({
           ...provider,
           type: 'gemini',
@@ -44,7 +56,7 @@ const AIHUBMIX_RULES: RuleSet = {
     },
     {
       match: isOpenAILLMModel,
-      provider: (provider: Provider) => {
+      provider: (provider) => {
        return extraProviderConfig({
          ...provider,
          type: 'openai-response'
@@ -52,7 +64,8 @@ const AIHUBMIX_RULES: RuleSet = {
      }
    }
  ],
-  fallbackRule: (provider: Provider) => extraProviderConfig(provider)
+  fallbackRule: (provider) => extraProviderConfig(provider)
 }
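+// e.g. (illustrative): a model id starting with 'claude' matches the first rule,
+// so the provider is rewritten to type 'anthropic' with the shared extra headers applied.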
-export const aihubmixProviderCreator = provider2Provider.bind(null, AIHUBMIX_RULES)
+export const aihubmixProviderCreator = <P extends MinimalProvider>
(model: MinimalModel, provider: P): P => + provider2Provider(AIHUBMIX_RULES, model, provider) diff --git a/packages/shared/provider/config/azure-anthropic.ts b/packages/shared/provider/config/azure-anthropic.ts new file mode 100644 index 0000000000..e176614df3 --- /dev/null +++ b/packages/shared/provider/config/azure-anthropic.ts @@ -0,0 +1,22 @@ +import type { MinimalModel, MinimalProvider, ProviderType } from '../types' +import { provider2Provider, startsWith } from './helper' +import type { RuleSet } from './types' + +// https://platform.claude.com/docs/en/build-with-claude/claude-in-microsoft-foundry +const AZURE_ANTHROPIC_RULES: RuleSet = { + rules: [ + { + match: startsWith('claude'), + provider: (provider: MinimalProvider) => ({ + ...provider, + type: 'anthropic' as ProviderType, + apiHost: provider.apiHost + 'anthropic/v1', + id: 'azure-anthropic' + }) + } + ], + fallbackRule: (provider: MinimalProvider) => provider +} + +export const azureAnthropicProviderCreator =
<P extends MinimalProvider>
(model: MinimalModel, provider: P): P =>
+  provider2Provider(AZURE_ANTHROPIC_RULES, model, provider)
diff --git a/packages/shared/provider/config/helper.ts b/packages/shared/provider/config/helper.ts
new file mode 100644
index 0000000000..4e821a6c8f
--- /dev/null
+++ b/packages/shared/provider/config/helper.ts
@@ -0,0 +1,32 @@
+import type { MinimalModel, MinimalProvider } from '../types'
+import type { RuleSet } from './types'
+
+export const startsWith =
+  (prefix: string) =>
+  <M extends MinimalModel>(model: M) =>
+    model.id.toLowerCase().startsWith(prefix.toLowerCase())
+
+export const endpointIs =
+  (type: string) =>
+  <M extends MinimalModel>(model: M) =>
+    model.endpoint_type === type
+
+/**
+ * Resolve the provider that a model maps to
+ * @param ruleSet the rule set
+ * @param model the model
+ * @param provider the original provider
+ * @returns the resolved provider
+ */
+export function provider2Provider<
+  M extends MinimalModel,
+  R extends MinimalProvider,
+  P extends R = R
+>(ruleSet: RuleSet<M, R>, model: M, provider: P): P {
+  for (const rule of ruleSet.rules) {
+    if (rule.match(model)) {
+      return rule.provider(provider) as P
+    }
+  }
+  return ruleSet.fallbackRule(provider) as P
+}
diff --git a/packages/shared/provider/config/index.ts b/packages/shared/provider/config/index.ts
new file mode 100644
index 0000000000..1273319ecd
--- /dev/null
+++ b/packages/shared/provider/config/index.ts
@@ -0,0 +1,6 @@
+export { aihubmixProviderCreator } from './aihubmix'
+export { azureAnthropicProviderCreator } from './azure-anthropic'
+export { endpointIs, provider2Provider, startsWith } from './helper'
+export { newApiResolverCreator } from './newApi'
+export type { RuleSet } from './types'
+export { vertexAnthropicProviderCreator } from './vertex-anthropic'
diff --git a/src/renderer/src/aiCore/provider/config/newApi.ts b/packages/shared/provider/config/newApi.ts
similarity index 52%
rename from src/renderer/src/aiCore/provider/config/newApi.ts
rename to packages/shared/provider/config/newApi.ts
index 97de62597d..fd1b74085f 100644
--- a/src/renderer/src/aiCore/provider/config/newApi.ts
+++ b/packages/shared/provider/config/newApi.ts
@@ -1,8 +1,7 @@
 /**
  * NewAPI rule set
  */
-import type { Provider } from '@renderer/types'
-
+import type { MinimalModel, MinimalProvider, ProviderType } from '../types'
 import { endpointIs, provider2Provider } from './helper'
 import type { RuleSet } from './types'
@@ -10,42 +9,43 @@
 const NEWAPI_RULES: RuleSet = {
   rules: [
     {
       match: endpointIs('anthropic'),
-      provider: (provider: Provider) => {
+      provider: (provider) => {
         return {
           ...provider,
-          type: 'anthropic'
+          type: 'anthropic' as ProviderType
         }
       }
     },
     {
       match: endpointIs('gemini'),
-      provider: (provider: Provider) => {
+      provider: (provider) => {
         return {
           ...provider,
-          type: 'gemini'
+          type: 'gemini' as ProviderType
        }
      }
    },
    {
      match: endpointIs('openai-response'),
-      provider: (provider: Provider) => {
+      provider: (provider) => {
        return {
          ...provider,
-          type: 'openai-response'
+          type: 'openai-response' as ProviderType
        }
      }
    },
    {
      match: (model) => endpointIs('openai')(model) || endpointIs('image-generation')(model),
-      provider: (provider: Provider) => {
+      provider: (provider) => {
        return {
          ...provider,
-          type: 'openai'
+          type: 'openai' as ProviderType
        }
      }
    }
  ],
-  fallbackRule: (provider: Provider) => provider
+  fallbackRule: (provider) => provider
 }
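+// e.g. (illustrative): a model whose endpoint_type is 'anthropic' rewrites the
+// provider's type to 'anthropic'; models with no matching rule pass through unchanged.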
-export const newApiResolverCreator = provider2Provider.bind(null, NEWAPI_RULES)
+export const newApiResolverCreator = <P extends MinimalProvider>
(model: MinimalModel, provider: P): P =>
+  provider2Provider(NEWAPI_RULES, model, provider)
diff --git a/packages/shared/provider/config/types.ts b/packages/shared/provider/config/types.ts
new file mode 100644
index 0000000000..fdb1309869
--- /dev/null
+++ b/packages/shared/provider/config/types.ts
@@ -0,0 +1,9 @@
+import type { MinimalModel, MinimalProvider } from '../types'
+
+export interface RuleSet<M extends MinimalModel = MinimalModel, P extends MinimalProvider = MinimalProvider> {
+  rules: Array<{
+    match: (model: M) => boolean
+    provider: (provider: P) => P
+  }>
+  fallbackRule: (provider: P) => P
+}
diff --git a/packages/shared/provider/config/vertex-anthropic.ts b/packages/shared/provider/config/vertex-anthropic.ts
new file mode 100644
index 0000000000..242ba2a9f5
--- /dev/null
+++ b/packages/shared/provider/config/vertex-anthropic.ts
@@ -0,0 +1,19 @@
+import type { MinimalModel, MinimalProvider } from '../types'
+import { provider2Provider, startsWith } from './helper'
+import type { RuleSet } from './types'
+
+const VERTEX_ANTHROPIC_RULES: RuleSet = {
+  rules: [
+    {
+      match: startsWith('claude'),
+      provider: (provider: MinimalProvider) => ({
+        ...provider,
+        id: 'google-vertex-anthropic'
+      })
+    }
+  ],
+  fallbackRule: (provider: MinimalProvider) => provider
+}
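+
+// e.g. (illustrative): on Vertex AI, a 'claude-*' model is re-routed to the
+// 'google-vertex-anthropic' AI SDK provider id; everything else passes through.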
+
+export const vertexAnthropicProviderCreator = <P extends MinimalProvider>
(model: MinimalModel, provider: P): P => + provider2Provider(VERTEX_ANTHROPIC_RULES, model, provider) diff --git a/packages/shared/provider/detection.ts b/packages/shared/provider/detection.ts new file mode 100644 index 0000000000..19fff2dff9 --- /dev/null +++ b/packages/shared/provider/detection.ts @@ -0,0 +1,100 @@ +/** + * Provider Type Detection Utilities + * + * Functions to detect provider types based on provider configuration. + * These are pure functions that only depend on provider.type and provider.id. + * + * NOTE: These functions should match the logic in @renderer/utils/provider.ts + */ + +import type { MinimalProvider } from './types' + +/** + * Check if provider is Anthropic type + */ +export function isAnthropicProvider
<P extends MinimalProvider>
(provider: P): boolean { + return provider.type === 'anthropic' +} + +/** + * Check if provider is OpenAI Response type (openai-response) + * NOTE: This matches isOpenAIProvider in renderer/utils/provider.ts + */ +export function isOpenAIProvider
<P extends MinimalProvider>
(provider: P): boolean { + return provider.type === 'openai-response' +} + +/** + * Check if provider is Gemini type + */ +export function isGeminiProvider
<P extends MinimalProvider>
(provider: P): boolean { + return provider.type === 'gemini' +} + +/** + * Check if provider is Azure OpenAI type + */ +export function isAzureOpenAIProvider
<P extends MinimalProvider>
(provider: P): boolean { + return provider.type === 'azure-openai' +} + +/** + * Check if provider is Vertex AI type + */ +export function isVertexProvider
<P extends MinimalProvider>
(provider: P): boolean { + return provider.type === 'vertexai' +} + +/** + * Check if provider is AWS Bedrock type + */ +export function isAwsBedrockProvider
<P extends MinimalProvider>
(provider: P): boolean { + return provider.type === 'aws-bedrock' +} + +/** + * Check if provider is AI Gateway type + */ +export function isAIGatewayProvider
<P extends MinimalProvider>
(provider: P): boolean { + return provider.type === 'ai-gateway' +} + +/** + * Check if Azure OpenAI provider uses responses endpoint + * Matches isAzureResponsesEndpoint in renderer/utils/provider.ts + */ +export function isAzureResponsesEndpoint
<P extends MinimalProvider>
(provider: P): boolean { + return provider.apiVersion === 'preview' || provider.apiVersion === 'v1' +} + +/** + * Check if provider is Cherry AI type + * Matches isCherryAIProvider in renderer/utils/provider.ts + */ +export function isCherryAIProvider
<P extends MinimalProvider>
(provider: P): boolean { + return provider.id === 'cherryai' +} + +/** + * Check if provider is Perplexity type + * Matches isPerplexityProvider in renderer/utils/provider.ts + */ +export function isPerplexityProvider
<P extends MinimalProvider>
(provider: P): boolean { + return provider.id === 'perplexity' +} + +/** + * Check if provider is new-api type (supports multiple backends) + * Matches isNewApiProvider in renderer/utils/provider.ts + */ +export function isNewApiProvider
<P extends MinimalProvider>
(provider: P): boolean { + return ['new-api', 'cherryin'].includes(provider.id) || provider.type === ('new-api' as string) +} + +/** + * Check if provider is OpenAI compatible + * Matches isOpenAICompatibleProvider in renderer/utils/provider.ts + */ +export function isOpenAICompatibleProvider
<P extends MinimalProvider>
(provider: P): boolean {
+  return ['openai', 'new-api', 'mistral'].includes(provider.type)
+}
diff --git a/packages/shared/provider/format.ts b/packages/shared/provider/format.ts
new file mode 100644
index 0000000000..72e768d9b3
--- /dev/null
+++ b/packages/shared/provider/format.ts
@@ -0,0 +1,136 @@
+/**
+ * Provider API Host Formatting
+ *
+ * Utilities for formatting provider API hosts to work with AI SDK.
+ * These handle the differences between how Cherry Studio stores API hosts
+ * and how AI SDK expects them.
+ */
+
+import {
+  formatApiHost,
+  formatAzureOpenAIApiHost,
+  formatVertexApiHost,
+  routeToEndpoint,
+  withoutTrailingSlash
+} from '../api'
+import {
+  isAnthropicProvider,
+  isAzureOpenAIProvider,
+  isCherryAIProvider,
+  isGeminiProvider,
+  isPerplexityProvider,
+  isVertexProvider
+} from './detection'
+import type { MinimalProvider } from './types'
+import { SystemProviderIds } from './types'
+
+/**
+ * Interface for environment-specific implementations
+ * Renderer and Main process can provide their own implementations
+ */
+export interface ProviderFormatContext {
+  vertex: {
+    project: string
+    location: string
+  }
+}
+
+/**
+ * Default Azure OpenAI API host formatter
+ */
+export function defaultFormatAzureOpenAIApiHost(host: string): string {
+  const normalizedHost = withoutTrailingSlash(host)
+    ?.replace(/\/v1$/, '')
+    .replace(/\/openai$/, '')
+  // AI SDK will add /v1
+  return formatApiHost(normalizedHost + '/openai', false)
+}
+
+/**
+ * Format provider API host for AI SDK
+ *
+ * This function normalizes the apiHost to work with AI SDK.
+ * Different providers have different requirements:
+ * - Most providers: add /v1 suffix
+ * - Gemini: add /v1beta suffix
+ * - Some providers: no suffix needed
+ *
+ * @param provider - The provider to format
+ * @param context - Optional context with environment-specific implementations
+ * @returns Provider with formatted apiHost (and anthropicApiHost if applicable)
+ */
+export function formatProviderApiHost<T extends MinimalProvider>(provider: T, context: ProviderFormatContext): T {
+  const formatted = { ...provider }
+
+  // Format anthropicApiHost if present
+  if (formatted.anthropicApiHost) {
+    formatted.anthropicApiHost = formatApiHost(formatted.anthropicApiHost)
+  }
+
+  // Format based on provider type
+  if (isAnthropicProvider(provider)) {
+    const baseHost = formatted.anthropicApiHost || formatted.apiHost
+    // AI SDK needs /v1 in baseURL
+    formatted.apiHost = formatApiHost(baseHost)
+    if (!formatted.anthropicApiHost) {
+      formatted.anthropicApiHost = formatted.apiHost
+    }
+  } else if (formatted.id === SystemProviderIds.copilot || formatted.id === SystemProviderIds.github) {
+    formatted.apiHost = formatApiHost(formatted.apiHost, false)
+  } else if (isGeminiProvider(formatted)) {
+    formatted.apiHost = formatApiHost(formatted.apiHost, true, 'v1beta')
+  } else if (isAzureOpenAIProvider(formatted)) {
+    formatted.apiHost = formatAzureOpenAIApiHost(formatted.apiHost)
+  } else if (isVertexProvider(formatted)) {
+    formatted.apiHost = formatVertexApiHost(formatted, context.vertex.project, context.vertex.location)
+  } else if (isCherryAIProvider(formatted)) {
+    formatted.apiHost = formatApiHost(formatted.apiHost, false)
+  } else if (isPerplexityProvider(formatted)) {
+    formatted.apiHost = formatApiHost(formatted.apiHost, false)
+  } else {
+    formatted.apiHost = formatApiHost(formatted.apiHost)
+  }
+
+  return formatted
+}
+
+/**
+ * Get the base URL for AI SDK from a formatted provider
+ *
+ * This extracts the baseURL that AI SDK expects, handling
+ * the '#' 
endpoint routing format if present. + * + * @param formattedApiHost - The formatted apiHost (after formatProviderApiHost) + * @returns The baseURL for AI SDK + */ +export function getBaseUrlForAiSdk(formattedApiHost: string): string { + const { baseURL } = routeToEndpoint(formattedApiHost) + return baseURL +} + +/** + * Get rotated API key from comma-separated keys + * + * This is the interface for API key rotation. The actual implementation + * depends on the environment (renderer uses window.keyv, main uses its own storage). + */ +export interface ApiKeyRotator { + /** + * Get the next API key in rotation + * @param providerId - The provider ID for tracking rotation + * @param keys - Comma-separated API keys + * @returns The next API key to use + */ + getRotatedKey(providerId: string, keys: string): string +} + +/** + * Simple API key rotator that always returns the first key + * Use this when rotation is not needed + */ +export const simpleKeyRotator: ApiKeyRotator = { + getRotatedKey(_providerId: string, keys: string): string { + const keyList = keys.split(',').map((k) => k.trim()) + return keyList[0] || keys + } +} diff --git a/packages/shared/provider/index.ts b/packages/shared/provider/index.ts new file mode 100644 index 0000000000..f0b9b11d10 --- /dev/null +++ b/packages/shared/provider/index.ts @@ -0,0 +1,48 @@ +/** + * Shared Provider Utilities + * + * This module exports utilities for working with AI providers + * that can be shared between main process and renderer process. + */ + +// Type definitions +export type { MinimalProvider, ProviderType, SystemProviderId } from './types' +export { SystemProviderIds } from './types' + +// Provider type detection +export { + isAIGatewayProvider, + isAnthropicProvider, + isAwsBedrockProvider, + isAzureOpenAIProvider, + isAzureResponsesEndpoint, + isCherryAIProvider, + isGeminiProvider, + isNewApiProvider, + isOpenAICompatibleProvider, + isOpenAIProvider, + isPerplexityProvider, + isVertexProvider +} from './detection' + +// API host formatting +export type { ApiKeyRotator, ProviderFormatContext } from './format' +export { + defaultFormatAzureOpenAIApiHost, + formatProviderApiHost, + getBaseUrlForAiSdk, + simpleKeyRotator +} from './format' + +// Provider ID mapping +export { getAiSdkProviderId, STATIC_PROVIDER_MAPPING, tryResolveProviderId } from './mapping' + +// AI SDK configuration +export type { AiSdkConfig, AiSdkConfigContext } from './sdk-config' +export { providerToAiSdkConfig } from './sdk-config' + +// Provider resolution +export { resolveActualProvider } from './resolve' + +// Provider initialization +export { initializeSharedProviders, SHARED_PROVIDER_CONFIGS } from './initialization' diff --git a/packages/shared/provider/initialization.ts b/packages/shared/provider/initialization.ts new file mode 100644 index 0000000000..fbb5fba54f --- /dev/null +++ b/packages/shared/provider/initialization.ts @@ -0,0 +1,107 @@ +import { type ProviderConfig, registerMultipleProviderConfigs } from '@cherrystudio/ai-core/provider' + +type ProviderInitializationLogger = { + warn?: (message: string) => void + error?: (message: string, error: Error) => void +} + +export const SHARED_PROVIDER_CONFIGS: ProviderConfig[] = [ + { + id: 'openrouter', + name: 'OpenRouter', + import: () => import('@openrouter/ai-sdk-provider'), + creatorFunctionName: 'createOpenRouter', + supportsImageGeneration: true, + aliases: ['openrouter'] + }, + { + id: 'google-vertex', + name: 'Google Vertex AI', + import: () => import('@ai-sdk/google-vertex/edge'), + 
creatorFunctionName: 'createVertex', + supportsImageGeneration: true, + aliases: ['vertexai'] + }, + { + id: 'google-vertex-anthropic', + name: 'Google Vertex AI Anthropic', + import: () => import('@ai-sdk/google-vertex/anthropic/edge'), + creatorFunctionName: 'createVertexAnthropic', + supportsImageGeneration: true, + aliases: ['vertexai-anthropic'] + }, + { + id: 'azure-anthropic', + name: 'Azure AI Anthropic', + import: () => import('@ai-sdk/anthropic'), + creatorFunctionName: 'createAnthropic', + supportsImageGeneration: false, + aliases: ['azure-anthropic'] + }, + { + id: 'github-copilot-openai-compatible', + name: 'GitHub Copilot OpenAI Compatible', + import: () => import('@opeoginni/github-copilot-openai-compatible'), + creatorFunctionName: 'createGitHubCopilotOpenAICompatible', + supportsImageGeneration: false, + aliases: ['copilot', 'github-copilot'] + }, + { + id: 'bedrock', + name: 'Amazon Bedrock', + import: () => import('@ai-sdk/amazon-bedrock'), + creatorFunctionName: 'createAmazonBedrock', + supportsImageGeneration: true, + aliases: ['aws-bedrock'] + }, + { + id: 'perplexity', + name: 'Perplexity', + import: () => import('@ai-sdk/perplexity'), + creatorFunctionName: 'createPerplexity', + supportsImageGeneration: false, + aliases: ['perplexity'] + }, + { + id: 'mistral', + name: 'Mistral', + import: () => import('@ai-sdk/mistral'), + creatorFunctionName: 'createMistral', + supportsImageGeneration: false, + aliases: ['mistral'] + }, + { + id: 'huggingface', + name: 'HuggingFace', + import: () => import('@ai-sdk/huggingface'), + creatorFunctionName: 'createHuggingFace', + supportsImageGeneration: true, + aliases: ['hf', 'hugging-face'] + }, + { + id: 'ai-gateway', + name: 'AI Gateway', + import: () => import('@ai-sdk/gateway'), + creatorFunctionName: 'createGateway', + supportsImageGeneration: true, + aliases: ['gateway'] + }, + { + id: 'cerebras', + name: 'Cerebras', + import: () => import('@ai-sdk/cerebras'), + creatorFunctionName: 'createCerebras', + supportsImageGeneration: false + } +] as const + +export function initializeSharedProviders(logger?: ProviderInitializationLogger): void { + try { + const successCount = registerMultipleProviderConfigs(SHARED_PROVIDER_CONFIGS) + if (successCount < SHARED_PROVIDER_CONFIGS.length) { + logger?.warn?.('Some providers failed to register. Check previous error logs.') + } + } catch (error) { + logger?.error?.('Failed to initialize shared providers', error as Error) + } +} diff --git a/packages/shared/provider/mapping.ts b/packages/shared/provider/mapping.ts new file mode 100644 index 0000000000..20e2e10c3f --- /dev/null +++ b/packages/shared/provider/mapping.ts @@ -0,0 +1,95 @@ +/** + * Provider ID Mapping + * + * Maps Cherry Studio provider IDs/types to AI SDK provider IDs. 
+ * This logic should match @renderer/aiCore/provider/factory.ts
+ */
+
+import { hasProviderConfigByAlias, type ProviderId, resolveProviderConfigId } from '@cherrystudio/ai-core/provider'
+
+import { isAzureOpenAIProvider, isAzureResponsesEndpoint } from './detection'
+import type { MinimalProvider } from './types'
+
+/**
+ * Static mapping from Cherry Studio provider ID/type to AI SDK provider ID
+ * Matches STATIC_PROVIDER_MAPPING in @renderer/aiCore/provider/factory.ts
+ */
+export const STATIC_PROVIDER_MAPPING: Record<string, ProviderId> = {
+  gemini: 'google', // Google Gemini -> google
+  'azure-openai': 'azure', // Azure OpenAI -> azure
+  'openai-response': 'openai', // OpenAI Responses -> openai
+  grok: 'xai', // Grok -> xai
+  copilot: 'github-copilot-openai-compatible'
+}
+
+/**
+ * Try to resolve a provider identifier to an AI SDK provider ID
+ * Matches tryResolveProviderId in @renderer/aiCore/provider/factory.ts
+ *
+ * @param identifier - The provider ID or type to resolve
+ * @returns The resolved AI SDK provider ID, or null if not found
+ */
+export function tryResolveProviderId(identifier: string): ProviderId | null {
+  // 1. Check the static mapping
+  const staticMapping = STATIC_PROVIDER_MAPPING[identifier]
+  if (staticMapping) {
+    return staticMapping
+  }
+
+  // 2. Check whether AiCore supports it (including alias support)
+  if (hasProviderConfigByAlias(identifier)) {
+    // Resolve to the real provider ID
+    return resolveProviderConfigId(identifier) as ProviderId
+  }
+
+  return null
+}
+
+/**
+ * Get the AI SDK Provider ID for a Cherry Studio provider
+ * Matches getAiSdkProviderId in @renderer/aiCore/provider/factory.ts
+ *
+ * Logic:
+ * 1. Handle Azure OpenAI specially (check responses endpoint)
+ * 2. Try to resolve from provider.id
+ * 3. Try to resolve from provider.type (but not for generic 'openai' type)
+ * 4. Check for OpenAI API host pattern
+ * 5. Fallback to provider's own ID
+ *
+ * @param provider - The Cherry Studio provider
+ * @returns The AI SDK provider ID to use
+ */
+export function getAiSdkProviderId(provider: MinimalProvider): ProviderId {
+  // 1. Handle Azure OpenAI specially - check this FIRST before other resolution
+  if (isAzureOpenAIProvider(provider)) {
+    if (isAzureResponsesEndpoint(provider)) {
+      return 'azure-responses'
+    }
+    return 'azure'
+  }
+
+  // 2. Try to resolve from provider.id
+  const resolvedFromId = tryResolveProviderId(provider.id)
+  if (resolvedFromId) {
+    return resolvedFromId
+  }
+
+  // 3. Try to resolve from provider.type
+  // This would resolve every custom provider of type 'openai' to the AI SDK openaiProvider
+  if (provider.type !== 'openai') {
+    const resolvedFromType = tryResolveProviderId(provider.type)
+    if (resolvedFromType) {
+      return resolvedFromType
+    }
+  }
+
+  // 4. Check for OpenAI API host pattern
+  if (provider.apiHost.includes('api.openai.com')) {
+    return 'openai-chat'
+  }
+
+  // 5. Final fallback (use the provider's own id)
+  return provider.id
+}
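+
+// Illustrative examples:
+//   getAiSdkProviderId({ id: 'gemini', type: 'gemini', ... })  // 'google' (static mapping)
+//   getAiSdkProviderId({ id: 'my-proxy', type: 'openai', apiHost: 'https://api.openai.com/v1', ... })
+//   // -> 'openai-chat' (falls through to the API-host check)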
diff --git a/packages/shared/provider/resolve.ts b/packages/shared/provider/resolve.ts
new file mode 100644
index 0000000000..9055a36c6e
--- /dev/null
+++ b/packages/shared/provider/resolve.ts
@@ -0,0 +1,44 @@
+import { aihubmixProviderCreator, newApiResolverCreator, vertexAnthropicProviderCreator } from './config'
+import { azureAnthropicProviderCreator } from './config/azure-anthropic'
+import { isAzureOpenAIProvider, isNewApiProvider } from './detection'
+import type { MinimalModel, MinimalProvider } from './types'
+
+export interface ResolveActualProviderOptions<P extends MinimalProvider>
{ + isSystemProvider?: (provider: P) => boolean +} + +const defaultIsSystemProvider =
<P extends MinimalProvider>
(provider: P): boolean => {
+  if ('isSystem' in provider) {
+    return Boolean((provider as unknown as { isSystem?: boolean }).isSystem)
+  }
+  return false
+}
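+
+// e.g. (illustrative): for a system 'aihubmix' provider and a 'claude-*' model,
+// resolveActualProvider (below) returns an anthropic-typed copy of the provider;
+// 'new-api' providers are resolved by the model's endpoint_type first.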
+
+export function resolveActualProvider<P extends MinimalProvider, M extends MinimalModel>(
+  provider: P,
+  model: M,
+  options: ResolveActualProviderOptions<P> = {}
+): P {
+  let resolvedProvider = provider
+
+  if (isNewApiProvider(resolvedProvider)) {
+    resolvedProvider = newApiResolverCreator(model, resolvedProvider)
+  }
+
+  const isSystemProvider =
+    options.isSystemProvider?.(resolvedProvider) ?? defaultIsSystemProvider(resolvedProvider)
+
+  if (isSystemProvider && resolvedProvider.id === 'aihubmix') {
+    resolvedProvider = aihubmixProviderCreator(model, resolvedProvider)
+  }
+
+  if (isSystemProvider && resolvedProvider.id === 'vertexai') {
+    resolvedProvider = vertexAnthropicProviderCreator(model, resolvedProvider)
+  }
+
+  if (isAzureOpenAIProvider(resolvedProvider)) {
+    resolvedProvider = azureAnthropicProviderCreator(model, resolvedProvider)
+  }
+
+  return resolvedProvider
+}
diff --git a/packages/shared/provider/sdk-config.ts b/packages/shared/provider/sdk-config.ts
new file mode 100644
index 0000000000..a03b3b1417
--- /dev/null
+++ b/packages/shared/provider/sdk-config.ts
@@ -0,0 +1,240 @@
+/**
+ * AI SDK Configuration
+ *
+ * Shared utilities for converting Cherry Studio Provider to AI SDK configuration.
+ * Environment-specific logic (renderer/main) is injected via context interfaces.
+ */
+
+import { formatPrivateKey, hasProviderConfig, ProviderConfigFactory } from '@cherrystudio/ai-core/provider'
+
+import { routeToEndpoint } from '../api'
+import { getAiSdkProviderId } from './mapping'
+import type { MinimalProvider } from './types'
+import { SystemProviderIds } from './types'
+
+/**
+ * AI SDK configuration result
+ */
+export interface AiSdkConfig {
+  providerId: string
+  options: Record<string, unknown>
+}
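+
+// e.g. (illustrative): for a plain Anthropic provider this ends up roughly as
+// { providerId: 'anthropic', options: { baseURL: 'https://api.anthropic.com/v1', apiKey: '...' } }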
+
+/**
+ * Context for environment-specific implementations
+ */
+export interface AiSdkConfigContext {
+  /**
+   * Get the rotated API key (for multi-key support)
+   * Default: returns first key
+   */
+  getRotatedApiKey?: (provider: MinimalProvider) => string
+
+  /**
+   * Check if a model uses chat completion only (for OpenAI response mode)
+   * Default: returns false
+   */
+  isOpenAIChatCompletionOnlyModel?: (modelId: string) => boolean
+
+  /**
+   * Get Copilot default headers (constants)
+   * Default: returns empty object
+   */
+  getCopilotDefaultHeaders?: () => Record<string, string>
+
+  /**
+   * Get Copilot stored headers from state
+   * Default: returns empty object
+   */
+  getCopilotStoredHeaders?: () => Record<string, string>
+
+  /**
+   * Get AWS Bedrock configuration
+   * Default: returns undefined (not configured)
+   */
+  getAwsBedrockConfig?: () =>
+    | {
+        authType: 'apiKey' | 'iam'
+        region: string
+        apiKey?: string
+        accessKeyId?: string
+        secretAccessKey?: string
+      }
+    | undefined
+
+  /**
+   * Get Vertex AI configuration
+   * Default: returns undefined (not configured)
+   */
+  getVertexConfig?: (provider: MinimalProvider) =>
+    | {
+        project: string
+        location: string
+        googleCredentials: {
+          privateKey: string
+          clientEmail: string
+        }
+      }
+    | undefined
+
+  /**
+   * Get endpoint type for cherryin provider
+   */
+  getEndpointType?: (modelId: string) => string | undefined
+
+  /**
+   * Custom fetch implementation
+   * Main process: use Electron net.fetch
+   * Renderer process: use browser fetch (default)
+   */
+  fetch?: typeof globalThis.fetch
+}
+
+/**
+ * Default simple key rotator - returns first key
+ */
+function defaultGetRotatedApiKey(provider: MinimalProvider): string {
+  const keys = provider.apiKey.split(',').map((k) => k.trim())
+  return keys[0] || provider.apiKey
+}
+
+/**
+ * Convert Cherry Studio Provider to AI SDK configuration
+ *
+ * @param provider - The formatted provider (after formatProviderApiHost)
+ * @param modelId - The model ID to use
+ * @param context - Environment-specific implementations
+ * @returns AI SDK configuration
+ */
+export function providerToAiSdkConfig(
+  provider: MinimalProvider,
+  modelId: string,
+  context: AiSdkConfigContext = {}
+): AiSdkConfig {
+  const getRotatedApiKey = context.getRotatedApiKey || defaultGetRotatedApiKey
+  const isOpenAIChatCompletionOnlyModel = context.isOpenAIChatCompletionOnlyModel || (() => false)
+
+  const aiSdkProviderId = getAiSdkProviderId(provider)
+
+  // Build base config
+  const { baseURL, endpoint } = routeToEndpoint(provider.apiHost)
+  const baseConfig = {
+    baseURL,
+    apiKey: getRotatedApiKey(provider)
+  }
+
+  // Handle Copilot specially
+  if (provider.id === SystemProviderIds.copilot) {
+    const defaultHeaders = context.getCopilotDefaultHeaders?.() ?? {}
+    const storedHeaders = context.getCopilotStoredHeaders?.() ?? {}
+    const options = ProviderConfigFactory.fromProvider('github-copilot-openai-compatible', baseConfig, {
+      headers: {
+        ...defaultHeaders,
+        ...storedHeaders,
+        ...provider.extra_headers
+      },
+      name: provider.id,
+      includeUsage: true
+    })
+
+    return {
+      providerId: 'github-copilot-openai-compatible',
+      options
+    }
+  }
+
+  // Build extra options
+  const extraOptions: Record<string, unknown> = {}
+  if (endpoint) {
+    extraOptions.endpoint = endpoint
+  }
+
+  // Handle OpenAI mode
+  if (provider.type === 'openai-response' && !isOpenAIChatCompletionOnlyModel(modelId)) {
+    extraOptions.mode = 'responses'
+  } else if (aiSdkProviderId === 'openai' || (aiSdkProviderId === 'cherryin' && provider.type === 'openai')) {
+    extraOptions.mode = 'chat'
+  }
+
+  // Add extra headers
+  if (provider.extra_headers) {
+    extraOptions.headers = provider.extra_headers
+    if (aiSdkProviderId === 'openai') {
+      extraOptions.headers = {
+        ...(extraOptions.headers as Record<string, string>),
+        'HTTP-Referer': 'https://cherry-ai.com',
+        'X-Title': 'Cherry Studio',
+        'X-Api-Key': baseConfig.apiKey
+      }
+    }
+  }
+
+  // Handle Azure modes
+  if (aiSdkProviderId === 'azure-responses') {
+    extraOptions.mode = 'responses'
+  } else if (aiSdkProviderId === 'azure') {
+    extraOptions.mode = 'chat'
+  }
+
+  // Handle AWS Bedrock
+  if (aiSdkProviderId === 'bedrock') {
+    const bedrockConfig = context.getAwsBedrockConfig?.()
+    if (bedrockConfig) {
+      extraOptions.region = bedrockConfig.region
+      if (bedrockConfig.authType === 'apiKey') {
+        extraOptions.apiKey = bedrockConfig.apiKey
+      } else {
+        extraOptions.accessKeyId = bedrockConfig.accessKeyId
+        extraOptions.secretAccessKey = bedrockConfig.secretAccessKey
+      }
+    }
+  }
+
+  // Handle Vertex AI
+  if (aiSdkProviderId === 'google-vertex' || aiSdkProviderId === 'google-vertex-anthropic') {
+    const vertexConfig = context.getVertexConfig?.(provider)
+    if (vertexConfig) {
+      extraOptions.project = vertexConfig.project
+      extraOptions.location = vertexConfig.location
+      extraOptions.googleCredentials = {
+        ...vertexConfig.googleCredentials,
+        privateKey: formatPrivateKey(vertexConfig.googleCredentials.privateKey)
+      }
+      baseConfig.baseURL += aiSdkProviderId === 'google-vertex' ? '/publishers/google' : '/publishers/anthropic/models'
+    }
+  }
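+
+  // e.g. (illustrative): for google-vertex the final baseURL looks like
+  // 'https://{location}-aiplatform.googleapis.com/v1/projects/{project}/locations/{location}/publishers/google'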
+
+  // Handle cherryin endpoint type
+  if (aiSdkProviderId === 'cherryin') {
+    const endpointType = context.getEndpointType?.(modelId)
+    if (endpointType) {
+      extraOptions.endpointType = endpointType
+    }
+  }
+
+  // Inject custom fetch if provided
+  if (context.fetch) {
+    extraOptions.fetch = context.fetch
+  }
+
+  // Check if AI SDK supports this provider natively
+  if (hasProviderConfig(aiSdkProviderId) && aiSdkProviderId !== 'openai-compatible') {
+    const options = ProviderConfigFactory.fromProvider(aiSdkProviderId, baseConfig, extraOptions)
+    return {
+      providerId: aiSdkProviderId,
+      options
+    }
+  }
+
+  // Fallback to openai-compatible
+  const options = ProviderConfigFactory.createOpenAICompatible(baseConfig.baseURL, baseConfig.apiKey)
+  return {
+    providerId: 'openai-compatible',
+    options: {
+      ...options,
+      name: provider.id,
+      ...extraOptions,
+      includeUsage: true
+    }
+  }
+}
diff --git a/packages/shared/provider/types.ts b/packages/shared/provider/types.ts
new file mode 100644
index 0000000000..b9745f9d3a
--- /dev/null
+++ b/packages/shared/provider/types.ts
@@ -0,0 +1,174 @@
+import * as z from 'zod'
+
+export const ProviderTypeSchema = z.enum([
+  'openai',
+  'openai-response',
+  'anthropic',
+  'gemini',
+  'azure-openai',
+  'vertexai',
+  'mistral',
+  'aws-bedrock',
+  'vertex-anthropic',
+  'new-api',
+  'ai-gateway'
+])
+
+export type ProviderType = z.infer<typeof ProviderTypeSchema>
+
+/**
+ * Minimal provider interface for shared utilities
+ * This is the subset of Provider that shared code needs
+ */
+export type MinimalProvider = {
+  id: string
+  type: ProviderType
+  apiKey: string
+  apiHost: string
+  anthropicApiHost?: string
+  apiVersion?: string
+  extra_headers?: Record<string, string>
+}
+
+/**
+ * Minimal model interface for shared utilities
+ * This is the subset of Model that shared code needs
+ */
+export type MinimalModel = {
+  id: string
+  endpoint_type?: string
+}
+
+export const SystemProviderIdSchema = z.enum([
+  'cherryin',
+  'silicon',
+  'aihubmix',
+  'ocoolai',
+  'deepseek',
+  'ppio',
+  'alayanew',
+  'qiniu',
+  'dmxapi',
+  'burncloud',
+  'tokenflux',
+  '302ai',
+  'cephalon',
+  'lanyun',
+  'ph8',
+  'openrouter',
+  'ollama',
+  'ovms',
+  'new-api',
+  'lmstudio',
+  'anthropic',
+  'openai',
+  'azure-openai',
+  'gemini',
+  'vertexai',
+  'github',
+  'copilot',
+  'zhipu',
+  'yi',
+  'moonshot',
+  'baichuan',
+  'dashscope',
+  'stepfun',
+  'doubao',
+  'infini',
+  'minimax',
+  'groq',
+  'together',
+  'fireworks',
+  'nvidia',
+  'grok',
+  'hyperbolic',
+  'mistral',
+  'jina',
+  'perplexity',
+  'modelscope',
+  'xirang',
+  'hunyuan',
+  'tencent-cloud-ti',
+  'baidu-cloud',
+  'gpustack',
+  'voyageai',
+  'aws-bedrock',
+  'poe',
+  'aionly',
+  'longcat',
+  'huggingface',
+  'sophnet',
+  'ai-gateway',
+  'cerebras'
+])
+
+export type SystemProviderId = z.infer<typeof SystemProviderIdSchema>
+
+export const isSystemProviderId = (id: string): id is SystemProviderId => {
+  return SystemProviderIdSchema.safeParse(id).success
+}
+
+export const SystemProviderIds = {
+  cherryin: 'cherryin',
+  silicon: 'silicon',
+  aihubmix: 'aihubmix',
+  ocoolai: 'ocoolai',
+  deepseek: 'deepseek',
+  ppio: 'ppio',
+  alayanew: 'alayanew',
+  qiniu: 'qiniu',
+  dmxapi: 'dmxapi',
+  burncloud: 'burncloud',
+  tokenflux: 'tokenflux',
+  '302ai': '302ai',
+  cephalon: 'cephalon',
+  lanyun: 'lanyun',
+  ph8: 'ph8',
+  sophnet: 'sophnet',
+  openrouter: 'openrouter',
+  ollama: 'ollama',
+  ovms: 'ovms',
+  'new-api': 'new-api',
+  lmstudio: 'lmstudio',
+  anthropic: 'anthropic',
+  openai: 'openai',
+  'azure-openai': 'azure-openai',
+  gemini: 'gemini',
+  vertexai: 'vertexai',
+  github: 'github',
+  copilot: 'copilot',
+  zhipu: 'zhipu',
+  yi: 'yi',
+  moonshot: 'moonshot',
+  baichuan: 'baichuan',
+  dashscope: 'dashscope',
+  stepfun: 'stepfun',
+  doubao: 'doubao',
+  infini: 'infini',
+  minimax: 'minimax',
+  groq: 'groq',
+  together: 'together',
+  fireworks: 'fireworks',
+  nvidia: 'nvidia',
+  grok: 'grok',
+  hyperbolic: 'hyperbolic',
+  mistral: 'mistral',
+  jina: 'jina',
+  perplexity: 'perplexity',
+  modelscope: 'modelscope',
+  xirang: 'xirang',
+  hunyuan: 'hunyuan',
+  'tencent-cloud-ti': 'tencent-cloud-ti',
+  'baidu-cloud': 'baidu-cloud',
+  gpustack: 'gpustack',
+  voyageai: 'voyageai',
+  'aws-bedrock': 'aws-bedrock',
+  poe: 'poe',
+  aionly: 'aionly',
+  longcat: 'longcat',
+  huggingface: 'huggingface',
+  'ai-gateway': 'ai-gateway',
+  cerebras: 'cerebras'
+} as const satisfies Record<SystemProviderId, SystemProviderId>
+
+export type SystemProviderIdTypeMap = typeof SystemProviderIds
diff --git a/packages/shared/utils/index.ts b/packages/shared/utils/index.ts
new file mode 100644
index 0000000000..838c28e6c0
--- /dev/null
+++ b/packages/shared/utils/index.ts
@@ -0,0 +1 @@
+export { getBaseModelName, getLowerBaseModelName } from './naming'
diff --git a/packages/shared/utils/naming.ts b/packages/shared/utils/naming.ts
new file mode 100644
index 0000000000..a8b4f5501d
--- /dev/null
+++ b/packages/shared/utils/naming.ts
@@ -0,0 +1,31 @@
+/**
+ * Extracts the base name from a model ID.
+ * For example:
+ * - 'deepseek/deepseek-r1' => 'deepseek-r1'
+ * - 'deepseek-ai/deepseek/deepseek-r1' => 'deepseek-r1'
+ * @param {string} id the model ID
+ * @param {string} [delimiter='/'] the delimiter, defaults to '/'
+ * @returns {string} the base name
+ */
+export const getBaseModelName = (id: string, delimiter: string = '/'): string => {
+  const parts = id.split(delimiter)
+  return parts[parts.length - 1]
+}
+
+/**
+ * Extracts the base name from a model ID and converts it to lowercase.
+ * For example:
+ * - 'deepseek/DeepSeek-R1' => 'deepseek-r1'
+ * - 'deepseek-ai/deepseek/DeepSeek-R1' => 'deepseek-r1'
+ * @param {string} id the model ID
+ * @param {string} [delimiter='/'] the delimiter, defaults to '/'
+ * @returns {string} the lowercased base name
+ */
+export const getLowerBaseModelName = (id: string, delimiter: string = '/'): string => {
+  const baseModelName = getBaseModelName(id, delimiter).toLowerCase()
+  // for openrouter
+  if (baseModelName.endsWith(':free')) {
+    return baseModelName.replace(':free', '')
+  }
+  return baseModelName
+}
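+
+// Illustrative examples:
+//   getBaseModelName('deepseek/deepseek-r1')           // 'deepseek-r1'
+//   getLowerBaseModelName('deepseek/DeepSeek-R1:free') // 'deepseek-r1'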
+  vertexai: 'vertexai',
+  github: 'github',
+  copilot: 'copilot',
+  zhipu: 'zhipu',
+  yi: 'yi',
+  moonshot: 'moonshot',
+  baichuan: 'baichuan',
+  dashscope: 'dashscope',
+  stepfun: 'stepfun',
+  doubao: 'doubao',
+  infini: 'infini',
+  minimax: 'minimax',
+  groq: 'groq',
+  together: 'together',
+  fireworks: 'fireworks',
+  nvidia: 'nvidia',
+  grok: 'grok',
+  hyperbolic: 'hyperbolic',
+  mistral: 'mistral',
+  jina: 'jina',
+  perplexity: 'perplexity',
+  modelscope: 'modelscope',
+  xirang: 'xirang',
+  hunyuan: 'hunyuan',
+  'tencent-cloud-ti': 'tencent-cloud-ti',
+  'baidu-cloud': 'baidu-cloud',
+  gpustack: 'gpustack',
+  voyageai: 'voyageai',
+  'aws-bedrock': 'aws-bedrock',
+  poe: 'poe',
+  aionly: 'aionly',
+  longcat: 'longcat',
+  huggingface: 'huggingface',
+  'ai-gateway': 'ai-gateway',
+  cerebras: 'cerebras'
+} as const satisfies Record<SystemProviderId, SystemProviderId>
+
+export type SystemProviderIdTypeMap = typeof SystemProviderIds
diff --git a/packages/shared/utils/index.ts b/packages/shared/utils/index.ts
new file mode 100644
index 0000000000..838c28e6c0
--- /dev/null
+++ b/packages/shared/utils/index.ts
@@ -0,0 +1 @@
+export { getBaseModelName, getLowerBaseModelName } from './naming'
diff --git a/packages/shared/utils/naming.ts b/packages/shared/utils/naming.ts
new file mode 100644
index 0000000000..a8b4f5501d
--- /dev/null
+++ b/packages/shared/utils/naming.ts
@@ -0,0 +1,31 @@
+/**
+ * Extract the base name from a model ID.
+ * For example:
+ * - 'deepseek/deepseek-r1' => 'deepseek-r1'
+ * - 'deepseek-ai/deepseek/deepseek-r1' => 'deepseek-r1'
+ * @param {string} id Model ID
+ * @param {string} [delimiter='/'] Delimiter, defaults to '/'
+ * @returns {string} Base name
+ */
+export const getBaseModelName = (id: string, delimiter: string = '/'): string => {
+  const parts = id.split(delimiter)
+  return parts[parts.length - 1]
+}
+
+/**
+ * Extract the base name from a model ID and convert it to lowercase.
+ * For example:
+ * - 'deepseek/DeepSeek-R1' => 'deepseek-r1'
+ * - 'deepseek-ai/deepseek/DeepSeek-R1' => 'deepseek-r1'
+ * @param {string} id Model ID
+ * @param {string} [delimiter='/'] Delimiter, defaults to '/'
+ * @returns {string} Lowercase base name
+ */
+export const getLowerBaseModelName = (id: string, delimiter: string = '/'): string => {
+  const baseModelName = getBaseModelName(id, delimiter).toLowerCase()
+  // for openrouter
+  if (baseModelName.endsWith(':free')) {
+    return baseModelName.replace(':free', '')
+  }
+  return baseModelName
+}
diff --git a/src/main/apiServer/routes/messages.ts b/src/main/apiServer/routes/messages.ts
index 02ce0544e8..1ce42c46ea 100644
--- a/src/main/apiServer/routes/messages.ts
+++ b/src/main/apiServer/routes/messages.ts
@@ -5,6 +5,7 @@ import type { Request, Response } from 'express'
 import express from 'express'
 
 import { messagesService } from '../services/messages'
+import { generateUnifiedMessage, streamUnifiedMessages } from '../services/unified-messages'
 import { getProviderById, validateModelId } from '../utils'
 
 const logger = loggerService.withContext('ApiServerMessagesRoutes')
@@ -33,21 +34,35 @@ async function validateRequestBody(req: Request): Promise<{ valid: boolean; erro
 }
 
 interface HandleMessageProcessingOptions {
-  req: Request
   res: Response
   provider: Provider
   request: MessageCreateParams
   modelId?: string
 }
 
+/**
+ * Handle message processing using unified AI SDK
+ * All providers (including Anthropic) are handled through AI SDK:
+ * - Anthropic providers use @ai-sdk/anthropic which outputs native Anthropic SSE
+ * - Other providers use their respective AI SDK adapters, with output converted to Anthropic SSE
+ */
 async function handleMessageProcessing({
-  req,
   res,
   provider,
   request,
   modelId
 }: HandleMessageProcessingOptions): Promise<void> {
+  const actualModelId = modelId || request.model
+
+  logger.info('Processing message via unified AI SDK', {
+    providerId: provider.id,
+    providerType: provider.type,
+    modelId: actualModelId,
+    stream: !!request.stream
+  })
+
   try {
+    // Validate request
     const validation = messagesService.validateRequest(request)
     if (!validation.isValid) {
       res.status(400).json({
@@ -60,21 +75,23 @@ async function handleMessageProcessing({
       return
     }
 
-    const extraHeaders = messagesService.prepareHeaders(req.headers)
-    const { client, anthropicRequest } = await messagesService.processMessage({
-      provider,
-      request,
-      extraHeaders,
-      modelId
-    })
-
     if (request.stream) {
-      await messagesService.handleStreaming(client, anthropicRequest, { response: res }, provider)
-      return
+      await streamUnifiedMessages({
+        response: res,
+        provider,
+        modelId: actualModelId,
+        params: request,
+        onError: (error) => {
+          logger.error('Stream error', error as Error)
+        },
+        onComplete: () => {
+          logger.debug('Stream completed')
+        }
+      })
+    } else {
+      const response = await generateUnifiedMessage(provider, actualModelId, request)
+      res.json(response)
     }
-
-    const response = await client.messages.create(anthropicRequest)
-    res.json(response)
   } catch (error: any) {
     logger.error('Message processing error', { error })
     const { statusCode, errorResponse } = messagesService.transformError(error)
@@ -235,7 +252,7 @@ router.post('/', async (req: Request, res: Response) => {
     const provider = modelValidation.provider!
     const modelId = modelValidation.modelId!
 
-    return handleMessageProcessing({ req, res, provider, request, modelId })
+    return handleMessageProcessing({ res, provider, request, modelId })
   } catch (error: any) {
     logger.error('Message processing error', { error })
     const { statusCode, errorResponse } = messagesService.transformError(error)
@@ -393,7 +410,7 @@ providerRouter.post('/', async (req: Request, res: Response) => {
 
     const request: MessageCreateParams = req.body
 
-    return handleMessageProcessing({ req, res, provider, request })
+    return handleMessageProcessing({ res, provider, request })
   } catch (error: any) {
     logger.error('Message processing error', { error })
     const { statusCode, errorResponse } = messagesService.transformError(error)
@@ -401,4 +418,194 @@ providerRouter.post('/', async (req: Request, res: Response) => {
   }
 })
 
+/**
+ * @swagger
+ * /v1/messages/count_tokens:
+ *   post:
+ *     summary: Count tokens for messages
+ *     description: Count tokens for Anthropic Messages API format (required by Claude Code SDK)
+ *     tags: [Messages]
+ *     requestBody:
+ *       required: true
+ *       content:
+ *         application/json:
+ *           schema:
+ *             type: object
+ *             required:
+ *               - model
+ *               - messages
+ *             properties:
+ *               model:
+ *                 type: string
+ *                 description: Model ID
+ *               messages:
+ *                 type: array
+ *                 items:
+ *                   type: object
+ *               system:
+ *                 type: string
+ *                 description: System message
+ *     responses:
+ *       200:
+ *         description: Token count response
+ *         content:
+ *           application/json:
+ *             schema:
+ *               type: object
+ *               properties:
+ *                 input_tokens:
+ *                   type: integer
+ *       400:
+ *         description: Bad request
+ */
+router.post('/count_tokens', async (req: Request, res: Response) => {
+  try {
+    const { model, messages, system } = req.body
+
+    if (!model) {
+      return res.status(400).json({
+        type: 'error',
+        error: {
+          type: 'invalid_request_error',
+          message: 'model parameter is required'
+        }
+      })
+    }
+
+    if (!messages || !Array.isArray(messages)) {
+      return res.status(400).json({
+        type: 'error',
+        error: {
+          type: 'invalid_request_error',
+          message: 'messages parameter is required'
+        }
+      })
+    }
+
+    // Simple token estimation based on character count
+    // This is a rough approximation: ~4 characters per token for English text
+    let totalChars = 0
+
+    // Count system message tokens
+    if (system) {
+      if (typeof system === 'string') {
+        totalChars += system.length
+      } else if (Array.isArray(system)) {
+        for (const block of system) {
+          if (block.type === 'text' && block.text) {
+            totalChars += block.text.length
+          }
+        }
+      }
+    }
+
+    // Count message tokens
+    for (const msg of messages) {
+      if (typeof msg.content === 'string') {
+        totalChars += msg.content.length
+      } else if (Array.isArray(msg.content)) {
+        for (const block of msg.content) {
+          if (block.type === 'text' && block.text) {
+            totalChars += block.text.length
+          }
+        }
+      }
+      // Add overhead for role
+      totalChars += 10
+    }
+
+    // Estimate tokens (~4 chars per token, with some overhead)
+    const estimatedTokens = Math.ceil(totalChars / 4) + messages.length * 3
+
+    logger.debug('Token count estimated', {
+      model,
+      messageCount: messages.length,
+      totalChars,
+      estimatedTokens
+    })
+
+    return res.json({
+      input_tokens: estimatedTokens
+    })
+  } catch (error: any) {
+    logger.error('Token counting error', { error })
+    return res.status(500).json({
+      type: 'error',
+      error: {
+        type: 'api_error',
+        message: error.message || 'Internal server error'
+      }
+    })
+  }
+})
+
+/**
+ * Provider-specific count_tokens endpoint
+ */
+providerRouter.post('/count_tokens', async (req: Request, res: Response) => {
+  try {
+    const { model, messages, system } = req.body
+
+    if (!messages || !Array.isArray(messages)) {
+      return res.status(400).json({
+        type: 'error',
+        error: {
+          type: 'invalid_request_error',
+          message: 'messages parameter is required'
+        }
+      })
+    }
+
+    // Simple token estimation
+    let totalChars = 0
+
+    if (system) {
+      if (typeof system === 'string') {
+        totalChars += system.length
+      } else if (Array.isArray(system)) {
+        for (const block of system) {
+          if (block.type === 'text' && block.text) {
+            totalChars += block.text.length
+          }
+        }
+      }
+    }
+
+    for (const msg of messages) {
+      if (typeof msg.content === 'string') {
+        totalChars += msg.content.length
+      } else if (Array.isArray(msg.content)) {
+        for (const block of msg.content) {
+          if (block.type === 'text' && block.text) {
+            totalChars += block.text.length
+          }
+        }
+      }
+      totalChars += 10
+    }
+
+    const estimatedTokens = Math.ceil(totalChars / 4) + messages.length * 3
+
+    logger.debug('Token count estimated (provider route)', {
+      providerId: req.params.provider,
+      model,
+      messageCount: messages.length,
+      estimatedTokens
+    })
+
+    return res.json({
+      input_tokens: estimatedTokens
+    })
+  } catch (error: any) {
+    logger.error('Token counting error', { error })
+    return res.status(500).json({
+      type: 'error',
+      error: {
+        type: 'api_error',
+        message: error.message || 'Internal server error'
+      }
+    })
+  }
+})
+
 export { providerRouter as messagesProviderRoutes, router as messagesRoutes }
diff --git a/src/main/apiServer/services/models.ts b/src/main/apiServer/services/models.ts
index 52f0db857f..b72c21b1e1 100644
--- a/src/main/apiServer/services/models.ts
+++ b/src/main/apiServer/services/models.ts
@@ -1,13 +1,6 @@
-import { isEmpty } from 'lodash'
-
 import type { ApiModel, ApiModelsFilter, ApiModelsResponse } from '../../../renderer/src/types/apiModels'
 import { loggerService } from '../../services/LoggerService'
-import {
-  getAvailableProviders,
-  getProviderAnthropicModelChecker,
-  listAllAvailableModels,
-  transformModelToOpenAI
-} from '../utils'
+import { getAvailableProviders, listAllAvailableModels, transformModelToOpenAI } from '../utils'
 
 const logger = loggerService.withContext('ModelsService')
 
@@ -20,11 +13,12 @@ export class ModelsService {
     try {
       logger.debug('Getting available models from providers', { filter })
 
-      let providers = await getAvailableProviders()
+      const providers = await getAvailableProviders()
 
-      if (filter.providerType === 'anthropic') {
-        providers = providers.filter((p) => p.type === 'anthropic' || !isEmpty(p.anthropicApiHost?.trim()))
-      }
+      // Note: When providerType === 'anthropic', we now return ALL available models
+      // because the API Server's unified adapter (AiSdkToAnthropicSSE) can convert
+      // any provider's response to Anthropic SSE format. This enables Claude Code Agent
+      // to work with OpenAI, Gemini, and other providers transparently.
 
       const models = await listAllAvailableModels(providers)
       // Use Map to deduplicate models by their full ID (provider:model_id)
@@ -32,20 +26,11 @@
       for (const model of models) {
         const provider = providers.find((p) => p.id === model.provider)
-        // logger.debug(`Processing model ${model.id}`)
         if (!provider) {
           logger.debug(`Skipping model ${model.id} . Reason: Provider not found.`)
           continue
         }
 
-        if (filter.providerType === 'anthropic') {
-          const checker = getProviderAnthropicModelChecker(provider.id)
-          if (!checker(model)) {
-            logger.debug(`Skipping model ${model.id} from ${model.provider}. Reason: Not an Anthropic model.`)
-            continue
-          }
-        }
-
         const openAIModel = transformModelToOpenAI(model, provider)
         const fullModelId = openAIModel.id // This is already in format "provider:model_id"
diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts
new file mode 100644
index 0000000000..d0acd70231
--- /dev/null
+++ b/src/main/apiServer/services/unified-messages.ts
@@ -0,0 +1,455 @@
+import type { LanguageModelV2ToolResultOutput } from '@ai-sdk/provider'
+import type { ReasoningPart, ToolCallPart, ToolResultPart } from '@ai-sdk/provider-utils'
+import type { ImageBlockParam, MessageCreateParams, TextBlockParam } from '@anthropic-ai/sdk/resources/messages'
+import { createProvider as createProviderCore } from '@cherrystudio/ai-core/provider'
+import { loggerService } from '@logger'
+import { reduxService } from '@main/services/ReduxService'
+import { AiSdkToAnthropicSSE, formatSSEDone, formatSSEEvent } from '@shared/adapters'
+import {
+  type AiSdkConfig,
+  type AiSdkConfigContext,
+  formatProviderApiHost,
+  initializeSharedProviders,
+  type ProviderFormatContext,
+  providerToAiSdkConfig as sharedProviderToAiSdkConfig,
+  resolveActualProvider
+} from '@shared/provider'
+import { defaultAppHeaders } from '@shared/utils'
+import type { Provider } from '@types'
+import type { ImagePart, LanguageModel, ModelMessage, Provider as AiSdkProvider, TextPart } from 'ai'
+import { stepCountIs, streamText } from 'ai'
+import { net } from 'electron'
+import type { Response } from 'express'
+
+const logger = loggerService.withContext('UnifiedMessagesService')
+
+initializeSharedProviders({
+  warn: (message) => logger.warn(message),
+  error: (message, error) => logger.error(message, error)
+})
+
+export interface UnifiedStreamConfig {
+  response: Response
+  provider: Provider
+  modelId: string
+  params: MessageCreateParams
+  onError?: (error: unknown) => void
+  onComplete?: () => void
+}
+
+// ============================================================================
+// Provider Factory
+// ============================================================================
+
+/**
+ * Main process format context for formatProviderApiHost
+ * Unlike renderer, main process doesn't have direct access to store getters, so use reduxService cache
+ */
+function getMainProcessFormatContext(): ProviderFormatContext {
+  const vertexSettings = reduxService.selectSync<{ projectId: string; location: string }>('state.llm.settings.vertexai')
+  return {
+    vertex: {
+      project: vertexSettings?.projectId || 'default-project',
+      location: vertexSettings?.location || 'us-central1'
+    }
+  }
+}
+
+/**
+ * Main process context for providerToAiSdkConfig
+ * Main process doesn't have access to browser APIs like window.keyv
+ */
+const mainProcessSdkContext: AiSdkConfigContext = {
+  // Simple key rotation - just return first key (no persistent rotation in main process)
+  getRotatedApiKey: (provider) => {
+    const keys = provider.apiKey.split(',').map((k) => k.trim())
+    return keys[0] || provider.apiKey
+  },
+  fetch: net.fetch as typeof globalThis.fetch
+}
+
+/**
+ * Get actual provider configuration for a model
+ *
+ * For aggregated providers (new-api, aihubmix, vertexai, azure-openai),
+ * this resolves the actual provider type based on the model's characteristics.
+ */
+function getActualProvider(provider: Provider, modelId: string): Provider {
+  // Find the model in provider's models list
+  const model = provider.models?.find((m) => m.id === modelId)
+  if (!model) {
+    // If model not found, return provider as-is
+    return provider
+  }
+
+  // Resolve actual provider based on model
+  return resolveActualProvider(provider, model)
+}
+
+/**
+ * Convert Cherry Studio Provider to AI SDK config
+ * Uses shared implementation with main process context
+ */
+function providerToAiSdkConfig(provider: Provider, modelId: string): AiSdkConfig {
+  // First resolve actual provider for aggregated providers
+  const actualProvider = getActualProvider(provider, modelId)
+
+  // Format the provider's apiHost for AI SDK
+  const formattedProvider = formatProviderApiHost(actualProvider, getMainProcessFormatContext())
+
+  // Use shared implementation
+  return sharedProviderToAiSdkConfig(formattedProvider, modelId, mainProcessSdkContext)
+}
+
+/**
+ * Create an AI SDK provider from Cherry Studio provider configuration
+ */
+async function createAiSdkProvider(config: AiSdkConfig): Promise<AiSdkProvider> {
+  try {
+    const provider = await createProviderCore(config.providerId, config.options)
+    logger.debug('AI SDK provider created', {
+      providerId: config.providerId,
+      hasOptions: !!config.options
+    })
+    return provider
+  } catch (error) {
+    logger.error('Failed to create AI SDK provider', error as Error, {
+      providerId: config.providerId
+    })
+    throw error
+  }
+}
+
+/**
+ * Create an AI SDK language model from a Cherry Studio provider configuration
+ * Uses shared provider utilities for consistent behavior with renderer
+ */
+async function createLanguageModel(provider: Provider, modelId: string): Promise<LanguageModel> {
+  logger.debug('Creating language model', {
+    providerId: provider.id,
+    providerType: provider.type,
+    modelId,
+    apiHost: provider.apiHost
+  })
+
+  // Convert provider config to AI SDK config
+  const config = providerToAiSdkConfig(provider, modelId)
+
+  // Create the AI SDK provider
+  const aiSdkProvider = await createAiSdkProvider(config)
+  if (!aiSdkProvider) {
+    throw new Error(`Failed to create AI SDK provider for ${provider.id}`)
+  }
+
+  // Get the language model
+  return aiSdkProvider.languageModel(modelId)
+}
+
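Editor's note: a minimal sketch (not part of the patch) of how the factory above is meant to be used. `createLanguageModel` is the helper defined in this file; the provider literal and model id below are illustrative placeholders only.

```ts
import { streamText } from 'ai'

// Hypothetical Cherry Studio provider record; in the app this comes from Redux state.
const provider = {
  id: 'openai',
  type: 'openai',
  apiKey: 'sk-placeholder',
  apiHost: 'https://api.openai.com',
  models: []
} as unknown as Provider

// createLanguageModel resolves aggregated providers, formats the apiHost,
// builds the AI SDK config, and returns an AI SDK LanguageModel instance.
const model = await createLanguageModel(provider, 'gpt-4o-mini')

// The model plugs straight into streamText; result.fullStream is the event
// stream that AiSdkToAnthropicSSE consumes to emit Anthropic SSE below.
const result = streamText({ model, messages: [{ role: 'user', content: 'ping' }] })
for await (const part of result.fullStream) {
  console.log(part.type)
}
```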
+function convertAnthropicToolResultToAiSdk(
+  content: string | Array<TextBlockParam | ImageBlockParam>
+): LanguageModelV2ToolResultOutput {
+  if (typeof content === 'string') {
+    return {
+      type: 'text',
+      value: content
+    }
+  } else {
+    const values: Array<
+      | { type: 'text'; text: string }
+      | {
+          type: 'media'
+          /** Base-64 encoded media data. */
+          data: string
+          /**
+           * IANA media type.
+           * @see https://www.iana.org/assignments/media-types/media-types.xhtml
+           */
+          mediaType: string
+        }
+    > = []
+    for (const block of content) {
+      if (block.type === 'text') {
+        values.push({
+          type: 'text',
+          text: block.text
+        })
+      } else if (block.type === 'image') {
+        values.push({
+          type: 'media',
+          data: block.source.type === 'base64' ? block.source.data : block.source.url,
+          mediaType: block.source.type === 'base64' ? block.source.media_type : 'image/png'
+        })
+      }
+    }
+    return {
+      type: 'content',
+      // Return the collected blocks; previously an empty array was returned here,
+      // which silently dropped all tool result content
+      value: values
+    }
+  }
+}
+
+/**
+ * Convert Anthropic MessageCreateParams to AI SDK message format
+ */
+function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage[] {
+  const messages: ModelMessage[] = []
+  // Map tool_use ids to tool names across messages, so tool_result blocks
+  // (which arrive in a later user message) can recover the tool name
+  const toolNameById = new Map<string, string>()
+
+  // Add system message if present
+  if (params.system) {
+    if (typeof params.system === 'string') {
+      messages.push({
+        role: 'system',
+        content: params.system
+      })
+    } else if (Array.isArray(params.system)) {
+      // Handle TextBlockParam array
+      const systemText = params.system
+        .filter((block) => block.type === 'text')
+        .map((block) => block.text)
+        .join('\n')
+      if (systemText) {
+        messages.push({
+          role: 'system',
+          content: systemText
+        })
+      }
+    }
+  }
+
+  // Convert user/assistant messages
+  for (const msg of params.messages) {
+    if (typeof msg.content === 'string') {
+      if (msg.role === 'user') {
+        messages.push({ role: 'user', content: msg.content })
+      } else {
+        messages.push({ role: 'assistant', content: msg.content })
+      }
+    } else if (Array.isArray(msg.content)) {
+      // Handle content blocks
+      const textParts: TextPart[] = []
+      const imageParts: ImagePart[] = []
+      const reasoningParts: ReasoningPart[] = []
+      const toolCallParts: ToolCallPart[] = []
+      const toolResultParts: ToolResultPart[] = []
+
+      for (const block of msg.content) {
+        if (block.type === 'text') {
+          textParts.push({ type: 'text', text: block.text })
+        } else if (block.type === 'thinking') {
+          reasoningParts.push({ type: 'reasoning', text: block.thinking })
+        } else if (block.type === 'redacted_thinking') {
+          reasoningParts.push({ type: 'reasoning', text: block.data })
+        } else if (block.type === 'image') {
+          const source = block.source
+          if (source.type === 'base64') {
+            imageParts.push({
+              type: 'image',
+              image: `data:${source.media_type};base64,${source.data}`
+            })
+          } else if (source.type === 'url') {
+            imageParts.push({
+              type: 'image',
+              image: source.url
+            })
+          }
+        } else if (block.type === 'tool_use') {
+          toolNameById.set(block.id, block.name)
+          toolCallParts.push({
+            type: 'tool-call',
+            toolName: block.name,
+            toolCallId: block.id,
+            input: block.input
+          })
+        } else if (block.type === 'tool_result') {
+          toolResultParts.push({
+            type: 'tool-result',
+            toolCallId: block.tool_use_id,
+            toolName: toolNameById.get(block.tool_use_id) || 'unknown',
+            output: block.content ? convertAnthropicToolResultToAiSdk(block.content) : { type: 'text', value: '' }
+          })
+        }
+      }
+
+      // Build the message based on role
+      if (msg.role === 'user') {
+        // Anthropic delivers tool_result blocks inside user messages, but the
+        // AI SDK expects them in a dedicated 'tool' role message
+        if (toolResultParts.length > 0) {
+          messages.push({ role: 'tool', content: toolResultParts })
+        }
+        if (textParts.length > 0 || imageParts.length > 0) {
+          messages.push({
+            role: 'user',
+            content: [...textParts, ...imageParts]
+          })
+        }
+      } else {
+        // Assistant messages may carry reasoning, text and tool-call parts
+        const assistantParts = [...reasoningParts, ...textParts, ...toolCallParts]
+        if (assistantParts.length > 0) {
+          messages.push({
+            role: 'assistant',
+            content: assistantParts
+          })
+        }
+      }
+    }
+  }
+
+  return messages
+}
+
+/**
+ * Stream a message request using AI SDK and convert to Anthropic SSE format
+ */
+export async function streamUnifiedMessages(config: UnifiedStreamConfig): Promise<void> {
+  const { response, provider, modelId, params, onError, onComplete } = config
+
+  logger.info('Starting unified message stream', {
+    providerId: provider.id,
+    providerType: provider.type,
+    modelId,
+    stream: params.stream
+  })
+
+  try {
+    response.setHeader('Content-Type', 'text/event-stream')
+    response.setHeader('Cache-Control', 'no-cache')
+    response.setHeader('Connection', 'keep-alive')
+    response.setHeader('X-Accel-Buffering', 'no')
+
+    const model = await createLanguageModel(provider, modelId)
+
+    const coreMessages = convertAnthropicToAiMessages(params)
+
+    logger.debug('Converted messages', {
+      originalCount: params.messages.length,
+      convertedCount: coreMessages.length,
+      hasSystem: !!params.system
+    })
+
+    // Create the adapter
+    const adapter = new AiSdkToAnthropicSSE({
+      model: `${provider.id}:${modelId}`,
+      onEvent: (event) => {
+        const sseData = formatSSEEvent(event)
+        response.write(sseData)
+      }
+    })
+
+    // Start streaming
+    const result = streamText({
+      model,
+      messages: coreMessages,
+      maxOutputTokens: params.max_tokens,
+      temperature: params.temperature,
+      topP: params.top_p,
+      stopSequences: params.stop_sequences,
+      stopWhen: stepCountIs(100),
+      headers: defaultAppHeaders(),
+      providerOptions: {}
+    })
+
+    // Process the stream through the adapter
+    await adapter.processStream(result.fullStream)
+
+    // Send done marker
+    response.write(formatSSEDone())
+    response.end()
+
+    logger.info('Unified message stream completed', {
+      providerId: provider.id,
+      modelId
+    })
+
+    onComplete?.()
+  } catch (error) {
+    logger.error('Error in unified message stream', error as Error, {
+      providerId: provider.id,
+      modelId
+    })
+
+    // Try to send error event if response is still writable
+    if (!response.writableEnded) {
+      try {
+        const errorMessage = error instanceof Error ? error.message : 'Unknown error'
+        response.write(
+          `event: error\ndata: ${JSON.stringify({
+            type: 'error',
+            error: {
+              type: 'api_error',
+              message: errorMessage
+            }
+          })}\n\n`
+        )
+        response.end()
+      } catch {
+        // Response already ended
+      }
+    }
+
+    onError?.(error)
+    throw error
+  }
+}
+
+/**
+ * Generate a non-streaming message response
+ */
+export async function generateUnifiedMessage(
+  provider: Provider,
+  modelId: string,
+  params: MessageCreateParams
+): Promise<ReturnType<AiSdkToAnthropicSSE['buildNonStreamingResponse']>> {
+  logger.info('Starting unified message generation', {
+    providerId: provider.id,
+    providerType: provider.type,
+    modelId
+  })
+
+  try {
+    // Create language model (async - uses @cherrystudio/ai-core)
+    const model = await createLanguageModel(provider, modelId)
+
+    // Convert messages
+    const coreMessages = convertAnthropicToAiMessages(params)
+
+    // Create adapter to collect the response
+    let finalResponse: ReturnType<AiSdkToAnthropicSSE['buildNonStreamingResponse']> | null = null
+    const adapter = new AiSdkToAnthropicSSE({
+      model: `${provider.id}:${modelId}`,
+      onEvent: () => {
+        // We don't need to emit events for non-streaming
+      }
+    })
+
+    // Generate text
+    const result = streamText({
+      model,
+      messages: coreMessages,
+      maxOutputTokens: params.max_tokens,
+      temperature: params.temperature,
+      topP: params.top_p,
+      stopSequences: params.stop_sequences,
+      headers: defaultAppHeaders(),
+      stopWhen: stepCountIs(100)
+    })
+
+    // Process the stream to build the response
+    await adapter.processStream(result.fullStream)
+
+    // Get the final response
+    finalResponse = adapter.buildNonStreamingResponse()
+
+    logger.info('Unified message generation completed', {
+      providerId: provider.id,
+      modelId
+    })
+
+    return finalResponse
+  } catch (error) {
+    logger.error('Error in unified message generation', error as Error, {
+      providerId: provider.id,
+      modelId
+    })
+    throw error
+  }
+}
+
+export default {
+  streamUnifiedMessages,
+  generateUnifiedMessage
+}
diff --git a/src/main/services/agents/services/claudecode/index.ts b/src/main/services/agents/services/claudecode/index.ts
index 53b318c5b2..261ff7c07e 100644
--- a/src/main/services/agents/services/claudecode/index.ts
+++ b/src/main/services/agents/services/claudecode/index.ts
@@ -84,18 +84,14 @@ class ClaudeCodeService implements AgentServiceInterface {
       })
       return aiStream
     }
-    if (
-      (modelInfo.provider?.type !== 'anthropic' &&
-        (modelInfo.provider?.anthropicApiHost === undefined || modelInfo.provider.anthropicApiHost.trim() === '')) ||
-      modelInfo.provider.apiKey === ''
-    ) {
-      logger.error('Anthropic provider configuration is missing', {
-        modelInfo
-      })
-
+    // Validate provider has required configuration
+    // Note: We no longer restrict to anthropic type only - the API Server's unified adapter
+    // handles format conversion for any provider type (OpenAI, Gemini, etc.)
+    if (!modelInfo.provider?.apiKey) {
+      logger.error('Provider API key is missing', { modelInfo })
       aiStream.emit('data', {
         type: 'error',
-        error: new Error(`Invalid provider type '${modelInfo.provider?.type}'. Expected 'anthropic' provider type.`)
+        error: new Error(`Provider '${modelInfo.provider?.id}' is missing API key configuration.`)
       })
       return aiStream
     }
@@ -106,15 +102,14 @@ class ClaudeCodeService implements AgentServiceInterface {
       Object.entries(loginShellEnv).filter(([key]) => !key.toLowerCase().endsWith('_proxy'))
     ) as Record<string, string>
 
+    // Route through local API Server which handles format conversion via unified adapter
+    // This enables Claude Code Agent to work with any provider (OpenAI, Gemini, etc.)
+ // The API Server converts AI SDK responses to Anthropic SSE format transparently const env = { ...loginShellEnvWithoutProxies, - // TODO: fix the proxy api server - // ANTHROPIC_API_KEY: apiConfig.apiKey, - // ANTHROPIC_AUTH_TOKEN: apiConfig.apiKey, - // ANTHROPIC_BASE_URL: `http://${apiConfig.host}:${apiConfig.port}/${modelInfo.provider.id}`, - ANTHROPIC_API_KEY: modelInfo.provider.apiKey, - ANTHROPIC_AUTH_TOKEN: modelInfo.provider.apiKey, - ANTHROPIC_BASE_URL: modelInfo.provider.anthropicApiHost?.trim() || modelInfo.provider.apiHost, + ANTHROPIC_API_KEY: apiConfig.apiKey, + ANTHROPIC_AUTH_TOKEN: apiConfig.apiKey, + ANTHROPIC_BASE_URL: `http://${apiConfig.host}:${apiConfig.port}/${modelInfo.provider.id}`, ANTHROPIC_MODEL: modelInfo.modelId, ANTHROPIC_DEFAULT_OPUS_MODEL: modelInfo.modelId, ANTHROPIC_DEFAULT_SONNET_MODEL: modelInfo.modelId, diff --git a/src/renderer/src/aiCore/legacy/clients/gemini/VertexAPIClient.ts b/src/renderer/src/aiCore/legacy/clients/gemini/VertexAPIClient.ts index fb371d9ae5..3eaf2f0fb9 100644 --- a/src/renderer/src/aiCore/legacy/clients/gemini/VertexAPIClient.ts +++ b/src/renderer/src/aiCore/legacy/clients/gemini/VertexAPIClient.ts @@ -24,7 +24,7 @@ export class VertexAPIClient extends GeminiAPIClient { this.anthropicVertexClient = new AnthropicVertexClient(provider) // 如果传入的是普通 Provider,转换为 VertexProvider if (isVertexProvider(provider)) { - this.vertexProvider = provider + this.vertexProvider = provider as VertexProvider } else { this.vertexProvider = createVertexProvider(provider) } diff --git a/src/renderer/src/aiCore/provider/config/azure-anthropic.ts b/src/renderer/src/aiCore/provider/config/azure-anthropic.ts deleted file mode 100644 index c6cb521386..0000000000 --- a/src/renderer/src/aiCore/provider/config/azure-anthropic.ts +++ /dev/null @@ -1,22 +0,0 @@ -import type { Provider } from '@renderer/types' - -import { provider2Provider, startsWith } from './helper' -import type { RuleSet } from './types' - -// https://platform.claude.com/docs/en/build-with-claude/claude-in-microsoft-foundry -const AZURE_ANTHROPIC_RULES: RuleSet = { - rules: [ - { - match: startsWith('claude'), - provider: (provider: Provider) => ({ - ...provider, - type: 'anthropic', - apiHost: provider.apiHost + 'anthropic/v1', - id: 'azure-anthropic' - }) - } - ], - fallbackRule: (provider: Provider) => provider -} - -export const azureAnthropicProviderCreator = provider2Provider.bind(null, AZURE_ANTHROPIC_RULES) diff --git a/src/renderer/src/aiCore/provider/config/helper.ts b/src/renderer/src/aiCore/provider/config/helper.ts deleted file mode 100644 index 656911fc76..0000000000 --- a/src/renderer/src/aiCore/provider/config/helper.ts +++ /dev/null @@ -1,22 +0,0 @@ -import type { Model, Provider } from '@renderer/types' - -import type { RuleSet } from './types' - -export const startsWith = (prefix: string) => (model: Model) => model.id.toLowerCase().startsWith(prefix.toLowerCase()) -export const endpointIs = (type: string) => (model: Model) => model.endpoint_type === type - -/** - * 解析模型对应的Provider - * @param ruleSet 规则集对象 - * @param model 模型对象 - * @param provider 原始provider对象 - * @returns 解析出的provider对象 - */ -export function provider2Provider(ruleSet: RuleSet, model: Model, provider: Provider): Provider { - for (const rule of ruleSet.rules) { - if (rule.match(model)) { - return rule.provider(provider) - } - } - return ruleSet.fallbackRule(provider) -} diff --git a/src/renderer/src/aiCore/provider/config/index.ts b/src/renderer/src/aiCore/provider/config/index.ts index 
2f51234cec..b1d57d5a1a 100644 --- a/src/renderer/src/aiCore/provider/config/index.ts +++ b/src/renderer/src/aiCore/provider/config/index.ts @@ -1,3 +1,7 @@ -export { aihubmixProviderCreator } from './aihubmix' -export { newApiResolverCreator } from './newApi' -export { vertexAnthropicProviderCreator } from './vertext-anthropic' +// Re-export from shared config +export { + aihubmixProviderCreator, + azureAnthropicProviderCreator, + newApiResolverCreator, + vertexAnthropicProviderCreator +} from '@shared/provider/config' diff --git a/src/renderer/src/aiCore/provider/config/types.ts b/src/renderer/src/aiCore/provider/config/types.ts deleted file mode 100644 index f3938b84d1..0000000000 --- a/src/renderer/src/aiCore/provider/config/types.ts +++ /dev/null @@ -1,9 +0,0 @@ -import type { Model, Provider } from '@renderer/types' - -export interface RuleSet { - rules: Array<{ - match: (model: Model) => boolean - provider: (provider: Provider) => Provider - }> - fallbackRule: (provider: Provider) => Provider -} diff --git a/src/renderer/src/aiCore/provider/config/vertext-anthropic.ts b/src/renderer/src/aiCore/provider/config/vertext-anthropic.ts deleted file mode 100644 index 23c8b5185c..0000000000 --- a/src/renderer/src/aiCore/provider/config/vertext-anthropic.ts +++ /dev/null @@ -1,19 +0,0 @@ -import type { Provider } from '@renderer/types' - -import { provider2Provider, startsWith } from './helper' -import type { RuleSet } from './types' - -const VERTEX_ANTHROPIC_RULES: RuleSet = { - rules: [ - { - match: startsWith('claude'), - provider: (provider: Provider) => ({ - ...provider, - id: 'google-vertex-anthropic' - }) - } - ], - fallbackRule: (provider: Provider) => provider -} - -export const vertexAnthropicProviderCreator = provider2Provider.bind(null, VERTEX_ANTHROPIC_RULES) diff --git a/src/renderer/src/aiCore/provider/factory.ts b/src/renderer/src/aiCore/provider/factory.ts index 9760839389..97ab29db81 100644 --- a/src/renderer/src/aiCore/provider/factory.ts +++ b/src/renderer/src/aiCore/provider/factory.ts @@ -1,8 +1,7 @@ -import { hasProviderConfigByAlias, type ProviderId, resolveProviderConfigId } from '@cherrystudio/ai-core/provider' import { createProvider as createProviderCore } from '@cherrystudio/ai-core/provider' import { loggerService } from '@logger' import type { Provider } from '@renderer/types' -import { isAzureOpenAIProvider, isAzureResponsesEndpoint } from '@renderer/utils/provider' +import { getAiSdkProviderId as sharedGetAiSdkProviderId } from '@shared/provider' import type { Provider as AiSdkProvider } from 'ai' import type { AiSdkConfig } from '../types' @@ -22,68 +21,12 @@ const logger = loggerService.withContext('ProviderFactory') } })() -/** - * 静态Provider映射表 - * 处理Cherry Studio特有的provider ID到AI SDK标准ID的映射 - */ -const STATIC_PROVIDER_MAPPING: Record = { - gemini: 'google', // Google Gemini -> google - 'azure-openai': 'azure', // Azure OpenAI -> azure - 'openai-response': 'openai', // OpenAI Responses -> openai - grok: 'xai', // Grok -> xai - copilot: 'github-copilot-openai-compatible' -} - -/** - * 尝试解析provider标识符(支持静态映射和别名) - */ -function tryResolveProviderId(identifier: string): ProviderId | null { - // 1. 检查静态映射 - const staticMapping = STATIC_PROVIDER_MAPPING[identifier] - if (staticMapping) { - return staticMapping - } - - // 2. 
检查AiCore是否支持(包括别名支持) - if (hasProviderConfigByAlias(identifier)) { - // 解析为真实的Provider ID - return resolveProviderConfigId(identifier) as ProviderId - } - - return null -} - /** * 获取AI SDK Provider ID - * 简化版:减少重复逻辑,利用通用解析函数 + * Uses shared implementation with renderer-specific config checker */ export function getAiSdkProviderId(provider: Provider): string { - // 1. 尝试解析provider.id - const resolvedFromId = tryResolveProviderId(provider.id) - if (isAzureOpenAIProvider(provider)) { - if (isAzureResponsesEndpoint(provider)) { - return 'azure-responses' - } else { - return 'azure' - } - } - if (resolvedFromId) { - return resolvedFromId - } - - // 2. 尝试解析provider.type - // 会把所有类型为openai的自定义provider解析到aisdk的openaiProvider上 - if (provider.type !== 'openai') { - const resolvedFromType = tryResolveProviderId(provider.type) - if (resolvedFromType) { - return resolvedFromType - } - } - if (provider.apiHost.includes('api.openai.com')) { - return 'openai-chat' - } - // 3. 最后的fallback(使用provider本身的id) - return provider.id + return sharedGetAiSdkProviderId(provider) } export async function createAiSdkProvider(config: AiSdkConfig): Promise { diff --git a/src/renderer/src/aiCore/provider/providerConfig.ts b/src/renderer/src/aiCore/provider/providerConfig.ts index 53194d3506..8e1a63f5a0 100644 --- a/src/renderer/src/aiCore/provider/providerConfig.ts +++ b/src/renderer/src/aiCore/provider/providerConfig.ts @@ -1,4 +1,4 @@ -import { formatPrivateKey, hasProviderConfig, ProviderConfigFactory } from '@cherrystudio/ai-core/provider' +import { hasProviderConfig } from '@cherrystudio/ai-core/provider' import { isOpenAIChatCompletionOnlyModel } from '@renderer/config/models' import { getAwsBedrockAccessKeyId, @@ -10,22 +10,17 @@ import { import { createVertexProvider, isVertexAIConfigured } from '@renderer/hooks/useVertexAI' import { getProviderByModel } from '@renderer/services/AssistantService' import store from '@renderer/store' -import { isSystemProvider, type Model, type Provider, SystemProviderIds } from '@renderer/types' -import { formatApiHost, formatAzureOpenAIApiHost, formatVertexApiHost, routeToEndpoint } from '@renderer/utils/api' +import { isSystemProvider, type Model, type Provider } from '@renderer/types' import { - isAnthropicProvider, - isAzureOpenAIProvider, - isCherryAIProvider, - isGeminiProvider, - isNewApiProvider, - isPerplexityProvider, - isVertexProvider -} from '@renderer/utils/provider' + type AiSdkConfigContext, + formatProviderApiHost as sharedFormatProviderApiHost, + type ProviderFormatContext, + providerToAiSdkConfig as sharedProviderToAiSdkConfig, + resolveActualProvider +} from '@shared/provider' import { cloneDeep } from 'lodash' import type { AiSdkConfig } from '../types' -import { aihubmixProviderCreator, newApiResolverCreator, vertexAnthropicProviderCreator } from './config' -import { azureAnthropicProviderCreator } from './config/azure-anthropic' import { COPILOT_DEFAULT_HEADERS } from './constants' import { getAiSdkProviderId } from './factory' @@ -56,61 +51,51 @@ function getRotatedApiKey(provider: Provider): string { } /** - * 处理特殊provider的转换逻辑 + * Renderer-specific context for providerToAiSdkConfig + * Provides implementations using browser APIs, store, and hooks */ -function handleSpecialProviders(model: Model, provider: Provider): Provider { - if (isNewApiProvider(provider)) { - return newApiResolverCreator(model, provider) +function createRendererSdkContext(model: Model): AiSdkConfigContext { + return { + getRotatedApiKey: (provider) => getRotatedApiKey(provider as 
Provider), + isOpenAIChatCompletionOnlyModel: () => isOpenAIChatCompletionOnlyModel(model), + getCopilotDefaultHeaders: () => COPILOT_DEFAULT_HEADERS, + getCopilotStoredHeaders: () => store.getState().copilot.defaultHeaders ?? {}, + getAwsBedrockConfig: () => { + const authType = getAwsBedrockAuthType() + return { + authType, + region: getAwsBedrockRegion(), + apiKey: authType === 'apiKey' ? getAwsBedrockApiKey() : undefined, + accessKeyId: authType === 'iam' ? getAwsBedrockAccessKeyId() : undefined, + secretAccessKey: authType === 'iam' ? getAwsBedrockSecretAccessKey() : undefined + } + }, + getVertexConfig: (provider) => { + if (!isVertexAIConfigured()) { + return undefined + } + return createVertexProvider(provider as Provider) + }, + getEndpointType: () => model.endpoint_type } - - if (isSystemProvider(provider)) { - if (provider.id === 'aihubmix') { - return aihubmixProviderCreator(model, provider) - } - if (provider.id === 'vertexai') { - return vertexAnthropicProviderCreator(model, provider) - } - } - if (isAzureOpenAIProvider(provider)) { - return azureAnthropicProviderCreator(model, provider) - } - return provider } /** * 主要用来对齐AISdk的BaseURL格式 - * @param provider - * @returns + * Uses shared implementation with renderer-specific context */ -function formatProviderApiHost(provider: Provider): Provider { - const formatted = { ...provider } - if (formatted.anthropicApiHost) { - formatted.anthropicApiHost = formatApiHost(formatted.anthropicApiHost) - } - - if (isAnthropicProvider(provider)) { - const baseHost = formatted.anthropicApiHost || formatted.apiHost - // AI SDK needs /v1 in baseURL, Anthropic SDK will strip it in getSdkClient - formatted.apiHost = formatApiHost(baseHost) - if (!formatted.anthropicApiHost) { - formatted.anthropicApiHost = formatted.apiHost +function getRendererFormatContext(): ProviderFormatContext { + const vertexSettings = store.getState().llm.settings.vertexai + return { + vertex: { + project: vertexSettings.projectId || 'default-project', + location: vertexSettings.location || 'us-central1' } - } else if (formatted.id === SystemProviderIds.copilot || formatted.id === SystemProviderIds.github) { - formatted.apiHost = formatApiHost(formatted.apiHost, false) - } else if (isGeminiProvider(formatted)) { - formatted.apiHost = formatApiHost(formatted.apiHost, true, 'v1beta') - } else if (isAzureOpenAIProvider(formatted)) { - formatted.apiHost = formatAzureOpenAIApiHost(formatted.apiHost) - } else if (isVertexProvider(formatted)) { - formatted.apiHost = formatVertexApiHost(formatted) - } else if (isCherryAIProvider(formatted)) { - formatted.apiHost = formatApiHost(formatted.apiHost, false) - } else if (isPerplexityProvider(formatted)) { - formatted.apiHost = formatApiHost(formatted.apiHost, false) - } else { - formatted.apiHost = formatApiHost(formatted.apiHost) } - return formatted +} + +function formatProviderApiHost(provider: Provider): Provider { + return sharedFormatProviderApiHost(provider, getRendererFormatContext()) } /** @@ -122,7 +107,9 @@ export function getActualProvider(model: Model): Provider { // 按顺序处理各种转换 let actualProvider = cloneDeep(baseProvider) - actualProvider = handleSpecialProviders(model, actualProvider) + actualProvider = resolveActualProvider(actualProvider, model, { + isSystemProvider + }) as Provider actualProvider = formatProviderApiHost(actualProvider) return actualProvider @@ -130,121 +117,11 @@ export function getActualProvider(model: Model): Provider { /** * 将 Provider 配置转换为新 AI SDK 格式 - * 简化版:利用新的别名映射系统 + * Uses shared 
implementation with renderer-specific context */ export function providerToAiSdkConfig(actualProvider: Provider, model: Model): AiSdkConfig { - const aiSdkProviderId = getAiSdkProviderId(actualProvider) - - // 构建基础配置 - const { baseURL, endpoint } = routeToEndpoint(actualProvider.apiHost) - const baseConfig = { - baseURL: baseURL, - apiKey: getRotatedApiKey(actualProvider) - } - - const isCopilotProvider = actualProvider.id === SystemProviderIds.copilot - if (isCopilotProvider) { - const storedHeaders = store.getState().copilot.defaultHeaders ?? {} - const options = ProviderConfigFactory.fromProvider('github-copilot-openai-compatible', baseConfig, { - headers: { - ...COPILOT_DEFAULT_HEADERS, - ...storedHeaders, - ...actualProvider.extra_headers - }, - name: actualProvider.id, - includeUsage: true - }) - - return { - providerId: 'github-copilot-openai-compatible', - options - } - } - - // 处理OpenAI模式 - const extraOptions: any = {} - extraOptions.endpoint = endpoint - if (actualProvider.type === 'openai-response' && !isOpenAIChatCompletionOnlyModel(model)) { - extraOptions.mode = 'responses' - } else if (aiSdkProviderId === 'openai' || (aiSdkProviderId === 'cherryin' && actualProvider.type === 'openai')) { - extraOptions.mode = 'chat' - } - - // 添加额外headers - if (actualProvider.extra_headers) { - extraOptions.headers = actualProvider.extra_headers - // copy from openaiBaseClient/openaiResponseApiClient - if (aiSdkProviderId === 'openai') { - extraOptions.headers = { - ...extraOptions.headers, - 'HTTP-Referer': 'https://cherry-ai.com', - 'X-Title': 'Cherry Studio', - 'X-Api-Key': baseConfig.apiKey - } - } - } - // azure - // https://learn.microsoft.com/en-us/azure/ai-foundry/openai/latest - // https://learn.microsoft.com/en-us/azure/ai-foundry/openai/how-to/responses?tabs=python-key#responses-api - if (aiSdkProviderId === 'azure-responses') { - extraOptions.mode = 'responses' - } else if (aiSdkProviderId === 'azure') { - extraOptions.mode = 'chat' - } - - // bedrock - if (aiSdkProviderId === 'bedrock') { - const authType = getAwsBedrockAuthType() - extraOptions.region = getAwsBedrockRegion() - - if (authType === 'apiKey') { - extraOptions.apiKey = getAwsBedrockApiKey() - } else { - extraOptions.accessKeyId = getAwsBedrockAccessKeyId() - extraOptions.secretAccessKey = getAwsBedrockSecretAccessKey() - } - } - // google-vertex - if (aiSdkProviderId === 'google-vertex' || aiSdkProviderId === 'google-vertex-anthropic') { - if (!isVertexAIConfigured()) { - throw new Error('VertexAI is not configured. Please configure project, location and service account credentials.') - } - const { project, location, googleCredentials } = createVertexProvider(actualProvider) - extraOptions.project = project - extraOptions.location = location - extraOptions.googleCredentials = { - ...googleCredentials, - privateKey: formatPrivateKey(googleCredentials.privateKey) - } - baseConfig.baseURL += aiSdkProviderId === 'google-vertex' ? 
'/publishers/google' : '/publishers/anthropic/models' - } - - // cherryin - if (aiSdkProviderId === 'cherryin') { - if (model.endpoint_type) { - extraOptions.endpointType = model.endpoint_type - } - } - - if (hasProviderConfig(aiSdkProviderId) && aiSdkProviderId !== 'openai-compatible') { - const options = ProviderConfigFactory.fromProvider(aiSdkProviderId, baseConfig, extraOptions) - return { - providerId: aiSdkProviderId, - options - } - } - - // 否则fallback到openai-compatible - const options = ProviderConfigFactory.createOpenAICompatible(baseConfig.baseURL, baseConfig.apiKey) - return { - providerId: 'openai-compatible', - options: { - ...options, - name: actualProvider.id, - ...extraOptions, - includeUsage: true - } - } + const context = createRendererSdkContext(model) + return sharedProviderToAiSdkConfig(actualProvider, model.id, context) as AiSdkConfig } /** @@ -287,13 +164,13 @@ export async function prepareSpecialProviderConfig( break } case 'cherryai': { - config.options.fetch = async (url, options) => { + config.options.fetch = async (url: RequestInfo | URL, options: RequestInit) => { // 在这里对最终参数进行签名 const signature = await window.api.cherryai.generateSignature({ method: 'POST', path: '/chat/completions', query: '', - body: JSON.parse(options.body) + body: JSON.parse(options.body as string) }) return fetch(url, { ...options, diff --git a/src/renderer/src/aiCore/provider/providerInitialization.ts b/src/renderer/src/aiCore/provider/providerInitialization.ts index 2e4b9fced2..5254e78851 100644 --- a/src/renderer/src/aiCore/provider/providerInitialization.ts +++ b/src/renderer/src/aiCore/provider/providerInitialization.ts @@ -1,113 +1,13 @@ -import { type ProviderConfig, registerMultipleProviderConfigs } from '@cherrystudio/ai-core/provider' import { loggerService } from '@logger' +import { initializeSharedProviders, SHARED_PROVIDER_CONFIGS } from '@shared/provider' const logger = loggerService.withContext('ProviderConfigs') -/** - * 新Provider配置定义 - * 定义了需要动态注册的AI Providers - */ -export const NEW_PROVIDER_CONFIGS: ProviderConfig[] = [ - { - id: 'openrouter', - name: 'OpenRouter', - import: () => import('@openrouter/ai-sdk-provider'), - creatorFunctionName: 'createOpenRouter', - supportsImageGeneration: true, - aliases: ['openrouter'] - }, - { - id: 'google-vertex', - name: 'Google Vertex AI', - import: () => import('@ai-sdk/google-vertex/edge'), - creatorFunctionName: 'createVertex', - supportsImageGeneration: true, - aliases: ['vertexai'] - }, - { - id: 'google-vertex-anthropic', - name: 'Google Vertex AI Anthropic', - import: () => import('@ai-sdk/google-vertex/anthropic/edge'), - creatorFunctionName: 'createVertexAnthropic', - supportsImageGeneration: true, - aliases: ['vertexai-anthropic'] - }, - { - id: 'azure-anthropic', - name: 'Azure AI Anthropic', - import: () => import('@ai-sdk/anthropic'), - creatorFunctionName: 'createAnthropic', - supportsImageGeneration: false, - aliases: ['azure-anthropic'] - }, - { - id: 'github-copilot-openai-compatible', - name: 'GitHub Copilot OpenAI Compatible', - import: () => import('@opeoginni/github-copilot-openai-compatible'), - creatorFunctionName: 'createGitHubCopilotOpenAICompatible', - supportsImageGeneration: false, - aliases: ['copilot', 'github-copilot'] - }, - { - id: 'bedrock', - name: 'Amazon Bedrock', - import: () => import('@ai-sdk/amazon-bedrock'), - creatorFunctionName: 'createAmazonBedrock', - supportsImageGeneration: true, - aliases: ['aws-bedrock'] - }, - { - id: 'perplexity', - name: 'Perplexity', - import: () => 
import('@ai-sdk/perplexity'), - creatorFunctionName: 'createPerplexity', - supportsImageGeneration: false, - aliases: ['perplexity'] - }, - { - id: 'mistral', - name: 'Mistral', - import: () => import('@ai-sdk/mistral'), - creatorFunctionName: 'createMistral', - supportsImageGeneration: false, - aliases: ['mistral'] - }, - { - id: 'huggingface', - name: 'HuggingFace', - import: () => import('@ai-sdk/huggingface'), - creatorFunctionName: 'createHuggingFace', - supportsImageGeneration: true, - aliases: ['hf', 'hugging-face'] - }, - { - id: 'ai-gateway', - name: 'AI Gateway', - import: () => import('@ai-sdk/gateway'), - creatorFunctionName: 'createGateway', - supportsImageGeneration: true, - aliases: ['gateway'] - }, - { - id: 'cerebras', - name: 'Cerebras', - import: () => import('@ai-sdk/cerebras'), - creatorFunctionName: 'createCerebras', - supportsImageGeneration: false - } -] as const +export const NEW_PROVIDER_CONFIGS = SHARED_PROVIDER_CONFIGS -/** - * 初始化新的Providers - * 使用aiCore的动态注册功能 - */ export async function initializeNewProviders(): Promise { - try { - const successCount = registerMultipleProviderConfigs(NEW_PROVIDER_CONFIGS) - if (successCount < NEW_PROVIDER_CONFIGS.length) { - logger.warn('Some providers failed to register. Check previous error logs.') - } - } catch (error) { - logger.error('Failed to initialize new providers:', error as Error) - } + initializeSharedProviders({ + warn: (message) => logger.warn(message), + error: (message, error) => logger.error(message, error) + }) } diff --git a/src/renderer/src/types/index.ts b/src/renderer/src/types/index.ts index bff57185a7..7db6cbf4bd 100644 --- a/src/renderer/src/types/index.ts +++ b/src/renderer/src/types/index.ts @@ -7,6 +7,8 @@ import type { CSSProperties } from 'react' export * from './file' export * from './note' +import type { MinimalModel } from '@shared/provider/types' + import type { StreamTextParams } from './aiCoreTypes' import type { Chunk } from './chunk' import type { FileMetadata } from './file' @@ -256,7 +258,7 @@ export type ModelCapability = { isUserSelected?: boolean } -export type Model = { +export type Model = MinimalModel & { id: string provider: string name: string diff --git a/src/renderer/src/types/provider.ts b/src/renderer/src/types/provider.ts index 9d948f16d0..573e1e1007 100644 --- a/src/renderer/src/types/provider.ts +++ b/src/renderer/src/types/provider.ts @@ -1,24 +1,14 @@ import type OpenAI from '@cherrystudio/openai' +import type { MinimalProvider } from '@shared/provider' +import type { ProviderType, SystemProviderId, SystemProviderIdTypeMap } from '@shared/provider/types' +import { isSystemProviderId, SystemProviderIds } from '@shared/provider/types' import type { Model } from '@types' -import * as z from 'zod' import type { OpenAIVerbosity } from './aiCoreTypes' -export const ProviderTypeSchema = z.enum([ - 'openai', - 'openai-response', - 'anthropic', - 'gemini', - 'azure-openai', - 'vertexai', - 'mistral', - 'aws-bedrock', - 'vertex-anthropic', - 'new-api', - 'ai-gateway' -]) - -export type ProviderType = z.infer +export type { ProviderType } from '@shared/provider' +export type { SystemProviderId, SystemProviderIdTypeMap } from '@shared/provider/types' +export { isSystemProviderId, ProviderTypeSchema, SystemProviderIds } from '@shared/provider/types' // undefined is treated as supported, enabled by default export type ProviderApiOptions = { @@ -93,7 +83,7 @@ export function isAwsBedrockAuthType(type: string): type is AwsBedrockAuthType { return Object.hasOwn(AwsBedrockAuthTypes, 
type) } -export type Provider = { +export type Provider = MinimalProvider & { id: string type: ProviderType name: string @@ -128,140 +118,6 @@ export type Provider = { extra_headers?: Record } -export const SystemProviderIdSchema = z.enum([ - 'cherryin', - 'silicon', - 'aihubmix', - 'ocoolai', - 'deepseek', - 'ppio', - 'alayanew', - 'qiniu', - 'dmxapi', - 'burncloud', - 'tokenflux', - '302ai', - 'cephalon', - 'lanyun', - 'ph8', - 'openrouter', - 'ollama', - 'ovms', - 'new-api', - 'lmstudio', - 'anthropic', - 'openai', - 'azure-openai', - 'gemini', - 'vertexai', - 'github', - 'copilot', - 'zhipu', - 'yi', - 'moonshot', - 'baichuan', - 'dashscope', - 'stepfun', - 'doubao', - 'infini', - 'minimax', - 'groq', - 'together', - 'fireworks', - 'nvidia', - 'grok', - 'hyperbolic', - 'mistral', - 'jina', - 'perplexity', - 'modelscope', - 'xirang', - 'hunyuan', - 'tencent-cloud-ti', - 'baidu-cloud', - 'gpustack', - 'voyageai', - 'aws-bedrock', - 'poe', - 'aionly', - 'longcat', - 'huggingface', - 'sophnet', - 'ai-gateway', - 'cerebras' -]) - -export type SystemProviderId = z.infer - -export const isSystemProviderId = (id: string): id is SystemProviderId => { - return SystemProviderIdSchema.safeParse(id).success -} - -export const SystemProviderIds = { - cherryin: 'cherryin', - silicon: 'silicon', - aihubmix: 'aihubmix', - ocoolai: 'ocoolai', - deepseek: 'deepseek', - ppio: 'ppio', - alayanew: 'alayanew', - qiniu: 'qiniu', - dmxapi: 'dmxapi', - burncloud: 'burncloud', - tokenflux: 'tokenflux', - '302ai': '302ai', - cephalon: 'cephalon', - lanyun: 'lanyun', - ph8: 'ph8', - sophnet: 'sophnet', - openrouter: 'openrouter', - ollama: 'ollama', - ovms: 'ovms', - 'new-api': 'new-api', - lmstudio: 'lmstudio', - anthropic: 'anthropic', - openai: 'openai', - 'azure-openai': 'azure-openai', - gemini: 'gemini', - vertexai: 'vertexai', - github: 'github', - copilot: 'copilot', - zhipu: 'zhipu', - yi: 'yi', - moonshot: 'moonshot', - baichuan: 'baichuan', - dashscope: 'dashscope', - stepfun: 'stepfun', - doubao: 'doubao', - infini: 'infini', - minimax: 'minimax', - groq: 'groq', - together: 'together', - fireworks: 'fireworks', - nvidia: 'nvidia', - grok: 'grok', - hyperbolic: 'hyperbolic', - mistral: 'mistral', - jina: 'jina', - perplexity: 'perplexity', - modelscope: 'modelscope', - xirang: 'xirang', - hunyuan: 'hunyuan', - 'tencent-cloud-ti': 'tencent-cloud-ti', - 'baidu-cloud': 'baidu-cloud', - gpustack: 'gpustack', - voyageai: 'voyageai', - 'aws-bedrock': 'aws-bedrock', - poe: 'poe', - aionly: 'aionly', - longcat: 'longcat', - huggingface: 'huggingface', - 'ai-gateway': 'ai-gateway', - cerebras: 'cerebras' -} as const satisfies Record - -type SystemProviderIdTypeMap = typeof SystemProviderIds - export type SystemProvider = Provider & { id: SystemProviderId isSystem: true diff --git a/src/renderer/src/utils/api.ts b/src/renderer/src/utils/api.ts index 845187eb80..ab411e6f15 100644 --- a/src/renderer/src/utils/api.ts +++ b/src/renderer/src/utils/api.ts @@ -1,6 +1,15 @@ -import store from '@renderer/store' -import type { VertexProvider } from '@renderer/types' -import { trim } from 'lodash' +export { + formatApiHost, + formatAzureOpenAIApiHost, + formatVertexApiHost, + getAiSdkBaseUrl, + hasAPIVersion, + routeToEndpoint, + SUPPORTED_ENDPOINT_LIST, + SUPPORTED_IMAGE_ENDPOINT_LIST, + validateApiHost, + withoutTrailingSlash +} from '@shared/api' /** * 格式化 API key 字符串。 @@ -12,169 +21,6 @@ export function formatApiKeys(value: string): string { return value.replaceAll(',', ',').replaceAll('\n', ',') } -/** - * 判断 host 的 
path 中是否包含形如版本的字符串(例如 /v1、/v2beta 等), - * - * @param host - 要检查的 host 或 path 字符串 - * @returns 如果 path 中包含版本字符串则返回 true,否则 false - */ -export function hasAPIVersion(host?: string): boolean { - if (!host) return false - - // 匹配路径中以 `/v` 开头并可选跟随 `alpha` 或 `beta` 的版本段, - // 该段后面可以跟 `/` 或字符串结束(用于匹配诸如 `/v3alpha/resources` 的情况)。 - const versionRegex = /\/v\d+(?:alpha|beta)?(?=\/|$)/i - - try { - const url = new URL(host) - return versionRegex.test(url.pathname) - } catch { - // 若无法作为完整 URL 解析,则当作路径直接检测 - return versionRegex.test(host) - } -} - -/** - * Removes the trailing slash from a URL string if it exists. - * - * @template T - The string type to preserve type safety - * @param {T} url - The URL string to process - * @returns {T} The URL string without a trailing slash - * - * @example - * ```ts - * withoutTrailingSlash('https://example.com/') // 'https://example.com' - * withoutTrailingSlash('https://example.com') // 'https://example.com' - * ``` - */ -export function withoutTrailingSlash(url: T): T { - return url.replace(/\/$/, '') as T -} - -/** - * Formats an API host URL by normalizing it and optionally appending an API version. - * - * @param host - The API host URL to format. Leading/trailing whitespace will be trimmed and trailing slashes removed. - * @param isSupportedAPIVerion - Whether the API version is supported. Defaults to `true`. - * @param apiVersion - The API version to append if needed. Defaults to `'v1'`. - * - * @returns The formatted API host URL. If the host is empty after normalization, returns an empty string. - * If the host ends with '#', API version is not supported, or the host already contains a version, returns the normalized host as-is. - * Otherwise, returns the host with the API version appended. - * - * @example - * formatApiHost('https://api.example.com/') // Returns 'https://api.example.com/v1' - * formatApiHost('https://api.example.com#') // Returns 'https://api.example.com#' - * formatApiHost('https://api.example.com/v2', true, 'v1') // Returns 'https://api.example.com/v2' - */ -export function formatApiHost(host?: string, isSupportedAPIVerion: boolean = true, apiVersion: string = 'v1'): string { - const normalizedHost = withoutTrailingSlash(trim(host)) - if (!normalizedHost) { - return '' - } - - if (normalizedHost.endsWith('#') || !isSupportedAPIVerion || hasAPIVersion(normalizedHost)) { - return normalizedHost - } - return `${normalizedHost}/${apiVersion}` -} - -/** - * 格式化 Azure OpenAI 的 API 主机地址。 - */ -export function formatAzureOpenAIApiHost(host: string): string { - const normalizedHost = withoutTrailingSlash(host) - ?.replace(/\/v1$/, '') - .replace(/\/openai$/, '') - // NOTE: AISDK会添加上`v1` - return formatApiHost(normalizedHost + '/openai', false) -} - -export function formatVertexApiHost(provider: VertexProvider): string { - const { apiHost } = provider - const { projectId: project, location } = store.getState().llm.settings.vertexai - const trimmedHost = withoutTrailingSlash(trim(apiHost)) - if (!trimmedHost || trimmedHost.endsWith('aiplatform.googleapis.com')) { - const host = - location == 'global' ? 
'https://aiplatform.googleapis.com' : `https://${location}-aiplatform.googleapis.com` - return `${formatApiHost(host)}/projects/${project}/locations/${location}` - } - return formatApiHost(trimmedHost) -} - -// 目前对话界面只支持这些端点 -export const SUPPORTED_IMAGE_ENDPOINT_LIST = ['images/generations', 'images/edits', 'predict'] as const -export const SUPPORTED_ENDPOINT_LIST = [ - 'chat/completions', - 'responses', - 'messages', - 'generateContent', - 'streamGenerateContent', - ...SUPPORTED_IMAGE_ENDPOINT_LIST -] as const - -/** - * Converts an API host URL into separate base URL and endpoint components. - * - * @param apiHost - The API host string to parse. Expected to be a trimmed URL that may end with '#' followed by an endpoint identifier. - * @returns An object containing: - * - `baseURL`: The base URL without the endpoint suffix - * - `endpoint`: The matched endpoint identifier, or empty string if no match found - * - * @description - * This function extracts endpoint information from a composite API host string. - * If the host ends with '#', it attempts to match the preceding part against the supported endpoint list. - * The '#' delimiter is removed before processing. - * - * @example - * routeToEndpoint('https://api.example.com/openai/chat/completions#') - * // Returns: { baseURL: 'https://api.example.com/v1', endpoint: 'chat/completions' } - * - * @example - * routeToEndpoint('https://api.example.com/v1') - * // Returns: { baseURL: 'https://api.example.com/v1', endpoint: '' } - */ -export function routeToEndpoint(apiHost: string): { baseURL: string; endpoint: string } { - const trimmedHost = trim(apiHost) - // 前面已经确保apiHost合法 - if (!trimmedHost.endsWith('#')) { - return { baseURL: trimmedHost, endpoint: '' } - } - // 去掉结尾的 # - const host = trimmedHost.slice(0, -1) - const endpointMatch = SUPPORTED_ENDPOINT_LIST.find((endpoint) => host.endsWith(endpoint)) - if (!endpointMatch) { - const baseURL = withoutTrailingSlash(host) - return { baseURL, endpoint: '' } - } - const baseSegment = host.slice(0, host.length - endpointMatch.length) - const baseURL = withoutTrailingSlash(baseSegment).replace(/:$/, '') // 去掉结尾可能存在的冒号(gemini的特殊情况) - return { baseURL, endpoint: endpointMatch } -} - -/** - * 验证 API 主机地址是否合法。 - * - * @param {string} apiHost - 需要验证的 API 主机地址。 - * @returns {boolean} 如果是合法的 URL 则返回 true,否则返回 false。 - */ -export function validateApiHost(apiHost: string): boolean { - // 允许apiHost为空 - if (!apiHost || !trim(apiHost)) { - return true - } - try { - const url = new URL(trim(apiHost)) - // 验证协议是否为 http 或 https - if (url.protocol !== 'http:' && url.protocol !== 'https:') { - return false - } - return true - } catch { - return false - } -} - /** * API key 脱敏函数。仅保留部分前后字符,中间用星号代替。 * diff --git a/src/renderer/src/utils/naming.ts b/src/renderer/src/utils/naming.ts index bc24bc7db8..d258cee81a 100644 --- a/src/renderer/src/utils/naming.ts +++ b/src/renderer/src/utils/naming.ts @@ -2,6 +2,8 @@ import { getProviderLabel } from '@renderer/i18n/label' import type { Provider } from '@renderer/types' import { isSystemProvider } from '@renderer/types' +export { getBaseModelName, getLowerBaseModelName } from '@shared/utils/naming' + /** * 从模型 ID 中提取默认组名。 * 规则如下: @@ -50,38 +52,6 @@ export const getDefaultGroupName = (id: string, provider?: string): string => { return str } -/** - * 从模型 ID 中提取基础名称。 - * 例如: - * - 'deepseek/deepseek-r1' => 'deepseek-r1' - * - 'deepseek-ai/deepseek/deepseek-r1' => 'deepseek-r1' - * @param {string} id 模型 ID - * @param {string} [delimiter='/'] 分隔符,默认为 '/' - * @returns {string} 
基础名称 - */ -export const getBaseModelName = (id: string, delimiter: string = '/'): string => { - const parts = id.split(delimiter) - return parts[parts.length - 1] -} - -/** - * 从模型 ID 中提取基础名称并转换为小写。 - * 例如: - * - 'deepseek/DeepSeek-R1' => 'deepseek-r1' - * - 'deepseek-ai/deepseek/DeepSeek-R1' => 'deepseek-r1' - * @param {string} id 模型 ID - * @param {string} [delimiter='/'] 分隔符,默认为 '/' - * @returns {string} 小写的基础名称 - */ -export const getLowerBaseModelName = (id: string, delimiter: string = '/'): string => { - const baseModelName = getBaseModelName(id, delimiter).toLowerCase() - // for openrouter - if (baseModelName.endsWith(':free')) { - return baseModelName.replace(':free', '') - } - return baseModelName -} - /** * 获取模型服务商名称,根据是否内置服务商来决定要不要翻译 * @param provider 服务商 diff --git a/src/renderer/src/utils/provider.ts b/src/renderer/src/utils/provider.ts index e8fc1b5cc7..2c79d36352 100644 --- a/src/renderer/src/utils/provider.ts +++ b/src/renderer/src/utils/provider.ts @@ -1,10 +1,20 @@ import { CLAUDE_SUPPORTED_PROVIDERS } from '@renderer/pages/code' -import type { AzureOpenAIProvider, ProviderType, VertexProvider } from '@renderer/types' +import type { ProviderType } from '@renderer/types' import { isSystemProvider, type Provider, type SystemProviderId, SystemProviderIds } from '@renderer/types' - -export const isAzureResponsesEndpoint = (provider: AzureOpenAIProvider) => { - return provider.apiVersion === 'preview' || provider.apiVersion === 'v1' -} +export { + isAIGatewayProvider, + isAnthropicProvider, + isAwsBedrockProvider, + isAzureOpenAIProvider, + isAzureResponsesEndpoint, + isCherryAIProvider, + isGeminiProvider, + isNewApiProvider, + isOpenAICompatibleProvider, + isOpenAIProvider, + isPerplexityProvider, + isVertexProvider +} from '@shared/provider' export const getClaudeSupportedProviders = (providers: Provider[]) => { return providers.filter( @@ -119,55 +129,6 @@ export const isGeminiWebSearchProvider = (provider: Provider) => { return SUPPORT_GEMINI_NATIVE_WEB_SEARCH_PROVIDERS.some((id) => id === provider.id) } -export const isNewApiProvider = (provider: Provider) => { - return ['new-api', 'cherryin'].includes(provider.id) || provider.type === 'new-api' -} - -export function isCherryAIProvider(provider: Provider): boolean { - return provider.id === 'cherryai' -} - -export function isPerplexityProvider(provider: Provider): boolean { - return provider.id === 'perplexity' -} - -/** - * 判断是否为 OpenAI 兼容的提供商 - * @param {Provider} provider 提供商对象 - * @returns {boolean} 是否为 OpenAI 兼容提供商 - */ -export function isOpenAICompatibleProvider(provider: Provider): boolean { - return ['openai', 'new-api', 'mistral'].includes(provider.type) -} - -export function isAzureOpenAIProvider(provider: Provider): provider is AzureOpenAIProvider { - return provider.type === 'azure-openai' -} - -export function isOpenAIProvider(provider: Provider): boolean { - return provider.type === 'openai-response' -} - -export function isVertexProvider(provider: Provider): provider is VertexProvider { - return provider.type === 'vertexai' -} - -export function isAwsBedrockProvider(provider: Provider): boolean { - return provider.type === 'aws-bedrock' -} - -export function isAnthropicProvider(provider: Provider): boolean { - return provider.type === 'anthropic' -} - -export function isGeminiProvider(provider: Provider): boolean { - return provider.type === 'gemini' -} - -export function isAIGatewayProvider(provider: Provider): boolean { - return provider.type === 'ai-gateway' -} - const NOT_SUPPORT_API_VERSION_PROVIDERS = 
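/* providers whose API hosts must not have a version segment appended */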
['github', 'copilot', 'perplexity'] as const satisfies SystemProviderId[]

 export const isSupportAPIVersionProvider = (provider: Provider) => {

From 192357a32e150fa7952b4a103260a1e13572db31 Mon Sep 17 00:00:00 2001
From: suyao
Date: Thu, 27 Nov 2025 19:19:04 +0800
Subject: [PATCH 02/53] feat: Enhance thinking block management and tool conversion in unified messages

---
 .../shared/adapters/AiSdkToAnthropicSSE.ts    | 108 +++++++++++++-----
 .../apiServer/services/unified-messages.ts    |  89 +++++++++++++--
 .../agents/services/claudecode/transform.ts   |  30 ++++-
 3 files changed, 188 insertions(+), 39 deletions(-)

diff --git a/packages/shared/adapters/AiSdkToAnthropicSSE.ts b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
index 38fab703ac..1674609236 100644
--- a/packages/shared/adapters/AiSdkToAnthropicSSE.ts
+++ b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
@@ -59,7 +59,9 @@ interface AdapterState {
   currentBlockIndex: number
   blocks: Map<number, ContentBlockState>
   textBlockIndex: number | null
-  thinkingBlockIndex: number | null
+  // Track multiple thinking blocks by their reasoning ID
+  thinkingBlocks: Map<string, number> // reasoningId -> blockIndex
+  currentThinkingId: string | null // Currently active thinking block ID
   toolBlocks: Map<string, number> // toolCallId -> blockIndex
   stopReason: StopReason | null
   hasEmittedMessageStart: boolean
@@ -95,7 +97,8 @@ export class AiSdkToAnthropicSSE {
      currentBlockIndex: 0,
      blocks: new Map(),
      textBlockIndex: null,
-      thinkingBlockIndex: null,
+      thinkingBlocks: new Map(),
+      currentThinkingId: null,
      toolBlocks: new Map(),
      stopReason: null,
      hasEmittedMessageStart: false
@@ -133,7 +136,7 @@ export class AiSdkToAnthropicSSE {
    * Process a single AI SDK chunk and emit corresponding Anthropic events
    */
   private processChunk(chunk: TextStreamPart<ToolSet>): void {
-    logger.silly('AiSdkToAnthropicSSE - Processing chunk:', chunk)
+    logger.silly('AiSdkToAnthropicSSE - Processing chunk:', { chunk: JSON.stringify(chunk) })
     switch (chunk.type) {
       // === Text Events ===
       case 'text-start':
@@ -149,17 +152,23 @@ export class AiSdkToAnthropicSSE {
         break

       // === Reasoning/Thinking Events ===
-      case 'reasoning-start':
-        this.startThinkingBlock()
+      case 'reasoning-start': {
+        const reasoningId = (chunk as { id?: string }).id || `reasoning_${Date.now()}`
+        this.startThinkingBlock(reasoningId)
         break
+      }

-      case 'reasoning-delta':
-        this.emitThinkingDelta(chunk.text || '')
+      case 'reasoning-delta': {
+        const reasoningId = (chunk as { id?: string }).id
+        this.emitThinkingDelta(chunk.text || '', reasoningId)
         break
+      }

-      case 'reasoning-end':
-        this.stopThinkingBlock()
+      case 'reasoning-end': {
+        const reasoningId = (chunk as { id?: string }).id
+        this.stopThinkingBlock(reasoningId)
         break
+      }

       // === Tool Events ===
       case 'tool-call':
@@ -190,9 +199,7 @@ export class AiSdkToAnthropicSSE {

       // === Error Events ===
       case 'error':
-        // Anthropic doesn't have a standard error event in the stream
-        // Errors are typically sent as separate HTTP responses
-        // For now, we'll just log and continue
+        this.handleError(chunk.error)
         break

       // Ignore other event types
@@ -303,11 +310,13 @@ export class AiSdkToAnthropicSSE {
     this.state.textBlockIndex = null
   }

-  private startThinkingBlock(): void {
-    if (this.state.thinkingBlockIndex !== null) return
+  private startThinkingBlock(reasoningId: string): void {
+    // Check if this thinking block already exists
+    if (this.state.thinkingBlocks.has(reasoningId)) return

     const index = this.state.currentBlockIndex++
-    this.state.thinkingBlockIndex = index
+    this.state.thinkingBlocks.set(reasoningId, index)
+ 
this.state.currentThinkingId = reasoningId this.state.blocks.set(index, { type: 'thinking', index, @@ -330,15 +339,25 @@ export class AiSdkToAnthropicSSE { this.onEvent(event) } - private emitThinkingDelta(text: string): void { + private emitThinkingDelta(text: string, reasoningId?: string): void { if (!text) return - // Auto-start thinking block if not started - if (this.state.thinkingBlockIndex === null) { - this.startThinkingBlock() + // Determine which thinking block to use + const targetId = reasoningId || this.state.currentThinkingId + if (!targetId) { + // Auto-start thinking block if not started + const newId = `reasoning_${Date.now()}` + this.startThinkingBlock(newId) + return this.emitThinkingDelta(text, newId) + } + + const index = this.state.thinkingBlocks.get(targetId) + if (index === undefined) { + // If the block doesn't exist, create it + this.startThinkingBlock(targetId) + return this.emitThinkingDelta(text, targetId) } - const index = this.state.thinkingBlockIndex! const block = this.state.blocks.get(index) if (block) { block.content += text @@ -358,10 +377,12 @@ export class AiSdkToAnthropicSSE { this.onEvent(event) } - private stopThinkingBlock(): void { - if (this.state.thinkingBlockIndex === null) return + private stopThinkingBlock(reasoningId?: string): void { + const targetId = reasoningId || this.state.currentThinkingId + if (!targetId) return - const index = this.state.thinkingBlockIndex + const index = this.state.thinkingBlocks.get(targetId) + if (index === undefined) return const event: RawContentBlockStopEvent = { type: 'content_block_stop', @@ -369,7 +390,14 @@ export class AiSdkToAnthropicSSE { } this.onEvent(event) - this.state.thinkingBlockIndex = null + this.state.thinkingBlocks.delete(targetId) + + // Update currentThinkingId if we just closed the current one + if (this.state.currentThinkingId === targetId) { + // Set to the most recent remaining thinking block, or null if none + const remaining = Array.from(this.state.thinkingBlocks.keys()) + this.state.currentThinkingId = remaining.length > 0 ? 
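/* fall back to the most recently opened remaining block */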
remaining[remaining.length - 1] : null + } } private handleToolCall(chunk: { type: 'tool-call'; toolCallId: string; toolName: string; args: unknown }): void { @@ -471,13 +499,41 @@ export class AiSdkToAnthropicSSE { } } + private handleError(error: unknown): void { + // Log the error for debugging + logger.warn('AiSdkToAnthropicSSE - Provider error received:', { error }) + + // Extract error message + let errorMessage = 'Unknown error from provider' + if (error && typeof error === 'object') { + const err = error as { message?: string; metadata?: { raw?: string } } + if (err.metadata?.raw) { + errorMessage = `Provider error: ${err.metadata.raw}` + } else if (err.message) { + errorMessage = err.message + } + } else if (typeof error === 'string') { + errorMessage = error + } + + // Emit error as a text block so the user can see it + // First close any open thinking blocks to maintain proper event order + for (const reasoningId of Array.from(this.state.thinkingBlocks.keys())) { + this.stopThinkingBlock(reasoningId) + } + + // Emit the error as text + this.emitTextDelta(`\n\n[Error: ${errorMessage}]\n`) + } + private finalize(): void { // Close any open blocks if (this.state.textBlockIndex !== null) { this.stopTextBlock() } - if (this.state.thinkingBlockIndex !== null) { - this.stopThinkingBlock() + // Close all open thinking blocks + for (const reasoningId of this.state.thinkingBlocks.keys()) { + this.stopThinkingBlock(reasoningId) } // Emit message_delta with final stop reason and usage diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts index d0acd70231..0f71cfcfae 100644 --- a/src/main/apiServer/services/unified-messages.ts +++ b/src/main/apiServer/services/unified-messages.ts @@ -1,6 +1,11 @@ import type { LanguageModelV2ToolResultOutput } from '@ai-sdk/provider' import type { ReasoningPart, ToolCallPart, ToolResultPart } from '@ai-sdk/provider-utils' -import type { ImageBlockParam, MessageCreateParams, TextBlockParam } from '@anthropic-ai/sdk/resources/messages' +import type { + ImageBlockParam, + MessageCreateParams, + TextBlockParam, + Tool as AnthropicTool +} from '@anthropic-ai/sdk/resources/messages' import { createProvider as createProviderCore } from '@cherrystudio/ai-core/provider' import { loggerService } from '@logger' import { reduxService } from '@main/services/ReduxService' @@ -16,8 +21,8 @@ import { } from '@shared/provider' import { defaultAppHeaders } from '@shared/utils' import type { Provider } from '@types' -import type { ImagePart, LanguageModel, ModelMessage, Provider as AiSdkProvider, TextPart } from 'ai' -import { stepCountIs, streamText } from 'ai' +import type { ImagePart, LanguageModel, ModelMessage, Provider as AiSdkProvider, TextPart, Tool } from 'ai' +import { jsonSchema, stepCountIs, streamText, tool } from 'ai' import { net } from 'electron' import type { Response } from 'express' @@ -190,6 +195,39 @@ IANA media type. 
} }

+/**
+ * Convert Anthropic tools format to AI SDK tools format
+ */
+function convertAnthropicToolsToAiSdk(tools: MessageCreateParams['tools']): Record<string, Tool> | undefined {
+  if (!tools || tools.length === 0) {
+    return undefined
+  }
+
+  const aiSdkTools: Record<string, Tool> = {}
+
+  for (const anthropicTool of tools) {
+    // Handle different tool types
+    if (anthropicTool.type === 'bash_20250124') {
+      // Skip Anthropic-specific built-in tools such as bash - they have no AI SDK equivalent
+      continue
+    }
+
+    // Regular tool (type === 'custom' or no type)
+    const toolDef = anthropicTool as AnthropicTool
+    const parameters = toolDef.input_schema as Parameters<typeof jsonSchema>[0]
+
+    aiSdkTools[toolDef.name] = tool({
+      description: toolDef.description || '',
+      inputSchema: jsonSchema(parameters),
+      execute: async (input: Record<string, unknown>) => {
+        return input
+      }
+    })
+  }
+
+  return Object.keys(aiSdkTools).length > 0 ? aiSdkTools : undefined
+}
+
 /**
  * Convert Anthropic MessageCreateParams to AI SDK message format
  */
@@ -271,6 +309,13 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage
       }
     }

+    if (toolResultParts.length > 0) {
+      messages.push({
+        role: 'tool',
+        content: [...toolResultParts]
+      })
+    }
+
     // Build the message based on role
     if (msg.role === 'user') {
       messages.push({
         role: 'user',
         content: [...textParts, ...imageParts]
       })
     } else {
-      // Assistant messages can only have text
-      if (textParts.length > 0) {
-        messages.push({
-          role: 'assistant',
-          content: [...reasoningParts, ...textParts, ...toolCallParts, ...toolResultParts]
-        })
-      }
+      // Assistant messages contain tool calls, not tool results
+      messages.push({
+        role: 'assistant',
+        content: [...reasoningParts, ...textParts, ...toolCallParts]
+      })
     }
   }
 }
@@ -315,10 +358,29 @@ export async function streamUnifiedMessages(config: UnifiedStreamConfig): Promis

   const coreMessages = convertAnthropicToAiMessages(params)

+  // Convert tools if present
+  const tools = convertAnthropicToolsToAiSdk(params.tools)
+
   logger.debug('Converted messages', {
     originalCount: params.messages.length,
     convertedCount: coreMessages.length,
-    hasSystem: !!params.system
+    hasSystem: !!params.system,
+    hasTools: !!tools,
+    toolCount: tools ? Object.keys(tools).length : 0,
+    toolNames: tools ? Object.keys(tools).slice(0, 10) : [],
+    paramsToolCount: params.tools?.length || 0
+  })
+
+  // Debug: Log message structure to understand tool_result handling
+  logger.silly('Message structure for debugging', {
+    messages: coreMessages.map((m) => ({
+      role: m.role,
+      contentTypes: Array.isArray(m.content)
+        ? m.content.map((c: { type: string }) => c.type)
+        : typeof m.content === 'string'
+          ? 
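/* plain string content */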
['string'] + : ['unknown'] + })) }) // Create the adapter @@ -340,6 +402,7 @@ export async function streamUnifiedMessages(config: UnifiedStreamConfig): Promis stopSequences: params.stop_sequences, stopWhen: stepCountIs(100), headers: defaultAppHeaders(), + tools, providerOptions: {} }) @@ -404,8 +467,9 @@ export async function generateUnifiedMessage( // Create language model (async - uses @cherrystudio/ai-core) const model = await createLanguageModel(provider, modelId) - // Convert messages + // Convert messages and tools const coreMessages = convertAnthropicToAiMessages(params) + const tools = convertAnthropicToolsToAiSdk(params.tools) // Create adapter to collect the response let finalResponse: ReturnType | null = null @@ -425,6 +489,7 @@ export async function generateUnifiedMessage( topP: params.top_p, stopSequences: params.stop_sequences, headers: defaultAppHeaders(), + tools, stopWhen: stepCountIs(100) }) diff --git a/src/main/services/agents/services/claudecode/transform.ts b/src/main/services/agents/services/claudecode/transform.ts index 00be683ba8..fa0c615648 100644 --- a/src/main/services/agents/services/claudecode/transform.ts +++ b/src/main/services/agents/services/claudecode/transform.ts @@ -193,6 +193,30 @@ function handleAssistantMessage( } break } + case 'thinking': + case 'redacted_thinking': { + const thinkingText = block.type === 'thinking' ? block.thinking : block.data + if (thinkingText) { + const id = generateMessageId() + chunks.push({ + type: 'reasoning-start', + id, + providerMetadata + }) + chunks.push({ + type: 'reasoning-delta', + id, + text: thinkingText, + providerMetadata + }) + chunks.push({ + type: 'reasoning-end', + id, + providerMetadata + }) + } + break + } case 'tool_use': handleAssistantToolUse(block as ToolUseContent, providerMetadata, state, chunks) break @@ -445,7 +469,11 @@ function handleStreamEvent( case 'content_block_stop': { const block = state.closeBlock(event.index) if (!block) { - logger.warn('Received content_block_stop for unknown index', { index: event.index }) + // Some providers (e.g., Gemini) send content via assistant message before stream events, + // so the block may not exist in state. This is expected behavior, not an error. + logger.debug('Received content_block_stop for unknown index (may be from non-streaming content)', { + index: event.index + }) break } From ccfb9423e0df019984259814ad509e23ed40d697 Mon Sep 17 00:00:00 2001 From: suyao Date: Thu, 27 Nov 2025 19:31:59 +0800 Subject: [PATCH 03/53] chore: format --- packages/shared/api/index.ts | 8 ++++++-- packages/shared/provider/config/helper.ts | 10 +++++----- packages/shared/provider/resolve.ts | 3 +-- 3 files changed, 12 insertions(+), 9 deletions(-) diff --git a/packages/shared/api/index.ts b/packages/shared/api/index.ts index 0cf652b427..5ee19611d8 100644 --- a/packages/shared/api/index.ts +++ b/packages/shared/api/index.ts @@ -53,12 +53,16 @@ export function formatAzureOpenAIApiHost(host: string): string { return formatApiHost(normalizedHost + '/openai', false) } -export function formatVertexApiHost(provider: MinimalProvider, project: string, location: string): string { +export function formatVertexApiHost( + provider: MinimalProvider, + project: string = 'test-project', + location: string = 'us-central1' +): string { const { apiHost } = provider const trimmedHost = withoutTrailingSlash(trim(apiHost)) if (!trimmedHost || trimmedHost.endsWith('aiplatform.googleapis.com')) { const host = - location == 'global' ? 
'https://aiplatform.googleapis.com' : `https://${location}-aiplatform.googleapis.com`
+      location === 'global' ? 'https://aiplatform.googleapis.com' : `https://${location}-aiplatform.googleapis.com`
     return `${formatApiHost(host)}/projects/${project}/locations/${location}`
   }
   return formatApiHost(trimmedHost)
diff --git a/packages/shared/provider/config/helper.ts b/packages/shared/provider/config/helper.ts
index 4e821a6c8f..95f53f885a 100644
--- a/packages/shared/provider/config/helper.ts
+++ b/packages/shared/provider/config/helper.ts
@@ -18,11 +18,11 @@ export const endpointIs =
  * @param provider the original provider object
  * @returns the resolved provider object
  */
-export function provider2Provider<
-  M extends MinimalModel,
-  R extends MinimalProvider,
-  P extends R = R
->(ruleSet: RuleSet, model: M, provider: P): P {
+export function provider2Provider<M extends MinimalModel, R extends MinimalProvider, P extends R = R>(
+  ruleSet: RuleSet,
+  model: M,
+  provider: P
+): P {
   for (const rule of ruleSet.rules) {
     if (rule.match(model)) {
       return rule.provider(provider) as P
diff --git a/packages/shared/provider/resolve.ts b/packages/shared/provider/resolve.ts
index 9055a36c6e..385da6a586 100644
--- a/packages/shared/provider/resolve.ts
+++ b/packages/shared/provider/resolve.ts
@@ -25,8 +25,7 @@ export function resolveActualProvider
Date: Thu, 27 Nov 2025 20:43:47 +0800
Subject: [PATCH 04/53] feat: Implement direct processing for Anthropic SDK and refactor message handling

---
 packages/shared/anthropic/index.ts            |  28 ++++-
 src/main/apiServer/routes/messages.ts         | 100 ++++++++++++++++--
 src/main/apiServer/services/messages.ts       |  24 ++++-
 .../apiServer/services/unified-messages.ts    |   5 +-
 4 files changed, 141 insertions(+), 16 deletions(-)

diff --git a/packages/shared/anthropic/index.ts b/packages/shared/anthropic/index.ts
index bff143d118..2444ad6113 100644
--- a/packages/shared/anthropic/index.ts
+++ b/packages/shared/anthropic/index.ts
@@ -16,6 +16,20 @@ import type { ModelMessage } from 'ai'

 const logger = loggerService.withContext('anthropic-sdk')

+/**
+ * Context for Anthropic SDK client creation.
+ * This allows the shared module to be used in different environments
+ * by providing environment-specific implementations.
+ */
+export interface AnthropicSdkContext {
+  /**
+   * Custom fetch function to use for HTTP requests.
+   * In the Electron main process, this should be `net.fetch`.
+   * In other environments, the default fetch or a custom implementation can be used.
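+   *
+   * @example
+   * // Minimal sketch, assuming an Electron main-process caller; the fetch
+   * // wrapper added to MessagesService below is preferred in practice.
+   * const client = getSdkClient(provider, null, undefined, { fetch: net.fetch })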
+ */ + fetch?: typeof globalThis.fetch +} + const defaultClaudeCodeSystemPrompt = `You are Claude Code, Anthropic's official CLI for Claude.` const defaultClaudeCodeSystem: Array = [ @@ -58,8 +72,11 @@ const defaultClaudeCodeSystem: Array = [ export function getSdkClient( provider: Provider, oauthToken?: string | null, - extraHeaders?: Record + extraHeaders?: Record, + context?: AnthropicSdkContext ): Anthropic { + const customFetch = context?.fetch + if (provider.authType === 'oauth') { if (!oauthToken) { throw new Error('OAuth token is not available') @@ -85,7 +102,8 @@ export function getSdkClient( 'x-stainless-runtime': 'node', 'x-stainless-runtime-version': 'v22.18.0', ...extraHeaders - } + }, + fetch: customFetch }) } let baseURL = @@ -110,7 +128,8 @@ export function getSdkClient( 'APP-Code': 'MLTG2087', ...provider.extra_headers, ...extraHeaders - } + }, + fetch: customFetch }) } @@ -122,7 +141,8 @@ export function getSdkClient( defaultHeaders: { 'anthropic-beta': 'output-128k-2025-02-19', ...provider.extra_headers - } + }, + fetch: customFetch }) } diff --git a/src/main/apiServer/routes/messages.ts b/src/main/apiServer/routes/messages.ts index 1ce42c46ea..f2590cf1d5 100644 --- a/src/main/apiServer/routes/messages.ts +++ b/src/main/apiServer/routes/messages.ts @@ -8,6 +8,17 @@ import { messagesService } from '../services/messages' import { generateUnifiedMessage, streamUnifiedMessages } from '../services/unified-messages' import { getProviderById, validateModelId } from '../utils' +/** + * Check if provider should use direct Anthropic SDK + * + * A provider is considered "Anthropic-compatible" if: + * 1. It's a native Anthropic provider (type === 'anthropic'), OR + * 2. It has anthropicApiHost configured (aggregated providers routing to Anthropic-compatible endpoints) + */ +function shouldUseDirectAnthropic(provider: Provider): boolean { + return provider.type === 'anthropic' || !!(provider.anthropicApiHost && provider.anthropicApiHost.trim()) +} + const logger = loggerService.withContext('ApiServerMessagesRoutes') const router = express.Router() @@ -41,12 +52,70 @@ interface HandleMessageProcessingOptions { } /** - * Handle message processing using unified AI SDK - * All providers (including Anthropic) are handled through AI SDK: - * - Anthropic providers use @ai-sdk/anthropic which outputs native Anthropic SSE - * - Other providers use their respective AI SDK adapters, with output converted to Anthropic SSE + * Handle message processing using direct Anthropic SDK + * Used for providers with anthropicApiHost or native Anthropic providers + * This bypasses AI SDK conversion and uses native Anthropic protocol */ -async function handleMessageProcessing({ +async function handleDirectAnthropicProcessing({ + res, + provider, + request, + modelId, + extraHeaders +}: HandleMessageProcessingOptions & { extraHeaders?: Record }): Promise { + const actualModelId = modelId || request.model + + logger.info('Processing message via direct Anthropic SDK', { + providerId: provider.id, + providerType: provider.type, + modelId: actualModelId, + stream: !!request.stream, + anthropicApiHost: provider.anthropicApiHost + }) + + try { + // Validate request + const validation = messagesService.validateRequest(request) + if (!validation.isValid) { + res.status(400).json({ + type: 'error', + error: { + type: 'invalid_request_error', + message: validation.errors.join('; ') + } + }) + return + } + + // Process message using messagesService (native Anthropic SDK) + const { client, anthropicRequest } = await 
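/* direct path: build the native Anthropic client and request, no AI SDK conversion */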
messagesService.processMessage({ + provider, + request, + extraHeaders, + modelId: actualModelId + }) + + if (request.stream) { + // Use native Anthropic streaming + await messagesService.handleStreaming(client, anthropicRequest, { response: res }, provider) + } else { + // Use native Anthropic non-streaming + const response = await client.messages.create(anthropicRequest) + res.json(response) + } + } catch (error: any) { + logger.error('Direct Anthropic processing error', { error }) + const { statusCode, errorResponse } = messagesService.transformError(error) + res.status(statusCode).json(errorResponse) + } +} + +/** + * Handle message processing using unified AI SDK + * Used for non-Anthropic providers that need format conversion + * - Uses AI SDK adapters with output converted to Anthropic SSE format + */ +async function handleUnifiedProcessing({ res, provider, request, @@ -93,12 +162,31 @@ async function handleMessageProcessing({ res.json(response) } } catch (error: any) { - logger.error('Message processing error', { error }) + logger.error('Unified processing error', { error }) const { statusCode, errorResponse } = messagesService.transformError(error) res.status(statusCode).json(errorResponse) } } +/** + * Handle message processing - routes to appropriate handler based on provider + * + * Routing logic: + * - Providers with anthropicApiHost OR type 'anthropic': Direct Anthropic SDK (no conversion) + * - Other providers: Unified AI SDK with Anthropic SSE conversion + */ +async function handleMessageProcessing({ + res, + provider, + request, + modelId +}: HandleMessageProcessingOptions): Promise { + if (shouldUseDirectAnthropic(provider)) { + return handleDirectAnthropicProcessing({ res, provider, request, modelId }) + } + return handleUnifiedProcessing({ res, provider, request, modelId }) +} + /** * @swagger * /v1/messages: diff --git a/src/main/apiServer/services/messages.ts b/src/main/apiServer/services/messages.ts index 8b46deaa8f..e3fbd069a7 100644 --- a/src/main/apiServer/services/messages.ts +++ b/src/main/apiServer/services/messages.ts @@ -4,6 +4,7 @@ import { loggerService } from '@logger' import anthropicService from '@main/services/AnthropicService' import { buildClaudeCodeSystemMessage, getSdkClient } from '@shared/anthropic' import type { Provider } from '@types' +import { net } from 'electron' import type { Response } from 'express' const logger = loggerService.withContext('MessagesService') @@ -98,11 +99,30 @@ export class MessagesService { async getClient(provider: Provider, extraHeaders?: Record): Promise { // Create Anthropic client for the provider + // Wrap net.fetch to handle compatibility issues: + // 1. net.fetch expects string URLs, not Request objects + // 2. net.fetch doesn't support 'agent' option from Node.js http module + const electronFetch: typeof globalThis.fetch = async (input: URL | RequestInfo, init?: RequestInit) => { + const url = typeof input === 'string' ? input : input instanceof URL ? 
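/* URL instance: serialize to string */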
input.toString() : input.url
+      // Remove unsupported options for Electron's net.fetch
+      if (init) {
+        const initWithAgent = init as RequestInit & { agent?: unknown }
+        delete initWithAgent.agent
+        const headers = new Headers(initWithAgent.headers)
+        if (headers.has('content-length')) {
+          headers.delete('content-length')
+        }
+        initWithAgent.headers = headers
+        return net.fetch(url, initWithAgent)
+      }
+      return net.fetch(url)
+    }
+    const context = { fetch: electronFetch }
     if (provider.authType === 'oauth') {
       const oauthToken = await anthropicService.getValidAccessToken()
-      return getSdkClient(provider, oauthToken, extraHeaders)
+      return getSdkClient(provider, oauthToken, extraHeaders, context)
     }
-    return getSdkClient(provider, null, extraHeaders)
+    return getSdkClient(provider, null, extraHeaders, context)
   }

   prepareHeaders(headers: Record<string, string>): Record<string, string> {
diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts
index 0f71cfcfae..5aadfbf534 100644
--- a/src/main/apiServer/services/unified-messages.ts
+++ b/src/main/apiServer/services/unified-messages.ts
@@ -42,10 +42,6 @@ export interface UnifiedStreamConfig {
   onComplete?: () => void
 }

-// ============================================================================
-// Provider Factory
-// ============================================================================
-
 /**
  * Main process format context for formatProviderApiHost
  * Unlike renderer, main process doesn't have direct access to store getters, so use reduxService cache
  */
@@ -338,6 +334,7 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage
 /**
  * Stream a message request using AI SDK and convert to Anthropic SSE format
  */
+// TODO: integrate middleware and transform streams here via the ai-core executor
 export async function streamUnifiedMessages(config: UnifiedStreamConfig): Promise<void> {
   const { response, provider, modelId, params, onError, onComplete } = config

From 36ed062b847279c2e2eda844e78b925e8250cdc2 Mon Sep 17 00:00:00 2001
From: suyao
Date: Thu, 27 Nov 2025 20:55:36 +0800
Subject: [PATCH 05/53] fix: test

---
 packages/shared/config/providers.ts           |  5 ---
 src/main/apiServer/routes/messages.ts         | 39 ++++++++++++++-----
 src/main/apiServer/utils/index.ts             | 29 ++++++++++++++
 .../provider/__tests__/providerConfig.test.ts | 30 ++++++++++++--
 src/renderer/src/utils/__tests__/api.test.ts  | 13 +------
 5 files changed, 86 insertions(+), 30 deletions(-)

diff --git a/packages/shared/config/providers.ts b/packages/shared/config/providers.ts
index f7744150e2..e03661bf0e 100644
--- a/packages/shared/config/providers.ts
+++ b/packages/shared/config/providers.ts
@@ -41,8 +41,3 @@ const SILICON_ANTHROPIC_COMPATIBLE_MODEL_SET = new Set(SILICON_ANTHROPIC_COMPATI
 export function isSiliconAnthropicCompatibleModel(modelId: string): boolean {
   return SILICON_ANTHROPIC_COMPATIBLE_MODEL_SET.has(modelId)
 }
-
-/**
- * Silicon provider's Anthropic API host URL. 
- */ -export const SILICON_ANTHROPIC_API_HOST = 'https://api.siliconflow.cn' diff --git a/src/main/apiServer/routes/messages.ts b/src/main/apiServer/routes/messages.ts index f2590cf1d5..f0eaac8e4e 100644 --- a/src/main/apiServer/routes/messages.ts +++ b/src/main/apiServer/routes/messages.ts @@ -6,17 +6,34 @@ import express from 'express' import { messagesService } from '../services/messages' import { generateUnifiedMessage, streamUnifiedMessages } from '../services/unified-messages' -import { getProviderById, validateModelId } from '../utils' +import { getProviderById, isModelAnthropicCompatible, validateModelId } from '../utils' /** - * Check if provider should use direct Anthropic SDK + * Check if a specific model on a provider should use direct Anthropic SDK * - * A provider is considered "Anthropic-compatible" if: + * A provider+model combination is considered "Anthropic-compatible" if: * 1. It's a native Anthropic provider (type === 'anthropic'), OR - * 2. It has anthropicApiHost configured (aggregated providers routing to Anthropic-compatible endpoints) + * 2. It has anthropicApiHost configured AND the specific model supports Anthropic API + * (for aggregated providers like Silicon, only certain models support Anthropic endpoint) + * + * @param provider - The provider to check + * @param modelId - The model ID to check (without provider prefix) + * @returns true if should use direct Anthropic SDK, false for unified SDK */ -function shouldUseDirectAnthropic(provider: Provider): boolean { - return provider.type === 'anthropic' || !!(provider.anthropicApiHost && provider.anthropicApiHost.trim()) +function shouldUseDirectAnthropic(provider: Provider, modelId: string): boolean { + // Native Anthropic provider - always use direct SDK + if (provider.type === 'anthropic') { + return true + } + + // No anthropicApiHost configured - use unified SDK + if (!provider.anthropicApiHost?.trim()) { + return false + } + + // Has anthropicApiHost - check model-level compatibility + // For aggregated providers, only specific models support Anthropic API + return isModelAnthropicCompatible(provider, modelId) } const logger = loggerService.withContext('ApiServerMessagesRoutes') @@ -169,11 +186,12 @@ async function handleUnifiedProcessing({ } /** - * Handle message processing - routes to appropriate handler based on provider + * Handle message processing - routes to appropriate handler based on provider and model * * Routing logic: - * - Providers with anthropicApiHost OR type 'anthropic': Direct Anthropic SDK (no conversion) - * - Other providers: Unified AI SDK with Anthropic SSE conversion + * - Native Anthropic providers (type === 'anthropic'): Direct Anthropic SDK + * - Providers with anthropicApiHost AND model supports Anthropic API: Direct Anthropic SDK + * - Other providers/models: Unified AI SDK with Anthropic SSE conversion */ async function handleMessageProcessing({ res, @@ -181,7 +199,8 @@ async function handleMessageProcessing({ request, modelId }: HandleMessageProcessingOptions): Promise { - if (shouldUseDirectAnthropic(provider)) { + const actualModelId = modelId || request.model + if (shouldUseDirectAnthropic(provider, actualModelId)) { return handleDirectAnthropicProcessing({ res, provider, request, modelId }) } return handleUnifiedProcessing({ res, provider, request, modelId }) diff --git a/src/main/apiServer/utils/index.ts b/src/main/apiServer/utils/index.ts index e25b49e750..471e734c18 100644 --- a/src/main/apiServer/utils/index.ts +++ b/src/main/apiServer/utils/index.ts @@ -295,3 
+295,32 @@ export const getProviderAnthropicModelChecker = (providerId: string): ((m: Model return () => true } } + +/** + * Check if a specific model is compatible with Anthropic API for a given provider. + * + * This is used for fine-grained routing decisions at the model level. + * For aggregated providers (like Silicon), only certain models support the Anthropic API endpoint. + * + * @param provider - The provider to check + * @param modelId - The model ID to check (without provider prefix) + * @returns true if the model supports Anthropic API endpoint + */ +export function isModelAnthropicCompatible(provider: Provider, modelId: string): boolean { + const checker = getProviderAnthropicModelChecker(provider.id) + + const model = provider.models?.find((m) => m.id === modelId) + + if (model) { + return checker(model) + } + + const minimalModel: Model = { + id: modelId, + name: modelId, + provider: provider.id, + group: '' + } + + return checker(minimalModel) +} diff --git a/src/renderer/src/aiCore/provider/__tests__/providerConfig.test.ts b/src/renderer/src/aiCore/provider/__tests__/providerConfig.test.ts index 430ff52869..22ef654da8 100644 --- a/src/renderer/src/aiCore/provider/__tests__/providerConfig.test.ts +++ b/src/renderer/src/aiCore/provider/__tests__/providerConfig.test.ts @@ -24,7 +24,17 @@ vi.mock('@renderer/services/AssistantService', () => ({ vi.mock('@renderer/store', () => ({ default: { - getState: () => ({ copilot: { defaultHeaders: {} } }) + getState: () => ({ + copilot: { defaultHeaders: {} }, + llm: { + settings: { + vertexai: { + projectId: 'test-project', + location: 'us-central1' + } + } + } + }) } })) @@ -33,7 +43,7 @@ vi.mock('@renderer/utils/api', () => ({ if (isSupportedAPIVersion === false) { return host // Return host as-is when isSupportedAPIVersion is false } - return `${host}/v1` // Default behavior when isSupportedAPIVersion is true + return host ? `${host}/v1` : '' // Default behavior when isSupportedAPIVersion is true }), routeToEndpoint: vi.fn((host) => ({ baseURL: host, @@ -41,6 +51,20 @@ vi.mock('@renderer/utils/api', () => ({ })) })) +// Also mock @shared/api since formatProviderApiHost uses it directly +vi.mock('@shared/api', async (importOriginal) => { + const actual = (await importOriginal()) as any + return { + ...actual, + formatApiHost: vi.fn((host, isSupportedAPIVersion = true) => { + if (isSupportedAPIVersion === false) { + return host || '' // Return host as-is when isSupportedAPIVersion is false + } + return host ? 
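/* mirror the real formatApiHost: append v1 only for non-empty hosts */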
`${host}/v1` : '' // Default behavior when isSupportedAPIVersion is true + }) + } +}) + vi.mock('@renderer/utils/provider', async (importOriginal) => { const actual = (await importOriginal()) as any return { @@ -73,8 +97,8 @@ vi.mock('@renderer/services/AssistantService', () => ({ import { getProviderByModel } from '@renderer/services/AssistantService' import type { Model, Provider } from '@renderer/types' -import { formatApiHost } from '@renderer/utils/api' import { isCherryAIProvider, isPerplexityProvider } from '@renderer/utils/provider' +import { formatApiHost } from '@shared/api' import { COPILOT_DEFAULT_HEADERS, COPILOT_EDITOR_VERSION, isCopilotResponsesModel } from '../constants' import { getActualProvider, providerToAiSdkConfig } from '../providerConfig' diff --git a/src/renderer/src/utils/__tests__/api.test.ts b/src/renderer/src/utils/__tests__/api.test.ts index e854445fc5..f56fb53d00 100644 --- a/src/renderer/src/utils/__tests__/api.test.ts +++ b/src/renderer/src/utils/__tests__/api.test.ts @@ -300,18 +300,7 @@ describe('api', () => { }) it('uses global endpoint when location equals global', () => { - getStateMock.mockReturnValueOnce({ - llm: { - settings: { - vertexai: { - projectId: 'global-project', - location: 'global' - } - } - } - }) - - expect(formatVertexApiHost(createVertexProvider(''))).toBe( + expect(formatVertexApiHost(createVertexProvider(''), 'global-project', 'global')).toBe( 'https://aiplatform.googleapis.com/v1/projects/global-project/locations/global' ) }) From 2a1adfe3224d23874fbd6875c9d998cae54a6bd3 Mon Sep 17 00:00:00 2001 From: suyao Date: Thu, 27 Nov 2025 21:00:52 +0800 Subject: [PATCH 06/53] feat: add ppio --- packages/shared/config/providers.ts | 34 +++++++++++++++++++ src/main/apiServer/utils/index.ts | 4 ++- src/renderer/src/pages/code/CodeToolsPage.tsx | 6 ++-- .../ProviderSettings/ProviderSetting.tsx | 3 +- src/renderer/src/store/index.ts | 2 +- src/renderer/src/store/migrate.ts | 14 ++++++++ 6 files changed, 58 insertions(+), 5 deletions(-) diff --git a/packages/shared/config/providers.ts b/packages/shared/config/providers.ts index e03661bf0e..6490c61cc8 100644 --- a/packages/shared/config/providers.ts +++ b/packages/shared/config/providers.ts @@ -41,3 +41,37 @@ const SILICON_ANTHROPIC_COMPATIBLE_MODEL_SET = new Set(SILICON_ANTHROPIC_COMPATI export function isSiliconAnthropicCompatibleModel(modelId: string): boolean { return SILICON_ANTHROPIC_COMPATIBLE_MODEL_SET.has(modelId) } + +/** + * PPIO provider models that support Anthropic API endpoint. + * These models can be used with Claude Code via the Anthropic-compatible API. + * + * @see https://ppio.com/docs/model/llm-anthropic-compatibility + */ +export const PPIO_ANTHROPIC_COMPATIBLE_MODELS: readonly string[] = [ + 'moonshotai/kimi-k2-thinking', + 'minimax/minimax-m2', + 'deepseek/deepseek-v3.2-exp', + 'deepseek/deepseek-v3.1-terminus', + 'zai-org/glm-4.6', + 'moonshotai/kimi-k2-0905', + 'deepseek/deepseek-v3.1', + 'moonshotai/kimi-k2-instruct', + 'qwen/qwen3-next-80b-a3b-instruct', + 'qwen/qwen3-next-80b-a3b-thinking' +] + +/** + * Creates a Set for efficient lookup of PPIO Anthropic-compatible model IDs. + */ +const PPIO_ANTHROPIC_COMPATIBLE_MODEL_SET = new Set(PPIO_ANTHROPIC_COMPATIBLE_MODELS) + +/** + * Checks if a model ID is compatible with Anthropic API on PPIO provider. 
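+ *
+ * @example
+ * isPpioAnthropicCompatibleModel('zai-org/glm-4.6') // true, listed above
+ * isPpioAnthropicCompatibleModel('unlisted/model') // false (illustrative ID)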
+ * + * @param modelId - The model ID to check + * @returns true if the model supports Anthropic API endpoint + */ +export function isPpioAnthropicCompatibleModel(modelId: string): boolean { + return PPIO_ANTHROPIC_COMPATIBLE_MODEL_SET.has(modelId) +} diff --git a/src/main/apiServer/utils/index.ts b/src/main/apiServer/utils/index.ts index 471e734c18..fde1ff3475 100644 --- a/src/main/apiServer/utils/index.ts +++ b/src/main/apiServer/utils/index.ts @@ -1,7 +1,7 @@ import { CacheService } from '@main/services/CacheService' import { loggerService } from '@main/services/LoggerService' import { reduxService } from '@main/services/ReduxService' -import { isSiliconAnthropicCompatibleModel } from '@shared/config/providers' +import { isPpioAnthropicCompatibleModel, isSiliconAnthropicCompatibleModel } from '@shared/config/providers' import type { ApiModel, Model, Provider } from '@types' const logger = loggerService.withContext('ApiServerUtils') @@ -290,6 +290,8 @@ export const getProviderAnthropicModelChecker = (providerId: string): ((m: Model return (m: Model) => m.id.includes('claude') case 'silicon': return (m: Model) => isSiliconAnthropicCompatibleModel(m.id) + case 'ppio': + return (m: Model) => isPpioAnthropicCompatibleModel(m.id) default: // allow all models when checker not configured return () => true diff --git a/src/renderer/src/pages/code/CodeToolsPage.tsx b/src/renderer/src/pages/code/CodeToolsPage.tsx index fcb2dbf482..a4314dfef9 100644 --- a/src/renderer/src/pages/code/CodeToolsPage.tsx +++ b/src/renderer/src/pages/code/CodeToolsPage.tsx @@ -17,7 +17,7 @@ import type { EndpointType, Model } from '@renderer/types' import { getClaudeSupportedProviders } from '@renderer/utils/provider' import type { TerminalConfig } from '@shared/config/constant' import { codeTools, terminalApps } from '@shared/config/constant' -import { isSiliconAnthropicCompatibleModel } from '@shared/config/providers' +import { isPpioAnthropicCompatibleModel, isSiliconAnthropicCompatibleModel } from '@shared/config/providers' import { Alert, Avatar, Button, Checkbox, Input, Popover, Select, Space, Tooltip } from 'antd' import { ArrowUpRight, Download, FolderOpen, HelpCircle, Terminal, X } from 'lucide-react' import type { FC } from 'react' @@ -82,10 +82,12 @@ const CodeToolsPage: FC = () => { if (m.supported_endpoint_types) { return m.supported_endpoint_types.includes('anthropic') } - // Special handling for silicon provider: only specific models support Anthropic API if (m.provider === 'silicon') { return isSiliconAnthropicCompatibleModel(m.id) } + if (m.provider === 'ppio') { + return isPpioAnthropicCompatibleModel(m.id) + } return m.id.includes('claude') || CLAUDE_OFFICIAL_SUPPORTED_PROVIDERS.includes(m.provider) } diff --git a/src/renderer/src/pages/settings/ProviderSettings/ProviderSetting.tsx b/src/renderer/src/pages/settings/ProviderSettings/ProviderSetting.tsx index f341ac9229..b85690c3fb 100644 --- a/src/renderer/src/pages/settings/ProviderSettings/ProviderSetting.tsx +++ b/src/renderer/src/pages/settings/ProviderSettings/ProviderSetting.tsx @@ -85,7 +85,8 @@ const ANTHROPIC_COMPATIBLE_PROVIDER_IDS = [ SystemProviderIds.minimax, SystemProviderIds.silicon, SystemProviderIds.qiniu, - SystemProviderIds.dmxapi + SystemProviderIds.dmxapi, + SystemProviderIds.ppio ] as const type AnthropicCompatibleProviderId = (typeof ANTHROPIC_COMPATIBLE_PROVIDER_IDS)[number] diff --git a/src/renderer/src/store/index.ts b/src/renderer/src/store/index.ts index 5c562885bb..94b51474b9 100644 --- a/src/renderer/src/store/index.ts +++ 
b/src/renderer/src/store/index.ts @@ -67,7 +67,7 @@ const persistedReducer = persistReducer( { key: 'cherry-studio', storage, - version: 179, + version: 180, blacklist: ['runtime', 'messages', 'messageBlocks', 'tabs', 'toolPermissions'], migrate }, diff --git a/src/renderer/src/store/migrate.ts b/src/renderer/src/store/migrate.ts index 4b2e4cef89..1049da5964 100644 --- a/src/renderer/src/store/migrate.ts +++ b/src/renderer/src/store/migrate.ts @@ -2906,6 +2906,20 @@ const migrateConfig = { logger.error('migrate 179 error', error as Error) return state } + }, + '180': (state: RootState) => { + try { + state.llm.providers.forEach((provider) => { + if (provider.id === SystemProviderIds.ppio) { + provider.anthropicApiHost = 'https://api.ppinfra.com/anthropic' + } + }) + logger.info('migrate 180 success') + return state + } catch (error) { + logger.error('migrate 180 error', error as Error) + return state + } } } From 4c4102da20b14bd75615f75bcd8690ee66b1a580 Mon Sep 17 00:00:00 2001 From: suyao Date: Thu, 27 Nov 2025 21:10:26 +0800 Subject: [PATCH 07/53] feat: update agentModelFilter to exclude generate image models --- src/renderer/src/config/models/utils.ts | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/renderer/src/config/models/utils.ts b/src/renderer/src/config/models/utils.ts index 1d5c9a6443..8a52d6e4ff 100644 --- a/src/renderer/src/config/models/utils.ts +++ b/src/renderer/src/config/models/utils.ts @@ -150,7 +150,7 @@ export const isGeminiModel = (model: Model) => { export const ZHIPU_RESULT_TOKENS = ['<|begin_of_box|>', '<|end_of_box|>'] as const export const agentModelFilter = (model: Model): boolean => { - return !isEmbeddingModel(model) && !isRerankModel(model) && !isTextToImageModel(model) + return !isEmbeddingModel(model) && !isRerankModel(model) && !isTextToImageModel(model) && !isGenerateImageModel(model) } export const isMaxTemperatureOneModel = (model: Model): boolean => { From f02c0fe9629b5a3b623e50ff26214405f68696aa Mon Sep 17 00:00:00 2001 From: suyao Date: Thu, 27 Nov 2025 21:19:01 +0800 Subject: [PATCH 08/53] fix: typecheck --- tsconfig.node.json | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/tsconfig.node.json b/tsconfig.node.json index 83c3f2b461..4e60782e11 100644 --- a/tsconfig.node.json +++ b/tsconfig.node.json @@ -26,7 +26,11 @@ "@types": ["./src/renderer/src/types/index.ts"], "@shared/*": ["./packages/shared/*"], "@mcp-trace/*": ["./packages/mcp-trace/*"], - "@modelcontextprotocol/sdk/*": ["./node_modules/@modelcontextprotocol/sdk/dist/esm/*"] + "@modelcontextprotocol/sdk/*": ["./node_modules/@modelcontextprotocol/sdk/dist/esm/*"], + "@cherrystudio/ai-core/provider": ["./packages/aiCore/src/core/providers/index.ts"], + "@cherrystudio/ai-core/built-in/plugins": ["./packages/aiCore/src/core/plugins/built-in/index.ts"], + "@cherrystudio/ai-core/*": ["./packages/aiCore/src/*"], + "@cherrystudio/ai-core": ["./packages/aiCore/src/index.ts"] }, "experimentalDecorators": true, "emitDecoratorMetadata": true, From dad9cc95ad038d518b520705035cd9336cd715d7 Mon Sep 17 00:00:00 2001 From: suyao Date: Thu, 27 Nov 2025 21:23:28 +0800 Subject: [PATCH 09/53] fix: typecheck --- tsconfig.node.json | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/tsconfig.node.json b/tsconfig.node.json index 4e60782e11..9871e604f2 100644 --- a/tsconfig.node.json +++ b/tsconfig.node.json @@ -30,7 +30,8 @@ "@cherrystudio/ai-core/provider": ["./packages/aiCore/src/core/providers/index.ts"], "@cherrystudio/ai-core/built-in/plugins": 
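/* source-level alias so main-process typechecking resolves the package subpath */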
["./packages/aiCore/src/core/plugins/built-in/index.ts"], "@cherrystudio/ai-core/*": ["./packages/aiCore/src/*"], - "@cherrystudio/ai-core": ["./packages/aiCore/src/index.ts"] + "@cherrystudio/ai-core": ["./packages/aiCore/src/index.ts"], + "@cherrystudio/ai-sdk-provider": ["./packages/ai-sdk-provider/src/index.ts"] }, "experimentalDecorators": true, "emitDecoratorMetadata": true, From 15c0a3881c4896acee0a672284acbf5593c5aba0 Mon Sep 17 00:00:00 2001 From: suyao Date: Thu, 27 Nov 2025 21:28:24 +0800 Subject: [PATCH 10/53] fix: test --- src/renderer/src/config/models/__tests__/utils.test.ts | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/src/renderer/src/config/models/__tests__/utils.test.ts b/src/renderer/src/config/models/__tests__/utils.test.ts index f3f4d402af..97dbf755d1 100644 --- a/src/renderer/src/config/models/__tests__/utils.test.ts +++ b/src/renderer/src/config/models/__tests__/utils.test.ts @@ -120,7 +120,7 @@ describe('model utils', () => { rerankMock.mockReturnValue(false) visionMock.mockReturnValue(true) textToImageMock.mockReturnValue(false) - generateImageMock.mockReturnValue(true) + generateImageMock.mockReturnValue(false) reasoningMock.mockReturnValue(false) openAIWebSearchOnlyMock.mockReturnValue(false) }) @@ -274,6 +274,7 @@ describe('model utils', () => { visionMock.mockReturnValueOnce(true).mockReturnValueOnce(false) expect(isVisionModels(models)).toBe(false) + generateImageMock.mockReturnValue(true) expect(isGenerateImageModels(models)).toBe(true) generateImageMock.mockReturnValueOnce(true).mockReturnValueOnce(false) expect(isGenerateImageModels(models)).toBe(false) @@ -292,6 +293,10 @@ describe('model utils', () => { rerankMock.mockReturnValue(false) textToImageMock.mockReturnValueOnce(true) expect(agentModelFilter(createModel({ id: 'gpt-image-1' }))).toBe(false) + + textToImageMock.mockReturnValue(false) + generateImageMock.mockReturnValueOnce(true) + expect(agentModelFilter(createModel({ id: 'dall-e-3' }))).toBe(false) }) it('identifies models with maximum temperature of 1.0', () => { From 0f6ec3e0614c59e3d411463c637e8ea92b312de0 Mon Sep 17 00:00:00 2001 From: suyao Date: Thu, 27 Nov 2025 22:02:50 +0800 Subject: [PATCH 11/53] feat: add new aliases for ai-core provider and core --- electron.vite.config.ts | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/electron.vite.config.ts b/electron.vite.config.ts index 172d48ca9a..761ecfbf15 100644 --- a/electron.vite.config.ts +++ b/electron.vite.config.ts @@ -25,7 +25,9 @@ export default defineConfig({ '@shared': resolve('packages/shared'), '@logger': resolve('src/main/services/LoggerService'), '@mcp-trace/trace-core': resolve('packages/mcp-trace/trace-core'), - '@mcp-trace/trace-node': resolve('packages/mcp-trace/trace-node') + '@mcp-trace/trace-node': resolve('packages/mcp-trace/trace-node'), + '@cherrystudio/ai-core/provider': resolve('packages/aiCore/src/core/providers'), + '@cherrystudio/ai-core': resolve('packages/aiCore/src') } }, build: { From f163c4d3ee6b336e30b1516511cdc745c44fec05 Mon Sep 17 00:00:00 2001 From: suyao Date: Thu, 27 Nov 2025 22:28:44 +0800 Subject: [PATCH 12/53] fix: resolve PR review issues for Proxy API Server MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - Fix tool result content bug: return `values` array instead of empty array - Fix empty message bug: skip pushing user/assistant messages when content is empty - Expand provider support: remove type restrictions to support all AI SDK providers - Add missing 
alias for @cherrystudio/ai-sdk-provider in main process config 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude --- electron.vite.config.ts | 3 ++- .../apiServer/services/unified-messages.ts | 25 ++++++++++++------- src/main/apiServer/utils/index.ts | 19 +++++--------- 3 files changed, 24 insertions(+), 23 deletions(-) diff --git a/electron.vite.config.ts b/electron.vite.config.ts index 761ecfbf15..da471c9fc9 100644 --- a/electron.vite.config.ts +++ b/electron.vite.config.ts @@ -27,7 +27,8 @@ export default defineConfig({ '@mcp-trace/trace-core': resolve('packages/mcp-trace/trace-core'), '@mcp-trace/trace-node': resolve('packages/mcp-trace/trace-node'), '@cherrystudio/ai-core/provider': resolve('packages/aiCore/src/core/providers'), - '@cherrystudio/ai-core': resolve('packages/aiCore/src') + '@cherrystudio/ai-core': resolve('packages/aiCore/src'), + '@cherrystudio/ai-sdk-provider': resolve('packages/ai-sdk-provider/src') } }, build: { diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts index 5aadfbf534..ddb6d59b37 100644 --- a/src/main/apiServer/services/unified-messages.ts +++ b/src/main/apiServer/services/unified-messages.ts @@ -186,7 +186,7 @@ IANA media type. } return { type: 'content', - value: [] + value: values } } } @@ -313,17 +313,24 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage } // Build the message based on role + // Only push user/assistant message if there's actual content (avoid empty messages) if (msg.role === 'user') { - messages.push({ - role: 'user', - content: [...textParts, ...imageParts] - }) + const userContent = [...textParts, ...imageParts] + if (userContent.length > 0) { + messages.push({ + role: 'user', + content: userContent + }) + } } else { // Assistant messages contain tool calls, not tool results - messages.push({ - role: 'assistant', - content: [...reasoningParts, ...textParts, ...toolCallParts] - }) + const assistantContent = [...reasoningParts, ...textParts, ...toolCallParts] + if (assistantContent.length > 0) { + messages.push({ + role: 'assistant', + content: assistantContent + }) + } } } } diff --git a/src/main/apiServer/utils/index.ts b/src/main/apiServer/utils/index.ts index fde1ff3475..17d3f9f088 100644 --- a/src/main/apiServer/utils/index.ts +++ b/src/main/apiServer/utils/index.ts @@ -28,10 +28,9 @@ export async function getAvailableProviders(): Promise { return [] } - // Support OpenAI and Anthropic type providers for API server - const supportedProviders = providers.filter( - (p: Provider) => p.enabled && (p.type === 'openai' || p.type === 'anthropic') - ) + // Support all provider types that AI SDK can handle + // The unified-messages service uses AI SDK which supports many providers + const supportedProviders = providers.filter((p: Provider) => p.enabled) // Cache the filtered results CacheService.set(PROVIDERS_CACHE_KEY, supportedProviders, PROVIDERS_CACHE_TTL) @@ -160,7 +159,7 @@ export async function validateModelId(model: string): Promise<{ valid: false, error: { type: 'provider_not_found', - message: `Provider '${providerId}' not found, not enabled, or not supported. 
Only OpenAI providers are currently supported.`, + message: `Provider '${providerId}' not found or not enabled.`, code: 'provider_not_found' } } @@ -262,14 +261,8 @@ export function validateProvider(provider: Provider): boolean { return false } - // Support OpenAI and Anthropic type providers - if (provider.type !== 'openai' && provider.type !== 'anthropic') { - logger.debug('Provider type not supported', { - providerId: provider.id, - providerType: provider.type - }) - return false - } + // AI SDK supports many provider types, no longer need to filter by type + // The unified-messages service handles all supported types return true } catch (error: any) { From 77c1b77113f4280454fd22869bd98f6516864f30 Mon Sep 17 00:00:00 2001 From: suyao Date: Thu, 27 Nov 2025 22:41:18 +0800 Subject: [PATCH 13/53] refactor: extract shared token counting logic in messages routes MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Extract duplicated token estimation code from both count_tokens endpoints into a shared `estimateTokenCount` function to improve maintainability. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude --- src/main/apiServer/routes/messages.ts | 111 +++++++++++--------------- 1 file changed, 47 insertions(+), 64 deletions(-) diff --git a/src/main/apiServer/routes/messages.ts b/src/main/apiServer/routes/messages.ts index f0eaac8e4e..907b498273 100644 --- a/src/main/apiServer/routes/messages.ts +++ b/src/main/apiServer/routes/messages.ts @@ -41,6 +41,51 @@ const logger = loggerService.withContext('ApiServerMessagesRoutes') const router = express.Router() const providerRouter = express.Router({ mergeParams: true }) +/** + * Estimate token count from messages + * Simple approximation: ~4 characters per token for English text + */ +interface CountTokensInput { + messages: Array<{ role: string; content: string | Array<{ type: string; text?: string }> }> + system?: string | Array<{ type: string; text?: string }> +} + +function estimateTokenCount(input: CountTokensInput): number { + const { messages, system } = input + let totalChars = 0 + + // Count system message tokens + if (system) { + if (typeof system === 'string') { + totalChars += system.length + } else if (Array.isArray(system)) { + for (const block of system) { + if (block.type === 'text' && block.text) { + totalChars += block.text.length + } + } + } + } + + // Count message tokens + for (const msg of messages) { + if (typeof msg.content === 'string') { + totalChars += msg.content.length + } else if (Array.isArray(msg.content)) { + for (const block of msg.content) { + if (block.type === 'text' && block.text) { + totalChars += block.text.length + } + } + } + // Add overhead for role + totalChars += 10 + } + + // Estimate tokens (~4 chars per token, with some overhead) + return Math.ceil(totalChars / 4) + messages.length * 3 +} + // Helper function for basic request validation async function validateRequestBody(req: Request): Promise<{ valid: boolean; error?: any }> { const request: MessageCreateParams = req.body @@ -589,45 +634,11 @@ router.post('/count_tokens', async (req: Request, res: Response) => { }) } - // Simple token estimation based on character count - // This is a rough approximation: ~4 characters per token for English text - let totalChars = 0 - - // Count system message tokens - if (system) { - if (typeof system === 'string') { - totalChars += system.length - } else if (Array.isArray(system)) { - for (const block of system) { - if (block.type === 
'text' && block.text) { - totalChars += block.text.length - } - } - } - } - - // Count message tokens - for (const msg of messages) { - if (typeof msg.content === 'string') { - totalChars += msg.content.length - } else if (Array.isArray(msg.content)) { - for (const block of msg.content) { - if (block.type === 'text' && block.text) { - totalChars += block.text.length - } - } - } - // Add overhead for role - totalChars += 10 - } - - // Estimate tokens (~4 chars per token, with some overhead) - const estimatedTokens = Math.ceil(totalChars / 4) + messages.length * 3 + const estimatedTokens = estimateTokenCount({ messages, system }) logger.debug('Token count estimated', { model, messageCount: messages.length, - totalChars, estimatedTokens }) @@ -663,35 +674,7 @@ providerRouter.post('/count_tokens', async (req: Request, res: Response) => { }) } - // Simple token estimation - let totalChars = 0 - - if (system) { - if (typeof system === 'string') { - totalChars += system.length - } else if (Array.isArray(system)) { - for (const block of system) { - if (block.type === 'text' && block.text) { - totalChars += block.text.length - } - } - } - } - - for (const msg of messages) { - if (typeof msg.content === 'string') { - totalChars += msg.content.length - } else if (Array.isArray(msg.content)) { - for (const block of msg.content) { - if (block.type === 'text' && block.text) { - totalChars += block.text.length - } - } - } - totalChars += 10 - } - - const estimatedTokens = Math.ceil(totalChars / 4) + messages.length * 3 + const estimatedTokens = estimateTokenCount({ messages, system }) logger.debug('Token count estimated (provider route)', { providerId: req.params.provider, From ce2500159041bc31ac9dee8e5d27faf4a80d578e Mon Sep 17 00:00:00 2001 From: suyao Date: Fri, 28 Nov 2025 01:27:20 +0800 Subject: [PATCH 14/53] feat: add shared AI SDK middlewares and refactor middleware handling --- packages/shared/middleware/index.ts | 15 + packages/shared/middleware/middlewares.ts | 205 ++++++++ .../apiServer/services/unified-messages.ts | 461 +++++++----------- .../middleware/AiSdkMiddlewareBuilder.ts | 3 +- .../openrouterReasoningMiddleware.ts | 50 -- .../skipGeminiThoughtSignatureMiddleware.ts | 36 -- tsconfig.node.json | 4 +- 7 files changed, 401 insertions(+), 373 deletions(-) create mode 100644 packages/shared/middleware/index.ts create mode 100644 packages/shared/middleware/middlewares.ts delete mode 100644 src/renderer/src/aiCore/middleware/openrouterReasoningMiddleware.ts delete mode 100644 src/renderer/src/aiCore/middleware/skipGeminiThoughtSignatureMiddleware.ts diff --git a/packages/shared/middleware/index.ts b/packages/shared/middleware/index.ts new file mode 100644 index 0000000000..a4db5ad2dd --- /dev/null +++ b/packages/shared/middleware/index.ts @@ -0,0 +1,15 @@ +/** + * Shared AI SDK Middlewares + * + * Environment-agnostic middlewares that can be used in both + * renderer process and main process (API server). 
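+ *
+ * Minimal usage sketch (mirrors the example in middlewares.ts; only part of
+ * the option set is shown):
+ *
+ * ```typescript
+ * import { buildSharedMiddlewares } from '@shared/middleware'
+ *
+ * const middlewares = buildSharedMiddlewares({
+ *   enableReasoning: true,
+ *   modelId: 'gemini-2.5-pro'
+ * })
+ * ```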
+ */ + +export { + buildSharedMiddlewares, + getReasoningTagName, + isGemini3ModelId, + openrouterReasoningMiddleware, + type SharedMiddlewareConfig, + skipGeminiThoughtSignatureMiddleware +} from './middlewares' diff --git a/packages/shared/middleware/middlewares.ts b/packages/shared/middleware/middlewares.ts new file mode 100644 index 0000000000..d9725101c2 --- /dev/null +++ b/packages/shared/middleware/middlewares.ts @@ -0,0 +1,205 @@ +/** + * Shared AI SDK Middlewares + * + * These middlewares are environment-agnostic and can be used in both + * renderer process and main process (API server). + */ +import type { LanguageModelV2Middleware, LanguageModelV2StreamPart } from '@ai-sdk/provider' +import { extractReasoningMiddleware } from 'ai' + +/** + * Configuration for building shared middlewares + */ +export interface SharedMiddlewareConfig { + /** + * Whether to enable reasoning extraction + */ + enableReasoning?: boolean + + /** + * Tag name for reasoning extraction + * Defaults based on model ID + */ + reasoningTagName?: string + + /** + * Model ID - used to determine default reasoning tag and model detection + */ + modelId?: string + + /** + * Provider ID (Cherry Studio provider ID) + * Used for provider-specific middlewares like OpenRouter + */ + providerId?: string + + /** + * AI SDK Provider ID + * Used for Gemini thought signature middleware + * e.g., 'google', 'google-vertex' + */ + aiSdkProviderId?: string +} + +/** + * Check if model ID represents a Gemini 3 (2.5) model + * that requires thought signature handling + * + * @param modelId - The model ID string (not Model object) + */ +export function isGemini3ModelId(modelId?: string): boolean { + if (!modelId) return false + const lowerModelId = modelId.toLowerCase() + return lowerModelId.includes('gemini-2.5') || lowerModelId.includes('gemini-exp') || lowerModelId.includes('gemini-3') +} + +/** + * Get the default reasoning tag name based on model ID + * + * Different models use different tags for reasoning content: + * - Most models: 'think' + * - GPT-OSS models: 'reasoning' + * - Gemini models: 'thought' + * - Seed models: 'seed:think' + */ +export function getReasoningTagName(modelId?: string): string { + if (!modelId) return 'think' + const lowerModelId = modelId.toLowerCase() + if (lowerModelId.includes('gpt-oss')) return 'reasoning' + if (lowerModelId.includes('gemini')) return 'thought' + if (lowerModelId.includes('seed-oss-36b')) return 'seed:think' + return 'think' +} + +/** + * Skip Gemini Thought Signature Middleware + * + * Due to the complexity of multi-model client requests (which can switch + * to other models mid-process), this middleware skips all Gemini 3 + * thinking signatures validation. 
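+ *
+ * Rough sketch of the effect on a single prompt part (values are illustrative,
+ * assuming aiSdkId is 'google'):
+ *
+ * ```typescript
+ * // before: part.providerOptions.google.thoughtSignature === '<provider signature>'
+ * // after:  part.providerOptions.google.thoughtSignature === 'skip_thought_signature_validator'
+ * ```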
+ * + * @param aiSdkId - AI SDK Provider ID (e.g., 'google', 'google-vertex') + * @returns LanguageModelV2Middleware + */ +export function skipGeminiThoughtSignatureMiddleware(aiSdkId: string): LanguageModelV2Middleware { + const MAGIC_STRING = 'skip_thought_signature_validator' + return { + middlewareVersion: 'v2', + + transformParams: async ({ params }) => { + const transformedParams = { ...params } + // Process messages in prompt + if (transformedParams.prompt && Array.isArray(transformedParams.prompt)) { + transformedParams.prompt = transformedParams.prompt.map((message) => { + if (typeof message.content !== 'string') { + for (const part of message.content) { + const googleOptions = part?.providerOptions?.[aiSdkId] + if (googleOptions?.thoughtSignature) { + googleOptions.thoughtSignature = MAGIC_STRING + } + } + } + return message + }) + } + + return transformedParams + } + } +} + +/** + * OpenRouter Reasoning Middleware + * + * Filters out [REDACTED] blocks from OpenRouter reasoning responses. + * OpenRouter may include [REDACTED] markers in reasoning content that + * should be removed for cleaner output. + * + * @see https://openrouter.ai/docs/docs/best-practices/reasoning-tokens + * @returns LanguageModelV2Middleware + */ +export function openrouterReasoningMiddleware(): LanguageModelV2Middleware { + const REDACTED_BLOCK = '[REDACTED]' + return { + middlewareVersion: 'v2', + wrapGenerate: async ({ doGenerate }) => { + const { content, ...rest } = await doGenerate() + const modifiedContent = content.map((part) => { + if (part.type === 'reasoning' && part.text.includes(REDACTED_BLOCK)) { + return { + ...part, + text: part.text.replace(REDACTED_BLOCK, '') + } + } + return part + }) + return { content: modifiedContent, ...rest } + }, + wrapStream: async ({ doStream }) => { + const { stream, ...rest } = await doStream() + return { + stream: stream.pipeThrough( + new TransformStream({ + transform( + chunk: LanguageModelV2StreamPart, + controller: TransformStreamDefaultController + ) { + if (chunk.type === 'reasoning-delta' && chunk.delta.includes(REDACTED_BLOCK)) { + controller.enqueue({ + ...chunk, + delta: chunk.delta.replace(REDACTED_BLOCK, '') + }) + } else { + controller.enqueue(chunk) + } + } + }) + ), + ...rest + } + } + } +} + +/** + * Build shared middlewares based on configuration + * + * This function builds a set of middlewares that are commonly needed + * across different environments (renderer, API server). + * + * @param config - Configuration for middleware building + * @returns Array of AI SDK middlewares + * + * @example + * ```typescript + * import { buildSharedMiddlewares } from '@shared/middleware' + * + * const middlewares = buildSharedMiddlewares({ + * enableReasoning: true, + * modelId: 'gemini-2.5-pro', + * providerId: 'openrouter', + * aiSdkProviderId: 'google' + * }) + * ``` + */ +export function buildSharedMiddlewares(config: SharedMiddlewareConfig): LanguageModelV2Middleware[] { + const middlewares: LanguageModelV2Middleware[] = [] + + // 1. Reasoning extraction middleware + if (config.enableReasoning) { + const tagName = config.reasoningTagName || getReasoningTagName(config.modelId) + middlewares.push(extractReasoningMiddleware({ tagName })) + } + + // 2. OpenRouter-specific: filter [REDACTED] blocks + if (config.providerId === 'openrouter' && config.enableReasoning) { + middlewares.push(openrouterReasoningMiddleware()) + } + + // 3. 
Gemini 3 (2.5) specific: skip thought signature validation + if (isGemini3ModelId(config.modelId) && config.aiSdkProviderId) { + middlewares.push(skipGeminiThoughtSignatureMiddleware(config.aiSdkProviderId)) + } + + return middlewares +} diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts index ddb6d59b37..be8b05aeac 100644 --- a/src/main/apiServer/services/unified-messages.ts +++ b/src/main/apiServer/services/unified-messages.ts @@ -1,4 +1,4 @@ -import type { LanguageModelV2ToolResultOutput } from '@ai-sdk/provider' +import type { LanguageModelV2Middleware, LanguageModelV2ToolResultOutput } from '@ai-sdk/provider' import type { ReasoningPart, ToolCallPart, ToolResultPart } from '@ai-sdk/provider-utils' import type { ImageBlockParam, @@ -6,7 +6,7 @@ import type { TextBlockParam, Tool as AnthropicTool } from '@anthropic-ai/sdk/resources/messages' -import { createProvider as createProviderCore } from '@cherrystudio/ai-core/provider' +import { type AiPlugin, createExecutor } from '@cherrystudio/ai-core' import { loggerService } from '@logger' import { reduxService } from '@main/services/ReduxService' import { AiSdkToAnthropicSSE, formatSSEDone, formatSSEEvent } from '@shared/adapters' @@ -21,8 +21,8 @@ import { } from '@shared/provider' import { defaultAppHeaders } from '@shared/utils' import type { Provider } from '@types' -import type { ImagePart, LanguageModel, ModelMessage, Provider as AiSdkProvider, TextPart, Tool } from 'ai' -import { jsonSchema, stepCountIs, streamText, tool } from 'ai' +import type { ImagePart, ModelMessage, TextPart, Tool } from 'ai' +import { jsonSchema, simulateStreamingMiddleware, stepCountIs, tool } from 'ai' import { net } from 'electron' import type { Response } from 'express' @@ -33,6 +33,9 @@ initializeSharedProviders({ error: (message, error) => logger.error(message, error) }) +/** + * Configuration for unified message streaming + */ export interface UnifiedStreamConfig { response: Response provider: Provider @@ -40,12 +43,31 @@ export interface UnifiedStreamConfig { params: MessageCreateParams onError?: (error: unknown) => void onComplete?: () => void + /** + * Optional AI SDK middlewares to apply + */ + middlewares?: LanguageModelV2Middleware[] + /** + * Optional AI Core plugins to use with the executor + */ + plugins?: AiPlugin[] } /** - * Main process format context for formatProviderApiHost - * Unlike renderer, main process doesn't have direct access to store getters, so use reduxService cache + * Configuration for non-streaming message generation */ +export interface GenerateUnifiedMessageConfig { + provider: Provider + modelId: string + params: MessageCreateParams + middlewares?: LanguageModelV2Middleware[] + plugins?: AiPlugin[] +} + +// ============================================================================ +// Internal Utilities +// ============================================================================ + function getMainProcessFormatContext(): ProviderFormatContext { const vertexSettings = reduxService.selectSync<{ projectId: string; location: string }>('state.llm.settings.vertexai') return { @@ -56,12 +78,7 @@ function getMainProcessFormatContext(): ProviderFormatContext { } } -/** - * Main process context for providerToAiSdkConfig - * Main process doesn't have access to browser APIs like window.keyv - */ const mainProcessSdkContext: AiSdkConfigContext = { - // Simple key rotation - just return first key (no persistent rotation in main process) getRotatedApiKey: (provider) => { 
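+    // No persistent rotation in the main process: always take the first key of a comma-separated list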
const keys = provider.apiKey.split(',').map((k) => k.trim()) return keys[0] || provider.apiKey @@ -69,199 +86,82 @@ const mainProcessSdkContext: AiSdkConfigContext = { fetch: net.fetch as typeof globalThis.fetch } -/** - * Get actual provider configuration for a model - * - * For aggregated providers (new-api, aihubmix, vertexai, azure-openai), - * this resolves the actual provider type based on the model's characteristics. - */ function getActualProvider(provider: Provider, modelId: string): Provider { - // Find the model in provider's models list const model = provider.models?.find((m) => m.id === modelId) - if (!model) { - // If model not found, return provider as-is - return provider - } - - // Resolve actual provider based on model + if (!model) return provider return resolveActualProvider(provider, model) } -/** - * Convert Cherry Studio Provider to AI SDK config - * Uses shared implementation with main process context - */ function providerToAiSdkConfig(provider: Provider, modelId: string): AiSdkConfig { - // First resolve actual provider for aggregated providers const actualProvider = getActualProvider(provider, modelId) - - // Format the provider's apiHost for AI SDK const formattedProvider = formatProviderApiHost(actualProvider, getMainProcessFormatContext()) - - // Use shared implementation return sharedProviderToAiSdkConfig(formattedProvider, modelId, mainProcessSdkContext) } -/** - * Create an AI SDK provider from Cherry Studio provider configuration - */ -async function createAiSdkProvider(config: AiSdkConfig): Promise { - try { - const provider = await createProviderCore(config.providerId, config.options) - logger.debug('AI SDK provider created', { - providerId: config.providerId, - hasOptions: !!config.options - }) - return provider - } catch (error) { - logger.error('Failed to create AI SDK provider', error as Error, { - providerId: config.providerId - }) - throw error - } -} - -/** - * Create an AI SDK language model from a Cherry Studio provider configuration - * Uses shared provider utilities for consistent behavior with renderer - */ -async function createLanguageModel(provider: Provider, modelId: string): Promise { - logger.debug('Creating language model', { - providerId: provider.id, - providerType: provider.type, - modelId, - apiHost: provider.apiHost - }) - - // Convert provider config to AI SDK config - const config = providerToAiSdkConfig(provider, modelId) - - // Create the AI SDK provider - const aiSdkProvider = await createAiSdkProvider(config) - if (!aiSdkProvider) { - throw new Error(`Failed to create AI SDK provider for ${provider.id}`) - } - - // Get the language model - return aiSdkProvider.languageModel(modelId) -} - function convertAnthropicToolResultToAiSdk( content: string | Array ): LanguageModelV2ToolResultOutput { if (typeof content === 'string') { - return { - type: 'text', - value: content - } - } else { - const values: Array< - | { type: 'text'; text: string } - | { - type: 'media' - /** -Base-64 encoded media data. -*/ - data: string - /** -IANA media type. -@see https://www.iana.org/assignments/media-types/media-types.xhtml -*/ - mediaType: string - } - > = [] - for (const block of content) { - if (block.type === 'text') { - values.push({ - type: 'text', - text: block.text - }) - } else if (block.type === 'image') { - values.push({ - type: 'media', - data: block.source.type === 'base64' ? block.source.data : block.source.url, - mediaType: block.source.type === 'base64' ? 
block.source.media_type : 'image/png' - }) - } - } - return { - type: 'content', - value: values + return { type: 'text', value: content } + } + const values: Array<{ type: 'text'; text: string } | { type: 'media'; data: string; mediaType: string }> = [] + for (const block of content) { + if (block.type === 'text') { + values.push({ type: 'text', text: block.text }) + } else if (block.type === 'image') { + values.push({ + type: 'media', + data: block.source.type === 'base64' ? block.source.data : block.source.url, + mediaType: block.source.type === 'base64' ? block.source.media_type : 'image/png' + }) } } + return { type: 'content', value: values } } -/** - * Convert Anthropic tools format to AI SDK tools format - */ function convertAnthropicToolsToAiSdk(tools: MessageCreateParams['tools']): Record | undefined { - if (!tools || tools.length === 0) { - return undefined - } + if (!tools || tools.length === 0) return undefined const aiSdkTools: Record = {} - for (const anthropicTool of tools) { - // Handle different tool types - if (anthropicTool.type === 'bash_20250124') { - // Skip computer use and bash tools - these are Anthropic-specific - continue - } - - // Regular tool (type === 'custom' or no type) + if (anthropicTool.type === 'bash_20250124') continue const toolDef = anthropicTool as AnthropicTool const parameters = toolDef.input_schema as Parameters[0] - aiSdkTools[toolDef.name] = tool({ description: toolDef.description || '', inputSchema: jsonSchema(parameters), - execute: async (input: Record) => { - return input - } + execute: async (input: Record) => input }) } - return Object.keys(aiSdkTools).length > 0 ? aiSdkTools : undefined } -/** - * Convert Anthropic MessageCreateParams to AI SDK message format - */ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage[] { const messages: ModelMessage[] = [] - // Add system message if present + // System message if (params.system) { if (typeof params.system === 'string') { - messages.push({ - role: 'system', - content: params.system - }) + messages.push({ role: 'system', content: params.system }) } else if (Array.isArray(params.system)) { - // Handle TextBlockParam array const systemText = params.system .filter((block) => block.type === 'text') .map((block) => block.text) .join('\n') if (systemText) { - messages.push({ - role: 'system', - content: systemText - }) + messages.push({ role: 'system', content: systemText }) } } } - // Convert user/assistant messages + // User/assistant messages for (const msg of params.messages) { if (typeof msg.content === 'string') { - if (msg.role === 'user') { - messages.push({ role: 'user', content: msg.content }) - } else { - messages.push({ role: 'assistant', content: msg.content }) - } + messages.push({ + role: msg.role === 'user' ? 
'user' : 'assistant', + content: msg.content + }) } else if (Array.isArray(msg.content)) { - // Handle content blocks const textParts: TextPart[] = [] const imageParts: ImagePart[] = [] const reasoningParts: ReasoningPart[] = [] @@ -278,15 +178,9 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage } else if (block.type === 'image') { const source = block.source if (source.type === 'base64') { - imageParts.push({ - type: 'image', - image: `data:${source.media_type};base64,${source.data}` - }) + imageParts.push({ type: 'image', image: `data:${source.media_type};base64,${source.data}` }) } else if (source.type === 'url') { - imageParts.push({ - type: 'image', - image: source.url - }) + imageParts.push({ type: 'image', image: source.url }) } } else if (block.type === 'tool_use') { toolCallParts.push({ @@ -306,30 +200,18 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage } if (toolResultParts.length > 0) { - messages.push({ - role: 'tool', - content: [...toolResultParts] - }) + messages.push({ role: 'tool', content: [...toolResultParts] }) } - // Build the message based on role - // Only push user/assistant message if there's actual content (avoid empty messages) if (msg.role === 'user') { const userContent = [...textParts, ...imageParts] if (userContent.length > 0) { - messages.push({ - role: 'user', - content: userContent - }) + messages.push({ role: 'user', content: userContent }) } } else { - // Assistant messages contain tool calls, not tool results const assistantContent = [...reasoningParts, ...textParts, ...toolCallParts] if (assistantContent.length > 0) { - messages.push({ - role: 'assistant', - content: assistantContent - }) + messages.push({ role: 'assistant', content: assistantContent }) } } } @@ -338,67 +220,54 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage return messages } -/** - * Stream a message request using AI SDK and convert to Anthropic SSE format - */ -// TODO: 使用ai-core executor集成中间件和transformstream进来 -export async function streamUnifiedMessages(config: UnifiedStreamConfig): Promise { - const { response, provider, modelId, params, onError, onComplete } = config +interface ExecuteStreamConfig { + provider: Provider + modelId: string + params: MessageCreateParams + middlewares?: LanguageModelV2Middleware[] + plugins?: AiPlugin[] + onEvent?: (event: Parameters[0]) => void +} - logger.info('Starting unified message stream', { - providerId: provider.id, - providerType: provider.type, - modelId, - stream: params.stream +/** + * Core stream execution function - single source of truth for AI SDK calls + */ +async function executeStream(config: ExecuteStreamConfig): Promise { + const { provider, modelId, params, middlewares = [], plugins = [], onEvent } = config + + // Convert provider config to AI SDK config + const sdkConfig = providerToAiSdkConfig(provider, modelId) + + logger.debug('Created AI SDK config', { + providerId: sdkConfig.providerId, + hasOptions: !!sdkConfig.options }) - try { - response.setHeader('Content-Type', 'text/event-stream') - response.setHeader('Cache-Control', 'no-cache') - response.setHeader('Connection', 'keep-alive') - response.setHeader('X-Accel-Buffering', 'no') + // Create executor with plugins + const executor = createExecutor(sdkConfig.providerId, sdkConfig.options, plugins) - const model = await createLanguageModel(provider, modelId) + // Convert messages and tools + const coreMessages = convertAnthropicToAiMessages(params) + const tools = 
convertAnthropicToolsToAiSdk(params.tools) - const coreMessages = convertAnthropicToAiMessages(params) + logger.debug('Converted messages', { + originalCount: params.messages.length, + convertedCount: coreMessages.length, + hasSystem: !!params.system, + hasTools: !!tools, + toolCount: tools ? Object.keys(tools).length : 0 + }) - // Convert tools if present - const tools = convertAnthropicToolsToAiSdk(params.tools) + // Create the adapter + const adapter = new AiSdkToAnthropicSSE({ + model: `${provider.id}:${modelId}`, + onEvent: onEvent || (() => {}) + }) - logger.debug('Converted messages', { - originalCount: params.messages.length, - convertedCount: coreMessages.length, - hasSystem: !!params.system, - hasTools: !!tools, - toolCount: tools ? Object.keys(tools).length : 0, - toolNames: tools ? Object.keys(tools).slice(0, 10) : [], - paramsToolCount: params.tools?.length || 0 - }) - - // Debug: Log message structure to understand tool_result handling - logger.silly('Message structure for debugging', { - messages: coreMessages.map((m) => ({ - role: m.role, - contentTypes: Array.isArray(m.content) - ? m.content.map((c: { type: string }) => c.type) - : typeof m.content === 'string' - ? ['string'] - : ['unknown'] - })) - }) - - // Create the adapter - const adapter = new AiSdkToAnthropicSSE({ - model: `${provider.id}:${modelId}`, - onEvent: (event) => { - const sseData = formatSSEEvent(event) - response.write(sseData) - } - }) - - // Start streaming - const result = streamText({ - model, + // Execute stream + const result = await executor.streamText( + { + model: modelId, messages: coreMessages, maxOutputTokens: params.max_tokens, temperature: params.temperature, @@ -408,38 +277,65 @@ export async function streamUnifiedMessages(config: UnifiedStreamConfig): Promis headers: defaultAppHeaders(), tools, providerOptions: {} - }) + }, + { middlewares } + ) - // Process the stream through the adapter - await adapter.processStream(result.fullStream) + // Process the stream through the adapter + await adapter.processStream(result.fullStream) + + return adapter +} + +/** + * Stream a message request using AI SDK executor and convert to Anthropic SSE format + */ +export async function streamUnifiedMessages(config: UnifiedStreamConfig): Promise { + const { response, provider, modelId, params, onError, onComplete, middlewares = [], plugins = [] } = config + + logger.info('Starting unified message stream', { + providerId: provider.id, + providerType: provider.type, + modelId, + stream: params.stream, + middlewareCount: middlewares.length, + pluginCount: plugins.length + }) + + try { + response.setHeader('Content-Type', 'text/event-stream') + response.setHeader('Cache-Control', 'no-cache') + response.setHeader('Connection', 'keep-alive') + response.setHeader('X-Accel-Buffering', 'no') + + await executeStream({ + provider, + modelId, + params, + middlewares, + plugins, + onEvent: (event) => { + const sseData = formatSSEEvent(event) + response.write(sseData) + } + }) // Send done marker response.write(formatSSEDone()) response.end() - logger.info('Unified message stream completed', { - providerId: provider.id, - modelId - }) - + logger.info('Unified message stream completed', { providerId: provider.id, modelId }) onComplete?.() } catch (error) { - logger.error('Error in unified message stream', error as Error, { - providerId: provider.id, - modelId - }) + logger.error('Error in unified message stream', error as Error, { providerId: provider.id, modelId }) - // Try to send error event if response is still 
writable if (!response.writableEnded) { try { const errorMessage = error instanceof Error ? error.message : 'Unknown error' response.write( `event: error\ndata: ${JSON.stringify({ type: 'error', - error: { - type: 'api_error', - message: errorMessage - } + error: { type: 'api_error', message: errorMessage } })}\n\n` ) response.end() @@ -455,64 +351,61 @@ export async function streamUnifiedMessages(config: UnifiedStreamConfig): Promis /** * Generate a non-streaming message response + * + * Uses simulateStreamingMiddleware to reuse the same streaming logic, + * similar to renderer's ModernAiProvider pattern. */ export async function generateUnifiedMessage( - provider: Provider, - modelId: string, - params: MessageCreateParams + providerOrConfig: Provider | GenerateUnifiedMessageConfig, + modelId?: string, + params?: MessageCreateParams ): Promise> { + // Support both old signature and new config-based signature + let config: GenerateUnifiedMessageConfig + if ('provider' in providerOrConfig && 'modelId' in providerOrConfig && 'params' in providerOrConfig) { + config = providerOrConfig + } else { + config = { + provider: providerOrConfig as Provider, + modelId: modelId!, + params: params! + } + } + + const { provider, middlewares = [], plugins = [] } = config + logger.info('Starting unified message generation', { providerId: provider.id, providerType: provider.type, - modelId + modelId: config.modelId, + middlewareCount: middlewares.length, + pluginCount: plugins.length }) try { - // Create language model (async - uses @cherrystudio/ai-core) - const model = await createLanguageModel(provider, modelId) + // Add simulateStreamingMiddleware to reuse streaming logic for non-streaming + const allMiddlewares = [simulateStreamingMiddleware(), ...middlewares] - // Convert messages and tools - const coreMessages = convertAnthropicToAiMessages(params) - const tools = convertAnthropicToolsToAiSdk(params.tools) - - // Create adapter to collect the response - let finalResponse: ReturnType | null = null - const adapter = new AiSdkToAnthropicSSE({ - model: `${provider.id}:${modelId}`, - onEvent: () => { - // We don't need to emit events for non-streaming - } + const adapter = await executeStream({ + provider, + modelId: config.modelId, + params: config.params, + middlewares: allMiddlewares, + plugins }) - // Generate text - const result = streamText({ - model, - messages: coreMessages, - maxOutputTokens: params.max_tokens, - temperature: params.temperature, - topP: params.top_p, - stopSequences: params.stop_sequences, - headers: defaultAppHeaders(), - tools, - stopWhen: stepCountIs(100) - }) - - // Process the stream to build the response - await adapter.processStream(result.fullStream) - - // Get the final response - finalResponse = adapter.buildNonStreamingResponse() + const finalResponse = adapter.buildNonStreamingResponse() logger.info('Unified message generation completed', { providerId: provider.id, - modelId + modelId: config.modelId }) return finalResponse } catch (error) { logger.error('Error in unified message generation', error as Error, { providerId: provider.id, - modelId + modelId: config.modelId }) throw error } diff --git a/src/renderer/src/aiCore/middleware/AiSdkMiddlewareBuilder.ts b/src/renderer/src/aiCore/middleware/AiSdkMiddlewareBuilder.ts index b314ddd737..82e1c32465 100644 --- a/src/renderer/src/aiCore/middleware/AiSdkMiddlewareBuilder.ts +++ b/src/renderer/src/aiCore/middleware/AiSdkMiddlewareBuilder.ts @@ -5,6 +5,7 @@ import type { MCPTool } from '@renderer/types' import { type 
Assistant, type Message, type Model, type Provider, SystemProviderIds } from '@renderer/types' import type { Chunk } from '@renderer/types/chunk' import { isSupportEnableThinkingProvider } from '@renderer/utils/provider' +import { openrouterReasoningMiddleware, skipGeminiThoughtSignatureMiddleware } from '@shared/middleware' import type { LanguageModelMiddleware } from 'ai' import { extractReasoningMiddleware, simulateStreamingMiddleware } from 'ai' import { isEmpty } from 'lodash' @@ -13,9 +14,7 @@ import { getAiSdkProviderId } from '../provider/factory' import { isOpenRouterGeminiGenerateImageModel } from '../utils/image' import { noThinkMiddleware } from './noThinkMiddleware' import { openrouterGenerateImageMiddleware } from './openrouterGenerateImageMiddleware' -import { openrouterReasoningMiddleware } from './openrouterReasoningMiddleware' import { qwenThinkingMiddleware } from './qwenThinkingMiddleware' -import { skipGeminiThoughtSignatureMiddleware } from './skipGeminiThoughtSignatureMiddleware' import { toolChoiceMiddleware } from './toolChoiceMiddleware' const logger = loggerService.withContext('AiSdkMiddlewareBuilder') diff --git a/src/renderer/src/aiCore/middleware/openrouterReasoningMiddleware.ts b/src/renderer/src/aiCore/middleware/openrouterReasoningMiddleware.ts deleted file mode 100644 index 9ef3df61e9..0000000000 --- a/src/renderer/src/aiCore/middleware/openrouterReasoningMiddleware.ts +++ /dev/null @@ -1,50 +0,0 @@ -import type { LanguageModelV2StreamPart } from '@ai-sdk/provider' -import type { LanguageModelMiddleware } from 'ai' - -/** - * https://openrouter.ai/docs/docs/best-practices/reasoning-tokens#example-preserving-reasoning-blocks-with-openrouter-and-claude - * - * @returns LanguageModelMiddleware - a middleware filter redacted block - */ -export function openrouterReasoningMiddleware(): LanguageModelMiddleware { - const REDACTED_BLOCK = '[REDACTED]' - return { - middlewareVersion: 'v2', - wrapGenerate: async ({ doGenerate }) => { - const { content, ...rest } = await doGenerate() - const modifiedContent = content.map((part) => { - if (part.type === 'reasoning' && part.text.includes(REDACTED_BLOCK)) { - return { - ...part, - text: part.text.replace(REDACTED_BLOCK, '') - } - } - return part - }) - return { content: modifiedContent, ...rest } - }, - wrapStream: async ({ doStream }) => { - const { stream, ...rest } = await doStream() - return { - stream: stream.pipeThrough( - new TransformStream({ - transform( - chunk: LanguageModelV2StreamPart, - controller: TransformStreamDefaultController - ) { - if (chunk.type === 'reasoning-delta' && chunk.delta.includes(REDACTED_BLOCK)) { - controller.enqueue({ - ...chunk, - delta: chunk.delta.replace(REDACTED_BLOCK, '') - }) - } else { - controller.enqueue(chunk) - } - } - }) - ), - ...rest - } - } - } -} diff --git a/src/renderer/src/aiCore/middleware/skipGeminiThoughtSignatureMiddleware.ts b/src/renderer/src/aiCore/middleware/skipGeminiThoughtSignatureMiddleware.ts deleted file mode 100644 index da318ea60d..0000000000 --- a/src/renderer/src/aiCore/middleware/skipGeminiThoughtSignatureMiddleware.ts +++ /dev/null @@ -1,36 +0,0 @@ -import type { LanguageModelMiddleware } from 'ai' - -/** - * skip Gemini Thought Signature Middleware - * 由于多模型客户端请求的复杂性(可以中途切换其他模型),这里选择通过中间件方式添加跳过所有 Gemini3 思考签名 - * Due to the complexity of multi-model client requests (which can switch to other models mid-process), - * it was decided to add a skip for all Gemini3 thinking signatures via middleware. 
- * @param aiSdkId AI SDK Provider ID - * @returns LanguageModelMiddleware - */ -export function skipGeminiThoughtSignatureMiddleware(aiSdkId: string): LanguageModelMiddleware { - const MAGIC_STRING = 'skip_thought_signature_validator' - return { - middlewareVersion: 'v2', - - transformParams: async ({ params }) => { - const transformedParams = { ...params } - // Process messages in prompt - if (transformedParams.prompt && Array.isArray(transformedParams.prompt)) { - transformedParams.prompt = transformedParams.prompt.map((message) => { - if (typeof message.content !== 'string') { - for (const part of message.content) { - const googleOptions = part?.providerOptions?.[aiSdkId] - if (googleOptions?.thoughtSignature) { - googleOptions.thoughtSignature = MAGIC_STRING - } - } - } - return message - }) - } - - return transformedParams - } - } -} diff --git a/tsconfig.node.json b/tsconfig.node.json index 9871e604f2..4f9e797146 100644 --- a/tsconfig.node.json +++ b/tsconfig.node.json @@ -7,9 +7,11 @@ "src/main/env.d.ts", "src/renderer/src/types/*", "packages/shared/**/*", + "packages/aiCore/src/**/*", "scripts", "packages/mcp-trace/**/*", - "src/renderer/src/services/traceApi.ts" + "src/renderer/src/services/traceApi.ts", + "packages/ai-sdk-provider/**/*" ], "compilerOptions": { "composite": true, From 356e82842299df02701d55cc59f989c6f3ca095f Mon Sep 17 00:00:00 2001 From: suyao Date: Fri, 28 Nov 2025 04:12:18 +0800 Subject: [PATCH 15/53] feat: enhance AI SDK integration with middleware support and improve message handling --- .../shared/adapters/AiSdkToAnthropicSSE.ts | 45 +++---- packages/shared/middleware/middlewares.ts | 2 +- src/main/apiServer/routes/messages.ts | 23 +++- .../apiServer/services/unified-messages.ts | 120 +++++++++++++----- 4 files changed, 130 insertions(+), 60 deletions(-) diff --git a/packages/shared/adapters/AiSdkToAnthropicSSE.ts b/packages/shared/adapters/AiSdkToAnthropicSSE.ts index 1674609236..f1d6b0c022 100644 --- a/packages/shared/adapters/AiSdkToAnthropicSSE.ts +++ b/packages/shared/adapters/AiSdkToAnthropicSSE.ts @@ -36,7 +36,7 @@ import type { Usage } from '@anthropic-ai/sdk/resources/messages' import { loggerService } from '@logger' -import type { TextStreamPart, ToolSet } from 'ai' +import type { FinishReason, LanguageModelUsage, TextStreamPart, ToolSet } from 'ai' const logger = loggerService.withContext('AiSdkToAnthropicSSE') @@ -56,6 +56,7 @@ interface AdapterState { model: string inputTokens: number outputTokens: number + cacheInputTokens: number currentBlockIndex: number blocks: Map textBlockIndex: number | null @@ -67,10 +68,6 @@ interface AdapterState { hasEmittedMessageStart: boolean } -// ============================================================================ -// Adapter Class -// ============================================================================ - export type SSEEventCallback = (event: RawMessageStreamEvent) => void export interface AiSdkToAnthropicSSEOptions { @@ -94,6 +91,7 @@ export class AiSdkToAnthropicSSE { model: options.model, inputTokens: options.inputTokens || 0, outputTokens: 0, + cacheInputTokens: 0, currentBlockIndex: 0, blocks: new Map(), textBlockIndex: null, @@ -153,19 +151,19 @@ export class AiSdkToAnthropicSSE { // === Reasoning/Thinking Events === case 'reasoning-start': { - const reasoningId = (chunk as { id?: string }).id || `reasoning_${Date.now()}` + const reasoningId = chunk.id this.startThinkingBlock(reasoningId) break } case 'reasoning-delta': { - const reasoningId = (chunk as { id?: string }).id + const 
reasoningId = chunk.id this.emitThinkingDelta(chunk.text || '', reasoningId) break } case 'reasoning-end': { - const reasoningId = (chunk as { id?: string }).id + const reasoningId = chunk.id this.stopThinkingBlock(reasoningId) break } @@ -176,14 +174,18 @@ export class AiSdkToAnthropicSSE { type: 'tool-call', toolCallId: chunk.toolCallId, toolName: chunk.toolName, - // AI SDK uses 'args' in some versions and 'input' in others - args: 'args' in chunk ? chunk.args : (chunk as any).input + args: chunk.input }) break case 'tool-result': - // Tool results are handled separately in Anthropic API - // They come from user messages, not assistant stream + // this.handleToolResult({ + // type: 'tool-result', + // toolCallId: chunk.toolCallId, + // toolName: chunk.toolName, + // args: chunk.input, + // result: chunk.output + // }) break // === Completion Events === @@ -465,34 +467,29 @@ export class AiSdkToAnthropicSSE { this.state.stopReason = 'tool_use' } - private handleFinish(chunk: { - type: 'finish' - finishReason?: string - totalUsage?: { - inputTokens?: number - outputTokens?: number - } - }): void { + private handleFinish(chunk: { type: 'finish'; finishReason?: FinishReason; totalUsage?: LanguageModelUsage }): void { // Update usage if (chunk.totalUsage) { this.state.inputTokens = chunk.totalUsage.inputTokens || 0 this.state.outputTokens = chunk.totalUsage.outputTokens || 0 + this.state.cacheInputTokens = chunk.totalUsage.cachedInputTokens || 0 } // Determine finish reason if (!this.state.stopReason) { switch (chunk.finishReason) { case 'stop': - case 'end_turn': this.state.stopReason = 'end_turn' break case 'length': - case 'max_tokens': this.state.stopReason = 'max_tokens' break case 'tool-calls': this.state.stopReason = 'tool_use' break + case 'content-filter': + this.state.stopReason = 'refusal' + break default: this.state.stopReason = 'end_turn' } @@ -539,8 +536,8 @@ export class AiSdkToAnthropicSSE { // Emit message_delta with final stop reason and usage const usage: MessageDeltaUsage = { output_tokens: this.state.outputTokens, - input_tokens: null, - cache_creation_input_tokens: null, + input_tokens: this.state.inputTokens, + cache_creation_input_tokens: this.state.cacheInputTokens, cache_read_input_tokens: null, server_tool_use: null } diff --git a/packages/shared/middleware/middlewares.ts b/packages/shared/middleware/middlewares.ts index d9725101c2..de857699f7 100644 --- a/packages/shared/middleware/middlewares.ts +++ b/packages/shared/middleware/middlewares.ts @@ -50,7 +50,7 @@ export interface SharedMiddlewareConfig { export function isGemini3ModelId(modelId?: string): boolean { if (!modelId) return false const lowerModelId = modelId.toLowerCase() - return lowerModelId.includes('gemini-2.5') || lowerModelId.includes('gemini-exp') || lowerModelId.includes('gemini-3') + return lowerModelId.includes('gemini-3') } /** diff --git a/src/main/apiServer/routes/messages.ts b/src/main/apiServer/routes/messages.ts index 907b498273..018e7d60ad 100644 --- a/src/main/apiServer/routes/messages.ts +++ b/src/main/apiServer/routes/messages.ts @@ -1,5 +1,7 @@ import type { MessageCreateParams } from '@anthropic-ai/sdk/resources' import { loggerService } from '@logger' +import { buildSharedMiddlewares, type SharedMiddlewareConfig } from '@shared/middleware' +import { getAiSdkProviderId } from '@shared/provider' import type { Provider } from '@types' import type { Request, Response } from 'express' import express from 'express' @@ -206,12 +208,26 @@ async function handleUnifiedProcessing({ return } + 
const middlewareConfig: SharedMiddlewareConfig = { + modelId: actualModelId, + providerId: provider.id, + aiSdkProviderId: getAiSdkProviderId(provider) + } + const middlewares = buildSharedMiddlewares(middlewareConfig) + + logger.debug('Built middlewares for unified processing', { + middlewareCount: middlewares.length, + modelId: actualModelId, + providerId: provider.id + }) + if (request.stream) { await streamUnifiedMessages({ response: res, provider, modelId: actualModelId, params: request, + middlewares, onError: (error) => { logger.error('Stream error', error as Error) }, @@ -220,7 +236,12 @@ async function handleUnifiedProcessing({ } }) } else { - const response = await generateUnifiedMessage(provider, actualModelId, request) + const response = await generateUnifiedMessage({ + provider, + modelId: actualModelId, + params: request, + middlewares + }) res.json(response) } } catch (error: any) { diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts index be8b05aeac..4370a429d0 100644 --- a/src/main/apiServer/services/unified-messages.ts +++ b/src/main/apiServer/services/unified-messages.ts @@ -1,5 +1,5 @@ import type { LanguageModelV2Middleware, LanguageModelV2ToolResultOutput } from '@ai-sdk/provider' -import type { ReasoningPart, ToolCallPart, ToolResultPart } from '@ai-sdk/provider-utils' +import type { ProviderOptions, ReasoningPart, ToolCallPart, ToolResultPart } from '@ai-sdk/provider-utils' import type { ImageBlockParam, MessageCreateParams, @@ -7,9 +7,11 @@ import type { Tool as AnthropicTool } from '@anthropic-ai/sdk/resources/messages' import { type AiPlugin, createExecutor } from '@cherrystudio/ai-core' +import { createProvider as createProviderCore } from '@cherrystudio/ai-core/provider' import { loggerService } from '@logger' import { reduxService } from '@main/services/ReduxService' import { AiSdkToAnthropicSSE, formatSSEDone, formatSSEEvent } from '@shared/adapters' +import { isGemini3ModelId } from '@shared/middleware' import { type AiSdkConfig, type AiSdkConfigContext, @@ -21,13 +23,15 @@ import { } from '@shared/provider' import { defaultAppHeaders } from '@shared/utils' import type { Provider } from '@types' -import type { ImagePart, ModelMessage, TextPart, Tool } from 'ai' -import { jsonSchema, simulateStreamingMiddleware, stepCountIs, tool } from 'ai' +import type { ImagePart, ModelMessage, Provider as AiSdkProvider, TextPart, Tool } from 'ai' +import { jsonSchema, simulateStreamingMiddleware, stepCountIs, tool, wrapLanguageModel } from 'ai' import { net } from 'electron' import type { Response } from 'express' const logger = loggerService.withContext('UnifiedMessagesService') +const MAGIC_STRING = 'skip_thought_signature_validator' + initializeSharedProviders({ warn: (message) => logger.warn(message), error: (message, error) => logger.error(message, error) @@ -64,10 +68,6 @@ export interface GenerateUnifiedMessageConfig { plugins?: AiPlugin[] } -// ============================================================================ -// Internal Utilities -// ============================================================================ - function getMainProcessFormatContext(): ProviderFormatContext { const vertexSettings = reduxService.selectSync<{ projectId: string; location: string }>('state.llm.settings.vertexai') return { @@ -154,6 +154,19 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage } } + // Build a map of tool_use_id -> toolName from all messages first + // This is needed 
because tool_result references tool_use from previous assistant messages + const toolCallIdToName = new Map() + for (const msg of params.messages) { + if (Array.isArray(msg.content)) { + for (const block of msg.content) { + if (block.type === 'tool_use') { + toolCallIdToName.set(block.id, block.name) + } + } + } + } + // User/assistant messages for (const msg of params.messages) { if (typeof msg.content === 'string') { @@ -190,10 +203,12 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage input: block.input }) } else if (block.type === 'tool_result') { + // Look up toolName from the pre-built map (covers cross-message references) + const toolName = toolCallIdToName.get(block.tool_use_id) || 'unknown' toolResultParts.push({ type: 'tool-result', toolCallId: block.tool_use_id, - toolName: toolCallParts.find((t) => t.toolCallId === block.tool_use_id)?.toolName || 'unknown', + toolName, output: block.content ? convertAnthropicToolResultToAiSdk(block.content) : { type: 'text', value: '' } }) } @@ -211,7 +226,18 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage } else { const assistantContent = [...reasoningParts, ...textParts, ...toolCallParts] if (assistantContent.length > 0) { - messages.push({ role: 'assistant', content: assistantContent }) + let providerOptions: ProviderOptions | undefined = undefined + if (isGemini3ModelId(params.model)) { + providerOptions = { + google: { + thoughtSignature: MAGIC_STRING + }, + openrouter: { + reasoning_details: [] + } + } + } + messages.push({ role: 'assistant', content: assistantContent, providerOptions }) } } } @@ -229,6 +255,32 @@ interface ExecuteStreamConfig { onEvent?: (event: Parameters[0]) => void } +/** + * Create AI SDK provider instance from config + * Similar to renderer's createAiSdkProvider + */ +async function createAiSdkProvider(config: AiSdkConfig): Promise { + let providerId = config.providerId + + // Handle special provider modes (same as renderer) + if (providerId === 'openai' && config.options?.mode === 'chat') { + providerId = 'openai-chat' + } else if (providerId === 'azure' && config.options?.mode === 'responses') { + providerId = 'azure-responses' + } else if (providerId === 'cherryin' && config.options?.mode === 'chat') { + providerId = 'cherryin-chat' + } + + const provider = await createProviderCore(providerId, config.options) + + logger.debug('AI SDK provider created', { + providerId, + hasOptions: !!config.options + }) + + return provider +} + /** * Core stream execution function - single source of truth for AI SDK calls */ @@ -240,9 +292,20 @@ async function executeStream(config: ExecuteStreamConfig): Promise 0 && typeof baseModel === 'object' + ? 
(wrapLanguageModel({ model: baseModel, middleware: middlewares }) as typeof baseModel) + : baseModel + // Create executor with plugins const executor = createExecutor(sdkConfig.providerId, sdkConfig.options, plugins) @@ -250,36 +313,25 @@ async function executeStream(config: ExecuteStreamConfig): Promise {}) }) - // Execute stream - const result = await executor.streamText( - { - model: modelId, - messages: coreMessages, - maxOutputTokens: params.max_tokens, - temperature: params.temperature, - topP: params.top_p, - stopSequences: params.stop_sequences, - stopWhen: stepCountIs(100), - headers: defaultAppHeaders(), - tools, - providerOptions: {} - }, - { middlewares } - ) + // Execute stream - pass model object instead of string + const result = await executor.streamText({ + model, // Now passing LanguageModel object, not string + messages: coreMessages, + maxOutputTokens: params.max_tokens, + temperature: params.temperature, + topP: params.top_p, + stopSequences: params.stop_sequences, + stopWhen: stepCountIs(100), + headers: defaultAppHeaders(), + tools, + providerOptions: {} + }) // Process the stream through the adapter await adapter.processStream(result.fullStream) From d367040fd4e5798e81768128b675bf7da5b45adc Mon Sep 17 00:00:00 2001 From: suyao Date: Fri, 28 Nov 2025 13:11:13 +0800 Subject: [PATCH 16/53] feat: implement reasoning cache for improved performance and error handling in AI SDK integration --- .../shared/adapters/AiSdkToAnthropicSSE.ts | 44 ++----- src/main/apiServer/routes/messages.ts | 1 - src/main/apiServer/services/cache.ts | 116 ++++++++++++++++++ src/main/apiServer/services/messages.ts | 38 +++++- .../apiServer/services/unified-messages.ts | 34 ++--- .../claudecode/claude-stream-state.ts | 11 ++ .../agents/services/claudecode/index.ts | 13 ++ .../agents/services/claudecode/transform.ts | 45 ++++--- 8 files changed, 225 insertions(+), 77 deletions(-) create mode 100644 src/main/apiServer/services/cache.ts diff --git a/packages/shared/adapters/AiSdkToAnthropicSSE.ts b/packages/shared/adapters/AiSdkToAnthropicSSE.ts index f1d6b0c022..9b23638f48 100644 --- a/packages/shared/adapters/AiSdkToAnthropicSSE.ts +++ b/packages/shared/adapters/AiSdkToAnthropicSSE.ts @@ -36,7 +36,8 @@ import type { Usage } from '@anthropic-ai/sdk/resources/messages' import { loggerService } from '@logger' -import type { FinishReason, LanguageModelUsage, TextStreamPart, ToolSet } from 'ai' +import { reasoningCache } from '@main/apiServer/services/cache' +import { type FinishReason, type LanguageModelUsage, type TextStreamPart, type ToolSet } from 'ai' const logger = loggerService.withContext('AiSdkToAnthropicSSE') @@ -125,6 +126,9 @@ export class AiSdkToAnthropicSSE { // Ensure all blocks are closed and emit final events this.finalize() + } catch (error) { + await reader.cancel() + throw error } finally { reader.releaseLock() } @@ -188,8 +192,13 @@ export class AiSdkToAnthropicSSE { // }) break - // === Completion Events === case 'finish-step': + if ( + chunk.providerMetadata?.openrouter?.reasoning_details && + Array.isArray(chunk.providerMetadata.openrouter.reasoning_details) + ) { + reasoningCache.set('openrouter', chunk.providerMetadata?.openrouter?.reasoning_details) + } if (chunk.finishReason === 'tool-calls') { this.state.stopReason = 'tool_use' } @@ -199,10 +208,8 @@ export class AiSdkToAnthropicSSE { this.handleFinish(chunk) break - // === Error Events === case 'error': - this.handleError(chunk.error) - break + throw chunk.error // Ignore other event types default: @@ -496,33 +503,6 @@ 
export class AiSdkToAnthropicSSE {
   }
 
-  private handleError(error: unknown): void {
-    // Log the error for debugging
-    logger.warn('AiSdkToAnthropicSSE - Provider error received:', { error })
-
-    // Extract error message
-    let errorMessage = 'Unknown error from provider'
-    if (error && typeof error === 'object') {
-      const err = error as { message?: string; metadata?: { raw?: string } }
-      if (err.metadata?.raw) {
-        errorMessage = `Provider error: ${err.metadata.raw}`
-      } else if (err.message) {
-        errorMessage = err.message
-      }
-    } else if (typeof error === 'string') {
-      errorMessage = error
-    }
-
-    // Emit error as a text block so the user can see it
-    // First close any open thinking blocks to maintain proper event order
-    for (const reasoningId of Array.from(this.state.thinkingBlocks.keys())) {
-      this.stopThinkingBlock(reasoningId)
-    }
-
-    // Emit the error as text
-    this.emitTextDelta(`\n\n[Error: ${errorMessage}]\n`)
-  }
-
   private finalize(): void {
     // Close any open blocks
     if (this.state.textBlockIndex !== null) {
diff --git a/src/main/apiServer/routes/messages.ts b/src/main/apiServer/routes/messages.ts
index 018e7d60ad..1e18c86118 100644
--- a/src/main/apiServer/routes/messages.ts
+++ b/src/main/apiServer/routes/messages.ts
@@ -245,7 +245,6 @@ async function handleUnifiedProcessing({
       res.json(response)
     }
   } catch (error: any) {
-    logger.error('Unified processing error', { error })
     const { statusCode, errorResponse } = messagesService.transformError(error)
     res.status(statusCode).json(errorResponse)
   }
diff --git a/src/main/apiServer/services/cache.ts b/src/main/apiServer/services/cache.ts
new file mode 100644
index 0000000000..765ab1e1b9
--- /dev/null
+++ b/src/main/apiServer/services/cache.ts
@@ -0,0 +1,116 @@
+import { loggerService } from '@logger'
+
+const logger = loggerService.withContext('Cache')
+/**
+ * Cache entry with TTL support
+ */
+interface CacheEntry<T> {
+  details: T[]
+  timestamp: number
+}
+
+/**
+ * In-memory cache for reasoning details
+ * Key: signature
+ * Value: reasoning array with timestamp
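+ *
+ * Usage sketch (illustrative; the unified-messages service keys entries by
+ * provider ID rather than a per-response signature, e.g. 'openrouter'):
+ *
+ * ```typescript
+ * reasoningCache.set('openrouter', reasoningDetails) // reasoningDetails: provider metadata array
+ * const cached = reasoningCache.get('openrouter')    // undefined once the TTL lapses
+ * ```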
cleanup
+   */
+  private startCleanup(): void {
+    // Cleanup every 5 minutes
+    this.cleanupInterval = setInterval(() => this.cleanup(), 5 * 60 * 1000)
+  }
+
+  /**
+   * Stop cleanup and clear cache
+   */
+  destroy(): void {
+    if (this.cleanupInterval) {
+      clearInterval(this.cleanupInterval)
+      this.cleanupInterval = null
+    }
+    this.cache.clear()
+  }
+
+  /**
+   * Get cache stats for debugging
+   */
+  stats(): { size: number; ttlMs: number } {
+    return {
+      size: this.cache.size,
+      ttlMs: this.ttlMs
+    }
+  }
+}
+
+// Singleton cache instance
+export const reasoningCache = new ReasoningCache()
diff --git a/src/main/apiServer/services/messages.ts b/src/main/apiServer/services/messages.ts
index e3fbd069a7..3277378266 100644
--- a/src/main/apiServer/services/messages.ts
+++ b/src/main/apiServer/services/messages.ts
@@ -4,6 +4,7 @@ import { loggerService } from '@logger'
 import anthropicService from '@main/services/AnthropicService'
 import { buildClaudeCodeSystemMessage, getSdkClient } from '@shared/anthropic'
 import type { Provider } from '@types'
+import { APICallError } from 'ai'
 import { net } from 'electron'
 import type { Response } from 'express'
 
@@ -253,9 +254,36 @@ export class MessagesService {
   }
 
   transformError(error: any): { statusCode: number; errorResponse: ErrorResponse } {
-    let statusCode = 500
-    let errorType = 'api_error'
-    let errorMessage = 'Internal server error'
+    let statusCode: number | undefined = undefined
+    let errorType: string | undefined = undefined
+    let errorMessage: string | undefined = undefined
+
+    const errorMap: Record<number, string> = {
+      400: 'invalid_request_error',
+      401: 'authentication_error',
+      403: 'forbidden_error',
+      404: 'not_found_error',
+      429: 'rate_limit_error',
+      500: 'internal_server_error'
+    }
+
+    if (APICallError.isInstance(error)) {
+      statusCode = error.statusCode
+      errorMessage = error.message
+      if (statusCode) {
+        return {
+          statusCode,
+          errorResponse: {
+            type: 'error',
+            error: {
+              type: errorMap[statusCode] || 'api_error',
+              message: errorMessage,
+              requestId: error.name
+            }
+          }
+        }
+      }
+    }
 
     const anthropicStatus = typeof error?.status === 'number' ? error.status : undefined
     const anthropicError = error?.error
@@ -297,11 +325,11 @@ export class MessagesService {
       typeof errorMessage === 'string' && errorMessage.length > 0 ? errorMessage : 'Internal server error'
 
     return {
-      statusCode,
+      statusCode: statusCode ??
500, errorResponse: { type: 'error', error: { - type: errorType, + type: errorType || 'api_error', message: safeErrorMessage, requestId: error?.request_id } diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts index 4370a429d0..5cd59377f6 100644 --- a/src/main/apiServer/services/unified-messages.ts +++ b/src/main/apiServer/services/unified-messages.ts @@ -23,11 +23,13 @@ import { } from '@shared/provider' import { defaultAppHeaders } from '@shared/utils' import type { Provider } from '@types' -import type { ImagePart, ModelMessage, Provider as AiSdkProvider, TextPart, Tool } from 'ai' +import type { ImagePart, JSONValue, ModelMessage, Provider as AiSdkProvider, TextPart, Tool } from 'ai' import { jsonSchema, simulateStreamingMiddleware, stepCountIs, tool, wrapLanguageModel } from 'ai' import { net } from 'electron' import type { Response } from 'express' +import { reasoningCache } from './cache' + const logger = loggerService.withContext('UnifiedMessagesService') const MAGIC_STRING = 'skip_thought_signature_validator' @@ -154,8 +156,6 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage } } - // Build a map of tool_use_id -> toolName from all messages first - // This is needed because tool_result references tool_use from previous assistant messages const toolCallIdToName = new Map() for (const msg of params.messages) { if (Array.isArray(msg.content)) { @@ -227,13 +227,16 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage const assistantContent = [...reasoningParts, ...textParts, ...toolCallParts] if (assistantContent.length > 0) { let providerOptions: ProviderOptions | undefined = undefined - if (isGemini3ModelId(params.model)) { + if (reasoningCache.get('openrouter')) { + providerOptions = { + openrouter: { + reasoning_details: (reasoningCache.get('openrouter') as JSONValue[]) || [] + } + } + } else if (isGemini3ModelId(params.model)) { providerOptions = { google: { thoughtSignature: MAGIC_STRING - }, - openrouter: { - reasoning_details: [] } } } @@ -367,6 +370,7 @@ export async function streamUnifiedMessages(config: UnifiedStreamConfig): Promis middlewares, plugins, onEvent: (event) => { + logger.silly('Streaming event', { eventType: event.type }) const sseData = formatSSEEvent(event) response.write(sseData) } @@ -380,22 +384,6 @@ export async function streamUnifiedMessages(config: UnifiedStreamConfig): Promis onComplete?.() } catch (error) { logger.error('Error in unified message stream', error as Error, { providerId: provider.id, modelId }) - - if (!response.writableEnded) { - try { - const errorMessage = error instanceof Error ? 
error.message : 'Unknown error' - response.write( - `event: error\ndata: ${JSON.stringify({ - type: 'error', - error: { type: 'api_error', message: errorMessage } - })}\n\n` - ) - response.end() - } catch { - // Response already ended - } - } - onError?.(error) throw error } diff --git a/src/main/services/agents/services/claudecode/claude-stream-state.ts b/src/main/services/agents/services/claudecode/claude-stream-state.ts index 30b5790c82..5266fda995 100644 --- a/src/main/services/agents/services/claudecode/claude-stream-state.ts +++ b/src/main/services/agents/services/claudecode/claude-stream-state.ts @@ -87,6 +87,7 @@ export class ClaudeStreamState { private pendingUsage: PendingUsageState = {} private pendingToolCalls = new Map() private stepActive = false + private _streamFinished = false constructor(options: ClaudeStreamStateOptions) { this.logger = loggerService.withContext('ClaudeStreamState') @@ -289,6 +290,16 @@ export class ClaudeStreamState { getNamespacedToolCallId(rawToolCallId: string): string { return buildNamespacedToolCallId(this.agentSessionId, rawToolCallId) } + + /** Marks the stream as finished (either completed or errored). */ + markFinished(): void { + this._streamFinished = true + } + + /** Returns true if the stream has already emitted a terminal event. */ + isFinished(): boolean { + return this._streamFinished + } } export type { PendingToolCall } diff --git a/src/main/services/agents/services/claudecode/index.ts b/src/main/services/agents/services/claudecode/index.ts index 261ff7c07e..00a395c751 100644 --- a/src/main/services/agents/services/claudecode/index.ts +++ b/src/main/services/agents/services/claudecode/index.ts @@ -529,6 +529,19 @@ class ClaudeCodeService implements AgentServiceInterface { return } + // Skip emitting error if stream already finished (error was handled via result message) + if (streamState.isFinished()) { + logger.debug('SDK process exited after stream finished, skipping duplicate error event', { + duration, + error: errorObj instanceof Error ? { name: errorObj.name, message: errorObj.message } : String(errorObj) + }) + // Still emit complete to signal stream end + stream.emit('data', { + type: 'complete' + }) + return + } + errorChunks.push(errorObj instanceof Error ? errorObj.message : String(errorObj)) const errorMessage = errorChunks.join('\n\n') logger.error('SDK query failed', { diff --git a/src/main/services/agents/services/claudecode/transform.ts b/src/main/services/agents/services/claudecode/transform.ts index fa0c615648..094076e500 100644 --- a/src/main/services/agents/services/claudecode/transform.ts +++ b/src/main/services/agents/services/claudecode/transform.ts @@ -121,7 +121,7 @@ export function transformSDKMessageToStreamParts(sdkMessage: SDKMessage, state: case 'system': return handleSystemMessage(sdkMessage) case 'result': - return handleResultMessage(sdkMessage) + return handleResultMessage(sdkMessage, state) default: logger.warn('Unknown SDKMessage type', { type: (sdkMessage as any).type }) return [] @@ -707,7 +707,13 @@ function handleSystemMessage(message: Extract): * Successful runs yield a `finish` frame with aggregated usage metrics, while * failures are surfaced as `error` frames. 
*/
-function handleResultMessage(message: Extract<SDKMessage, { type: 'result' }>): AgentStreamPart[] {
+function handleResultMessage(
+  message: Extract<SDKMessage, { type: 'result' }>,
+  state: ClaudeStreamState
+): AgentStreamPart[] {
+  // Mark stream as finished to prevent duplicate error events when SDK process exits
+  state.markFinished()
+
   const chunks: AgentStreamPart[] = []
 
   let usage: LanguageModelUsage | undefined
@@ -719,26 +725,33 @@ function handleResultMessage(message: Extract):
     }
   }
 
-  if (message.subtype === 'success') {
-    chunks.push({
-      type: 'finish',
-      totalUsage: usage ?? emptyUsage,
-      finishReason: mapClaudeCodeFinishReason(message.subtype),
-      providerMetadata: {
-        ...sdkMessageToProviderMetadata(message),
-        usage: message.usage,
-        durationMs: message.duration_ms,
-        costUsd: message.total_cost_usd,
-        raw: message
-      }
-    } as AgentStreamPart)
-  } else {
+  chunks.push({
+    type: 'finish',
+    totalUsage: usage ?? emptyUsage,
+    finishReason: mapClaudeCodeFinishReason(message.subtype),
+    providerMetadata: {
+      ...sdkMessageToProviderMetadata(message),
+      usage: message.usage,
+      durationMs: message.duration_ms,
+      costUsd: message.total_cost_usd,
+      raw: message
+    }
+  } as AgentStreamPart)
+  if (message.subtype !== 'success') {
     chunks.push({
       type: 'error',
       error: {
         message: `${message.subtype}: Process failed after ${message.num_turns} turns`
       }
     } as AgentStreamPart)
+  } else {
+    if (message.is_error) {
+      const errorMatch = message.result.match(/\{.*\}/)
+      if (errorMatch) {
+        const errorDetail = JSON.parse(errorMatch[0])
+        chunks.push(errorDetail)
+      }
+    }
   }
 
   return chunks
 }

From 9d34098a5342b6f350f45695cf1a9363fad6f139 Mon Sep 17 00:00:00 2001
From: suyao
Date: Fri, 28 Nov 2025 13:36:29 +0800
Subject: [PATCH 17/53] feat: enhance provider configuration and error handling
 for AI SDK integration

---
 packages/shared/provider/constant.ts          | 26 +++++++
 packages/shared/provider/sdk-config.ts        | 12 +++-
 src/main/apiServer/services/messages.ts       | 37 +++++++++-
 .../apiServer/services/unified-messages.ts    | 70 ++++++++++++++++++-
 src/renderer/src/aiCore/provider/constants.ts | 26 +------
 5 files changed, 142 insertions(+), 29 deletions(-)
 create mode 100644 packages/shared/provider/constant.ts

diff --git a/packages/shared/provider/constant.ts b/packages/shared/provider/constant.ts
new file mode 100644
index 0000000000..fe47d6dcce
--- /dev/null
+++ b/packages/shared/provider/constant.ts
@@ -0,0 +1,26 @@
+import { getLowerBaseModelName } from '@shared/utils/naming'
+
+import type { MinimalModel } from './types'
+
+export const COPILOT_EDITOR_VERSION = 'vscode/1.104.1'
+export const COPILOT_PLUGIN_VERSION = 'copilot-chat/0.26.7'
+export const COPILOT_INTEGRATION_ID = 'vscode-chat'
+export const COPILOT_USER_AGENT = 'GitHubCopilotChat/0.26.7'
+
+export const COPILOT_DEFAULT_HEADERS = {
+  'Copilot-Integration-Id': COPILOT_INTEGRATION_ID,
+  'User-Agent': COPILOT_USER_AGENT,
+  'Editor-Version': COPILOT_EDITOR_VERSION,
+  'Editor-Plugin-Version': COPILOT_PLUGIN_VERSION,
+  'editor-version': COPILOT_EDITOR_VERSION,
+  'editor-plugin-version': COPILOT_PLUGIN_VERSION,
+  'copilot-vision-request': 'true'
+} as const
+
+// Models that require the OpenAI Responses endpoint when routed through GitHub Copilot (#10560)
+const COPILOT_RESPONSES_MODEL_IDS = ['gpt-5-codex']
+
+export function isCopilotResponsesModel<M extends MinimalModel>(model: M): boolean {
+  const normalizedId = getLowerBaseModelName(model.id)
+  return COPILOT_RESPONSES_MODEL_IDS.some((target) => normalizedId === target)
+}
diff --git a/packages/shared/provider/sdk-config.ts b/packages/shared/provider/sdk-config.ts
index
a03b3b1417..e520cb6350 100644
--- a/packages/shared/provider/sdk-config.ts
+++ b/packages/shared/provider/sdk-config.ts
@@ -127,7 +127,7 @@ export function providerToAiSdkConfig(
   if (provider.id === SystemProviderIds.copilot) {
     const defaultHeaders = context.getCopilotDefaultHeaders?.() ?? {}
     const storedHeaders = context.getCopilotStoredHeaders?.() ?? {}
-    const options = ProviderConfigFactory.fromProvider('github-copilot-openai-compatible', baseConfig, {
+    const copilotExtraOptions: Record<string, unknown> = {
       headers: {
         ...defaultHeaders,
         ...storedHeaders,
@@ -135,7 +135,15 @@
       },
       name: provider.id,
       includeUsage: true
-    })
+    }
+    if (context.fetch) {
+      copilotExtraOptions.fetch = context.fetch
+    }
+    const options = ProviderConfigFactory.fromProvider(
+      'github-copilot-openai-compatible',
+      baseConfig,
+      copilotExtraOptions
+    )
 
     return {
       providerId: 'github-copilot-openai-compatible',
diff --git a/src/main/apiServer/services/messages.ts b/src/main/apiServer/services/messages.ts
index 3277378266..e2c9ad24e2 100644
--- a/src/main/apiServer/services/messages.ts
+++ b/src/main/apiServer/services/messages.ts
@@ -4,7 +4,7 @@ import { loggerService } from '@logger'
 import anthropicService from '@main/services/AnthropicService'
 import { buildClaudeCodeSystemMessage, getSdkClient } from '@shared/anthropic'
 import type { Provider } from '@types'
-import { APICallError } from 'ai'
+import { APICallError, RetryError } from 'ai'
 import { net } from 'electron'
 import type { Response } from 'express'
 
@@ -267,6 +267,41 @@ export class MessagesService {
       500: 'internal_server_error'
     }
 
+    // Handle AI SDK RetryError - extract the last error for better error messages
+    if (RetryError.isInstance(error)) {
+      const lastError = error.lastError
+      // If the last error is an APICallError, extract its details
+      if (APICallError.isInstance(lastError)) {
+        statusCode = lastError.statusCode || 502
+        errorMessage = lastError.message
+        return {
+          statusCode,
+          errorResponse: {
+            type: 'error',
+            error: {
+              type: errorMap[statusCode] || 'api_error',
+              message: `${error.reason}: ${errorMessage}`,
+              requestId: lastError.name
+            }
+          }
+        }
+      }
+      // Fallback for other retry errors
+      errorMessage = error.message
+      statusCode = 502
+      return {
+        statusCode,
+        errorResponse: {
+          type: 'error',
+          error: {
+            type: 'api_error',
+            message: errorMessage,
+            requestId: error.name
+          }
+        }
+      }
+    }
+
     if (APICallError.isInstance(error)) {
       statusCode = error.statusCode
       errorMessage = error.message
diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts
index 5cd59377f6..51751202dd 100644
--- a/src/main/apiServer/services/unified-messages.ts
+++ b/src/main/apiServer/services/unified-messages.ts
@@ -9,6 +9,8 @@ import type {
 import { type AiPlugin, createExecutor } from '@cherrystudio/ai-core'
 import { createProvider as createProviderCore } from '@cherrystudio/ai-core/provider'
 import { loggerService } from '@logger'
+import anthropicService from '@main/services/AnthropicService'
+import copilotService from '@main/services/CopilotService'
 import { reduxService } from '@main/services/ReduxService'
@@ -21,6 +23,7 @@ import {
   providerToAiSdkConfig as sharedProviderToAiSdkConfig,
   resolveActualProvider
 } from '@shared/provider'
+import { COPILOT_DEFAULT_HEADERS } from '@shared/provider/constant'
 import { defaultAppHeaders } from
'@shared/utils'
 import type { Provider } from '@types'
 import type { ImagePart, JSONValue, ModelMessage, Provider as AiSdkProvider, TextPart, Tool } from 'ai'
@@ -284,6 +287,68 @@ async function createAiSdkProvider(config: AiSdkConfig): Promise
   return provider
 }
 
+/**
+ * Prepare special provider configuration for providers that need dynamic tokens
+ * Similar to renderer's prepareSpecialProviderConfig
+ */
+async function prepareSpecialProviderConfig(provider: Provider, config: AiSdkConfig): Promise<AiSdkConfig> {
+  switch (provider.id) {
+    case 'copilot': {
+      const storedHeaders =
+        ((await reduxService.select('state.copilot.defaultHeaders')) as Record<string, string> | null) ?? {}
+      const headers: Record<string, string> = {
+        ...COPILOT_DEFAULT_HEADERS,
+        ...storedHeaders
+      }
+
+      try {
+        const { token } = await copilotService.getToken(null as any, headers)
+        config.options.apiKey = token
+        const existingHeaders = (config.options.headers as Record<string, string> | undefined) ?? {}
+        config.options.headers = {
+          ...headers,
+          ...existingHeaders
+        }
+        logger.debug('Copilot token retrieved successfully')
+      } catch (error) {
+        logger.error('Failed to get Copilot token', error as Error)
+        throw new Error('Failed to get Copilot token. Please re-authorize Copilot.')
+      }
+      break
+    }
+    case 'anthropic': {
+      if (provider.authType === 'oauth') {
+        try {
+          const oauthToken = await anthropicService.getValidAccessToken()
+          if (!oauthToken) {
+            throw new Error('Anthropic OAuth token not available. Please re-authorize.')
+          }
+          config.options = {
+            ...config.options,
+            headers: {
+              ...(config.options.headers ? config.options.headers : {}),
+              'Content-Type': 'application/json',
+              'anthropic-version': '2023-06-01',
+              'anthropic-beta': 'oauth-2025-04-20',
+              Authorization: `Bearer ${oauthToken}`
+            },
+            baseURL: 'https://api.anthropic.com/v1',
+            apiKey: ''
+          }
+          logger.debug('Anthropic OAuth token retrieved successfully')
+        } catch (error) {
+          logger.error('Failed to get Anthropic OAuth token', error as Error)
+          throw new Error('Failed to get Anthropic OAuth token.
Please re-authorize.')
+        }
+      }
+      break
+    }
+    // Note: cherryai requires request-level signing which is not easily supported here
+    // It would need custom fetch implementation similar to renderer
+  }
+  return config
+}
+
 /**
  * Core stream execution function - single source of truth for AI SDK calls
  */
@@ -291,7 +356,10 @@ async function executeStream(config: ExecuteStreamConfig): Promise
      normalizedId === target || normalizedName === target)
-}
+export { COPILOT_DEFAULT_HEADERS, isCopilotResponsesModel } from '@shared/provider/constant'

From 534d27f37eff5c438534f2fb824e67843ee4da8e Mon Sep 17 00:00:00 2001
From: suyao
Date: Fri, 28 Nov 2025 13:37:43 +0800
Subject: [PATCH 18/53] feat: add additional model IDs for OpenAI Responses
 endpoint in Copilot

---
 packages/shared/provider/constant.ts | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/packages/shared/provider/constant.ts b/packages/shared/provider/constant.ts
index fe47d6dcce..c449c9f635 100644
--- a/packages/shared/provider/constant.ts
+++ b/packages/shared/provider/constant.ts
@@ -18,7 +18,7 @@ export const COPILOT_DEFAULT_HEADERS = {
 } as const
 
 // Models that require the OpenAI Responses endpoint when routed through GitHub Copilot (#10560)
-const COPILOT_RESPONSES_MODEL_IDS = ['gpt-5-codex']
+const COPILOT_RESPONSES_MODEL_IDS = ['gpt-5-codex', 'gpt-5.1-codex', 'gpt-5.1-codex-mini']
 
 export function isCopilotResponsesModel<M extends MinimalModel>(model: M): boolean {
   const normalizedId = getLowerBaseModelName(model.id)
   return COPILOT_RESPONSES_MODEL_IDS.some((target) => normalizedId === target)
 }

From 95c18d192a948297258d9e868140c44c3e157300 Mon Sep 17 00:00:00 2001
From: suyao
Date: Fri, 28 Nov 2025 13:42:33 +0800
Subject: [PATCH 19/53] feat: add reasoning cache support to AiSdkToAnthropicSSE
 and update unified-messages integration

---
 packages/shared/adapters/AiSdkToAnthropicSSE.ts | 17 +++++++++++++++--
 src/main/apiServer/services/unified-messages.ts |  3 ++-
 src/renderer/src/aiCore/provider/constants.ts   |  2 +-
 3 files changed, 18 insertions(+), 4 deletions(-)

diff --git a/packages/shared/adapters/AiSdkToAnthropicSSE.ts b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
index 9b23638f48..08d45a09d7 100644
--- a/packages/shared/adapters/AiSdkToAnthropicSSE.ts
+++ b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
@@ -36,7 +36,6 @@ import type {
   Usage
 } from '@anthropic-ai/sdk/resources/messages'
 import { loggerService } from '@logger'
-import { reasoningCache } from '@main/apiServer/services/cache'
 import { type FinishReason, type LanguageModelUsage, type TextStreamPart, type ToolSet } from 'ai'
 
 const logger = loggerService.withContext('AiSdkToAnthropicSSE')
@@ -71,11 +70,22 @@ interface AdapterState {
 
 export type SSEEventCallback = (event: RawMessageStreamEvent) => void
 
+/**
+ * Interface for a simple cache that stores reasoning details
+ */
+export interface ReasoningCacheInterface {
+  set(signature: string, details: unknown[]): void
+}
+
 export interface AiSdkToAnthropicSSEOptions {
   model: string
   messageId?: string
   inputTokens?: number
   onEvent: SSEEventCallback
+  /**
+   * Optional cache for storing reasoning details from providers like OpenRouter
+   */
+  reasoningCache?: ReasoningCacheInterface
 }
 
 /**
@@ -84,9 +94,11 @@ export class AiSdkToAnthropicSSE {
   private state: AdapterState
   private onEvent: SSEEventCallback
+  private reasoningCache?: ReasoningCacheInterface
 
   constructor(options: AiSdkToAnthropicSSEOptions) {
     this.onEvent = options.onEvent
+    this.reasoningCache = options.reasoningCache
     this.state = {
       messageId: options.messageId ||
`msg_${Date.now()}_${Math.random().toString(36).substring(2, 11)}`, model: options.model, @@ -194,10 +206,11 @@ export class AiSdkToAnthropicSSE { case 'finish-step': if ( + this.reasoningCache && chunk.providerMetadata?.openrouter?.reasoning_details && Array.isArray(chunk.providerMetadata.openrouter.reasoning_details) ) { - reasoningCache.set('openrouter', chunk.providerMetadata?.openrouter?.reasoning_details) + this.reasoningCache.set('openrouter', chunk.providerMetadata.openrouter.reasoning_details) } if (chunk.finishReason === 'tool-calls') { this.state.stopReason = 'tool_use' diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts index 51751202dd..298131460f 100644 --- a/src/main/apiServer/services/unified-messages.ts +++ b/src/main/apiServer/services/unified-messages.ts @@ -387,7 +387,8 @@ async function executeStream(config: ExecuteStreamConfig): Promise {}) + onEvent: onEvent || (() => {}), + reasoningCache }) // Execute stream - pass model object instead of string diff --git a/src/renderer/src/aiCore/provider/constants.ts b/src/renderer/src/aiCore/provider/constants.ts index 67cde7894d..57dad9fbc0 100644 --- a/src/renderer/src/aiCore/provider/constants.ts +++ b/src/renderer/src/aiCore/provider/constants.ts @@ -1 +1 @@ -export { COPILOT_DEFAULT_HEADERS, isCopilotResponsesModel } from '@shared/provider/constant' +export { COPILOT_DEFAULT_HEADERS, COPILOT_EDITOR_VERSION, isCopilotResponsesModel } from '@shared/provider/constant' From ed769ac4f7a96c4507e6d1002ef2e6a2e3c69517 Mon Sep 17 00:00:00 2001 From: suyao Date: Fri, 28 Nov 2025 15:48:50 +0800 Subject: [PATCH 20/53] feat: add CherryAI signed fetch wrapper and enhance tool conversion to Zod schema --- packages/shared/provider/sdk-config.ts | 15 +- .../apiServer/services/unified-messages.ts | 144 ++++++++++++++++-- 2 files changed, 147 insertions(+), 12 deletions(-) diff --git a/packages/shared/provider/sdk-config.ts b/packages/shared/provider/sdk-config.ts index e520cb6350..91b3c8d54e 100644 --- a/packages/shared/provider/sdk-config.ts +++ b/packages/shared/provider/sdk-config.ts @@ -88,6 +88,12 @@ export interface AiSdkConfigContext { * Renderer process: use browser fetch (default) */ fetch?: typeof globalThis.fetch + + /** + * Get CherryAI signed fetch wrapper + * Returns a fetch function that adds signature headers to requests + */ + getCherryAISignedFetch?: () => typeof globalThis.fetch } /** @@ -220,8 +226,13 @@ export function providerToAiSdkConfig( } } - // Inject custom fetch if provided - if (context.fetch) { + // Handle cherryai signed fetch + if (provider.id === 'cherryai') { + const signedFetch = context.getCherryAISignedFetch?.() + if (signedFetch) { + extraOptions.fetch = signedFetch + } + } else if (context.fetch) { extraOptions.fetch = context.fetch } diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts index 298131460f..063885d72c 100644 --- a/src/main/apiServer/services/unified-messages.ts +++ b/src/main/apiServer/services/unified-messages.ts @@ -9,6 +9,7 @@ import type { import { type AiPlugin, createExecutor } from '@cherrystudio/ai-core' import { createProvider as createProviderCore } from '@cherrystudio/ai-core/provider' import { loggerService } from '@logger' +import { generateSignature as cherryaiGenerateSignature } from '@main/integration/cherryai' import anthropicService from '@main/services/AnthropicService' import copilotService from '@main/services/CopilotService' import { reduxService } 
from '@main/services/ReduxService'
@@ -26,10 +27,11 @@ import {
 import { COPILOT_DEFAULT_HEADERS } from '@shared/provider/constant'
 import { defaultAppHeaders } from '@shared/utils'
 import type { Provider } from '@types'
-import type { ImagePart, JSONValue, ModelMessage, Provider as AiSdkProvider, TextPart, Tool } from 'ai'
-import { jsonSchema, simulateStreamingMiddleware, stepCountIs, tool, wrapLanguageModel } from 'ai'
+import type { ImagePart, JSONValue, ModelMessage, Provider as AiSdkProvider, TextPart, Tool as AiSdkTool } from 'ai'
+import { simulateStreamingMiddleware, stepCountIs, tool, wrapLanguageModel, zodSchema } from 'ai'
 import { net } from 'electron'
 import type { Response } from 'express'
+import * as z from 'zod'
 
 import { reasoningCache } from './cache'
 
@@ -124,19 +126,119 @@ function convertAnthropicToolResultToAiSdk(
   return { type: 'content', value: values }
 }
 
-function convertAnthropicToolsToAiSdk(tools: MessageCreateParams['tools']): Record<string, Tool> | undefined {
+// Type alias for JSON Schema (compatible with recursive calls)
+type JsonSchemaLike = AnthropicTool.InputSchema | Record<string, unknown>
+
+/**
+ * Convert JSON Schema to Zod schema
+ * This avoids non-standard fields like input_examples that Anthropic doesn't support
+ */
+function jsonSchemaToZod(schema: JsonSchemaLike): z.ZodTypeAny {
+  const s = schema as Record<string, unknown>
+  const schemaType = s.type as string | string[] | undefined
+  const enumValues = s.enum as unknown[] | undefined
+  const description = s.description as string | undefined
+
+  // Handle enum first
+  if (enumValues && Array.isArray(enumValues) && enumValues.length > 0) {
+    if (enumValues.every((v) => typeof v === 'string')) {
+      const zodEnum = z.enum(enumValues as [string, ...string[]])
+      return description ? zodEnum.describe(description) : zodEnum
+    }
+    // For non-string enums, use union of literals
+    const literals = enumValues.map((v) => z.literal(v as string | number | boolean))
+    if (literals.length === 1) {
+      return description ? literals[0].describe(description) : literals[0]
+    }
+    const zodUnion = z.union(literals as unknown as [z.ZodTypeAny, z.ZodTypeAny, ...z.ZodTypeAny[]])
+    return description ? zodUnion.describe(description) : zodUnion
+  }
+
+  // Handle union types (type: ["string", "null"])
+  if (Array.isArray(schemaType)) {
+    const schemas = schemaType.map((t) => jsonSchemaToZod({ ...s, type: t, enum: undefined }))
+    if (schemas.length === 1) {
+      return schemas[0]
+    }
+    return z.union(schemas as [z.ZodTypeAny, z.ZodTypeAny, ...z.ZodTypeAny[]])
+  }
+
+  // Handle by type
+  switch (schemaType) {
+    case 'string': {
+      let zodString = z.string()
+      if (typeof s.minLength === 'number') zodString = zodString.min(s.minLength)
+      if (typeof s.maxLength === 'number') zodString = zodString.max(s.maxLength)
+      if (typeof s.pattern === 'string') zodString = zodString.regex(new RegExp(s.pattern))
+      return description ? zodString.describe(description) : zodString
+    }
+
+    case 'number':
+    case 'integer': {
+      let zodNumber = schemaType === 'integer' ? z.number().int() : z.number()
+      if (typeof s.minimum === 'number') zodNumber = zodNumber.min(s.minimum)
+      if (typeof s.maximum === 'number') zodNumber = zodNumber.max(s.maximum)
+      return description ? zodNumber.describe(description) : zodNumber
+    }
+
+    case 'boolean': {
+      const zodBoolean = z.boolean()
+      return description ? zodBoolean.describe(description) : zodBoolean
+    }
+
+    case 'null':
+      return z.null()
+
+    case 'array': {
+      const items = s.items as Record<string, unknown> | undefined
+      let zodArray = items ?
z.array(jsonSchemaToZod(items)) : z.array(z.unknown())
+      if (typeof s.minItems === 'number') zodArray = zodArray.min(s.minItems)
+      if (typeof s.maxItems === 'number') zodArray = zodArray.max(s.maxItems)
+      return description ? zodArray.describe(description) : zodArray
+    }
+
+    case 'object': {
+      const properties = s.properties as Record<string, Record<string, unknown>> | undefined
+      const required = (s.required as string[]) || []
+
+      // Always use z.object() to ensure "properties" field is present in output schema
+      // OpenAI requires explicit properties field even for empty objects
+      const shape: Record<string, z.ZodTypeAny> = {}
+      if (properties) {
+        for (const [key, propSchema] of Object.entries(properties)) {
+          const zodProp = jsonSchemaToZod(propSchema)
+          shape[key] = required.includes(key) ? zodProp : zodProp.optional()
+        }
+      }
+
+      const zodObject = z.object(shape)
+      return description ? zodObject.describe(description) : zodObject
+    }
+
+    default:
+      // Unknown type, use z.unknown()
+      return z.unknown()
+  }
+}
+
+function convertAnthropicToolsToAiSdk(tools: MessageCreateParams['tools']): Record<string, AiSdkTool> | undefined {
   if (!tools || tools.length === 0) return undefined
 
-  const aiSdkTools: Record<string, Tool> = {}
+  const aiSdkTools: Record<string, AiSdkTool> = {}
 
   for (const anthropicTool of tools) {
     if (anthropicTool.type === 'bash_20250124') continue
 
     const toolDef = anthropicTool as AnthropicTool
-    const parameters = toolDef.input_schema as Parameters<typeof jsonSchema>[0]
-    aiSdkTools[toolDef.name] = tool({
+    const rawSchema = toolDef.input_schema
+    const schema = jsonSchemaToZod(rawSchema)
+
+    // Use tool() with inputSchema (AI SDK v5 API)
+    const aiTool = tool({
       description: toolDef.description || '',
-      inputSchema: jsonSchema(parameters),
-      execute: async (input: Record<string, unknown>) => input
+      inputSchema: zodSchema(schema)
     })
+
+    logger.debug('Converted Anthropic tool to AI SDK tool', aiTool)
+    aiSdkTools[toolDef.name] = aiTool
   }
   return Object.keys(aiSdkTools).length > 0 ?
aiSdkTools : undefined
 }
@@ -343,8 +445,30 @@ async function prepareSpecialProviderConfig(provider: Provider, config: AiSdkCon
       }
       break
     }
-    // Note: cherryai requires request-level signing which is not easily supported here
-    // It would need custom fetch implementation similar to renderer
+    case 'cherryai': {
+      // Create a signed fetch wrapper for cherryai
+      const baseFetch = net.fetch as typeof globalThis.fetch
+      config.options.fetch = async (url: RequestInfo | URL, options?: RequestInit) => {
+        if (!options?.body) {
+          return baseFetch(url, options)
+        }
+        const signature = cherryaiGenerateSignature({
+          method: 'POST',
+          path: '/chat/completions',
+          query: '',
+          body: JSON.parse(options.body as string)
+        })
+        return baseFetch(url, {
+          ...options,
+          headers: {
+            ...(options.headers as Record<string, string>),
+            ...signature
+          }
+        })
+      }
+      logger.debug('CherryAI signed fetch configured')
+      break
+    }
   }
   return config
 }

From e8dccf51feab167102e9358e48d2067d2a722a22 Mon Sep 17 00:00:00 2001
From: suyao
Date: Fri, 28 Nov 2025 16:37:58 +0800
Subject: [PATCH 21/53] feat: enhance reasoning cache integration and update
 provider options in unified messages

---
 .../shared/adapters/AiSdkToAnthropicSSE.ts    | 26 +++++++++++--------
 src/main/apiServer/services/cache.ts          | 21 +++++-----------
 .../apiServer/services/unified-messages.ts    | 15 ++++++++++-
 3 files changed, 35 insertions(+), 27 deletions(-)

diff --git a/packages/shared/adapters/AiSdkToAnthropicSSE.ts b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
index 08d45a09d7..a9f1508a6a 100644
--- a/packages/shared/adapters/AiSdkToAnthropicSSE.ts
+++ b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
@@ -36,6 +36,8 @@ import type {
   Usage
 } from '@anthropic-ai/sdk/resources/messages'
 import { loggerService } from '@logger'
+import { reasoningCache } from '@main/apiServer/services/cache'
+import type { JSONValue } from 'ai'
 import { type FinishReason, type LanguageModelUsage, type TextStreamPart, type ToolSet } from 'ai'
 
 const logger = loggerService.withContext('AiSdkToAnthropicSSE')
@@ -74,7 +76,7 @@ export type SSEEventCallback = (event: RawMessageStreamEvent) => void
  * Interface for a simple cache that stores reasoning details
  */
 export interface ReasoningCacheInterface {
-  set(signature: string, details: unknown[]): void
+  set(signature: string, details: JSONValue): void
 }
 
 export interface AiSdkToAnthropicSSEOptions {
@@ -82,9 +84,6 @@ export interface AiSdkToAnthropicSSEOptions {
   messageId?: string
   inputTokens?: number
   onEvent: SSEEventCallback
-  /**
-   * Optional cache for storing reasoning details from providers like OpenRouter
-   */
   reasoningCache?: ReasoningCacheInterface
 }
 
@@ -186,6 +185,17 @@ export class AiSdkToAnthropicSSE {
     // === Tool Events ===
 
     case 'tool-call':
+        if (this.reasoningCache && chunk.providerMetadata?.google?.thoughtSignature) {
+          this.reasoningCache.set('google', chunk.providerMetadata?.google?.thoughtSignature)
+        }
+        // FIXME: bind by tool call id
+        if (
+          this.reasoningCache &&
+          chunk.providerMetadata?.openrouter?.reasoning_details &&
+          Array.isArray(chunk.providerMetadata.openrouter.reasoning_details)
+        ) {
+          this.reasoningCache.set('openrouter', chunk.providerMetadata.openrouter.reasoning_details)
+        }
         this.handleToolCall({
           type: 'tool-call',
           toolCallId: chunk.toolCallId,
@@ -205,13 +215,6 @@ export class AiSdkToAnthropicSSE {
         break
 
       case 'finish-step':
-        if (
-          this.reasoningCache &&
-          chunk.providerMetadata?.openrouter?.reasoning_details &&
-          Array.isArray(chunk.providerMetadata.openrouter.reasoning_details)
-        ) {
-
this.reasoningCache.set('openrouter', chunk.providerMetadata.openrouter.reasoning_details)
-        }
       if (chunk.finishReason === 'tool-calls') {
         this.state.stopReason = 'tool_use'
       }
@@ -552,6 +555,7 @@ export class AiSdkToAnthropicSSE {
     }
 
     this.onEvent(messageStopEvent)
+    reasoningCache.destroy()
   }
 
   /**
diff --git a/src/main/apiServer/services/cache.ts b/src/main/apiServer/services/cache.ts
index 765ab1e1b9..39dc5b1544 100644
--- a/src/main/apiServer/services/cache.ts
+++ b/src/main/apiServer/services/cache.ts
@@ -1,11 +1,12 @@
 import { loggerService } from '@logger'
+import type { JSONValue } from 'ai'
 
 const logger = loggerService.withContext('Cache')
 /**
  * Cache entry with TTL support
  */
 interface CacheEntry<T> {
-  details: T[]
+  details: T
   timestamp: number
 }
 
@@ -28,24 +29,19 @@ export class ReasoningCache {
   /**
    * Store reasoning details by signature
    */
-  set(signature: string, details: T[]): void {
-    if (!signature || !details.length) return
+  set(signature: string, details: T): void {
+    if (!signature || !details) return
 
     this.cache.set(signature, {
       details,
       timestamp: Date.now()
     })
-
-    logger.debug('Cached reasoning details', {
-      signature: signature.substring(0, 20) + '...',
-      detailsCount: details.length
-    })
   }
 
   /**
    * Retrieve reasoning details by signature
    */
-  get(signature: string): T[] | undefined {
+  get(signature: string): T | undefined {
     const entry = this.cache.get(signature)
     if (!entry) return undefined
 
@@ -55,11 +51,6 @@ export class ReasoningCache {
       return undefined
     }
 
-    logger.debug('Retrieved reasoning details from cache', {
-      signature: signature.substring(0, 20) + '...',
-      detailsCount: entry.details.length
-    })
-
     return entry.details
   }
 
@@ -113,4 +104,4 @@ export class ReasoningCache {
 }
 
 // Singleton cache instance
-export const reasoningCache = new ReasoningCache()
+export const reasoningCache = new ReasoningCache<JSONValue>()
diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts
index 063885d72c..af97941f2b 100644
--- a/src/main/apiServer/services/unified-messages.ts
+++ b/src/main/apiServer/services/unified-messages.ts
@@ -301,11 +301,24 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage
           imageParts.push({ type: 'image', image: source.url })
         }
       } else if (block.type === 'tool_use') {
+        const options: ProviderOptions = {}
+        if (isGemini3ModelId(params.model)) {
+          if (reasoningCache.get('google')) {
+            options.google = {
+              thoughtSignature: MAGIC_STRING
+            }
+          } else if (reasoningCache.get('openrouter')) {
+            options.openrouter = {
+              reasoning_details: (reasoningCache.get('openrouter') as JSONValue[]) || []
+            }
+          }
+        }
         toolCallParts.push({
           type: 'tool-call',
           toolName: block.name,
           toolCallId: block.id,
-          input: block.input
+          input: block.input,
+          providerOptions: options
         })
       } else if (block.type === 'tool_result') {
         // Look up toolName from the pre-built map (covers cross-message references)

From e255a992cccd1edc0ec11fce81c7272528ed9b07 Mon Sep 17 00:00:00 2001
From: suyao
Date: Sat, 29 Nov 2025 17:39:31 +0800
Subject: [PATCH 22/53] fix: type check

---
 packages/shared/adapters/AiSdkToAnthropicSSE.ts | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/packages/shared/adapters/AiSdkToAnthropicSSE.ts b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
index a9f1508a6a..c6e7555ea3 100644
--- a/packages/shared/adapters/AiSdkToAnthropicSSE.ts
+++ b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
@@ -36,7 +36,6 @@ import type {
   Usage
 } from '@anthropic-ai/sdk/resources/messages'
 import {
loggerService } from '@logger'
-import { reasoningCache } from '@main/apiServer/services/cache'
 import type { JSONValue } from 'ai'
 import { type FinishReason, type LanguageModelUsage, type TextStreamPart, type ToolSet } from 'ai'
 
@@ -77,6 +76,7 @@ export type SSEEventCallback = (event: RawMessageStreamEvent) => void
  */
 export interface ReasoningCacheInterface {
   set(signature: string, details: JSONValue): void
+  destroy?(): void
 }
 
 export interface AiSdkToAnthropicSSEOptions {
@@ -555,7 +555,7 @@ export class AiSdkToAnthropicSSE {
     }
 
     this.onEvent(messageStopEvent)
-    reasoningCache.destroy()
+    this.reasoningCache?.destroy?.()
   }
 
   /**

From 35cfc7c517ab9fa3de085bdb6a5f38282716919e Mon Sep 17 00:00:00 2001
From: suyao
Date: Sat, 29 Nov 2025 19:12:56 +0800
Subject: [PATCH 23/53] feat: add sanitizeToolsForAnthropic function to clean
 tool definitions for Anthropic API

---
 packages/shared/anthropic/index.ts      | 30 ++++++++++++++++++++++++-
 src/main/apiServer/services/messages.ts |  5 +++--
 2 files changed, 32 insertions(+), 3 deletions(-)

diff --git a/packages/shared/anthropic/index.ts b/packages/shared/anthropic/index.ts
index 2444ad6113..e2113eb749 100644
--- a/packages/shared/anthropic/index.ts
+++ b/packages/shared/anthropic/index.ts
@@ -9,7 +9,7 @@
  */
 
 import Anthropic from '@anthropic-ai/sdk'
-import type { TextBlockParam } from '@anthropic-ai/sdk/resources'
+import type { MessageCreateParams, TextBlockParam, Tool as AnthropicTool } from '@anthropic-ai/sdk/resources'
 import { loggerService } from '@logger'
 import type { Provider } from '@types'
 import type { ModelMessage } from 'ai'
@@ -193,3 +193,31 @@ export function buildClaudeCodeSystemModelMessage(system?: string | Array<TextBlockParam>
+
+/**
+ * Sanitize tool definitions for the Anthropic API by stripping non-standard
+ * fields (such as input_examples) that the API does not accept.
+ */
+export function sanitizeToolsForAnthropic(tools: MessageCreateParams['tools']): MessageCreateParams['tools'] {
+  if (!tools) return tools
+
+  return tools.map((tool) => {
+    if ('type' in tool && tool.type !== 'custom') return tool
+
+    // oxlint-disable-next-line no-unused-vars
+    const { input_examples, ...sanitizedTool } = tool as AnthropicTool & { input_examples?: unknown }
+
+    return sanitizedTool as typeof tool
+  })
+}
diff --git a/src/main/apiServer/services/messages.ts b/src/main/apiServer/services/messages.ts
index e2c9ad24e2..957c066520 100644
--- a/src/main/apiServer/services/messages.ts
+++ b/src/main/apiServer/services/messages.ts
@@ -2,7 +2,7 @@ import type Anthropic from '@anthropic-ai/sdk'
 import type { MessageCreateParams, MessageStreamEvent } from '@anthropic-ai/sdk/resources'
 import { loggerService } from '@logger'
 import anthropicService from '@main/services/AnthropicService'
-import { buildClaudeCodeSystemMessage, getSdkClient } from '@shared/anthropic'
+import { buildClaudeCodeSystemMessage, getSdkClient, sanitizeToolsForAnthropic } from '@shared/anthropic'
 import type { Provider } from '@types'
 import { APICallError, RetryError } from 'ai'
 import { net } from 'electron'
@@ -148,7 +148,8 @@ export class MessagesService {
   createAnthropicRequest(request: MessageCreateParams, provider: Provider, modelId?: string): MessageCreateParams {
     const anthropicRequest: MessageCreateParams = {
       ...request,
-      stream: !!request.stream
+      stream: !!request.stream,
+      tools: sanitizeToolsForAnthropic(request.tools)
     }
 
     // Override model if provided

From 3989229f611268a129d3c9e26cbb01b637a12abc Mon Sep 17 00:00:00 2001
From: suyao
Date: Sun, 30 Nov 2025 07:10:10 +0800
Subject: [PATCH 24/53] feat: enhance API version handling and cache
 functionality

- Updated reasoning cache to use tool-specific keys for better organization.
- Added methods to list cache keys and entries.
- Improved API version regex patterns for more accurate matching.
- Refactored API host formatting to handle leading/trailing whitespace and slashes.
- Added functions to extract and remove trailing API version segments from URLs.
---
 .../shared/adapters/AiSdkToAnthropicSSE.ts    |  3 +-
 packages/shared/api/index.ts                  | 86 +++++++++++++++++--
 src/main/apiServer/services/cache.ts          | 12 +++
 .../apiServer/services/unified-messages.ts    | 18 +---
 4 files changed, 92 insertions(+), 27 deletions(-)

diff --git a/packages/shared/adapters/AiSdkToAnthropicSSE.ts b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
index c6e7555ea3..c4f2355c0a 100644
--- a/packages/shared/adapters/AiSdkToAnthropicSSE.ts
+++ b/packages/shared/adapters/AiSdkToAnthropicSSE.ts
@@ -186,7 +186,7 @@ export class AiSdkToAnthropicSSE {
     // === Tool Events ===
     case 'tool-call':
       if (this.reasoningCache && chunk.providerMetadata?.google?.thoughtSignature) {
-        this.reasoningCache.set('google', chunk.providerMetadata?.google?.thoughtSignature)
+        this.reasoningCache.set(`google-${chunk.toolName}`, chunk.providerMetadata?.google?.thoughtSignature)
       }
       // FIXME: bind by tool call id
       if (
@@ -555,7 +555,6 @@ export class AiSdkToAnthropicSSE {
     }
 
     this.onEvent(messageStopEvent)
-    this.reasoningCache?.destroy?.()
   }
 
   /**
diff --git a/packages/shared/api/index.ts b/packages/shared/api/index.ts
index 5ee19611d8..2e85c11c36 100644
--- a/packages/shared/api/index.ts
+++ b/packages/shared/api/index.ts
@@ -27,18 +27,35 @@ export function withoutTrailingSlash(url: T): T {
 }
 
 /**
- * Checks if the host path contains a version string (e.g., /v1, /v2beta).
+ * Matches a version segment in a path that starts with `/v` and optionally
+ * continues with `alpha` or `beta`. The segment may be followed by `/` or the end
+ * of the string (useful for cases like `/v3alpha/resources`).
+ */
+const VERSION_REGEX_PATTERN = '\\/v\\d+(?:alpha|beta)?(?=\\/|$)'
+
+/**
+ * Matches an API version at the end of a URL (with optional trailing slash).
+ * Used to detect and extract versions only from the trailing position.
+ */
+const TRAILING_VERSION_REGEX = /\/v\d+(?:alpha|beta)?\/?$/i
+
+/**
+ * Checks whether the host's path contains a version-like segment (e.g. /v1, /v2beta).
+ *
+ * @param host - The host or path string to check
+ * @returns true if the path contains a version segment, false otherwise
 */
 export function hasAPIVersion(host?: string): boolean {
   if (!host) return false
-  const versionRegex = /\/v\d+(?:alpha|beta)?(?=\/|$)/i
+  const regex = new RegExp(VERSION_REGEX_PATTERN, 'i')
 
   try {
     const url = new URL(host)
-    return versionRegex.test(url.pathname)
+    return regex.test(url.pathname)
   } catch {
-    return versionRegex.test(host)
+    // If the host cannot be parsed as a full URL, test it directly as a path
+    return regex.test(host)
   }
 }
@@ -71,22 +88,26 @@ export function formatVertexApiHost(
 /**
  * Formats an API host URL by normalizing it and optionally appending an API version.
  *
- * @param host - The API host URL to format
- * @param isSupportedAPIVersion - Whether the API version is supported. Defaults to `true`.
+ * @param host - The API host URL to format. Leading/trailing whitespace will be trimmed and trailing slashes removed.
+ * @param supportApiVersion - Whether the API version is supported. Defaults to `true`.
  * @param apiVersion - The API version to append if needed. Defaults to `'v1'`.
 *
+ * @returns The formatted API host URL. If the host is empty after normalization, returns an empty string.
+ * If the host ends with '#', API version is not supported, or the host already contains a version, returns the normalized host as-is.
+ * Otherwise, returns the host with the API version appended.
+ * * @example * formatApiHost('https://api.example.com/') // Returns 'https://api.example.com/v1' * formatApiHost('https://api.example.com#') // Returns 'https://api.example.com#' * formatApiHost('https://api.example.com/v2', true, 'v1') // Returns 'https://api.example.com/v2' */ -export function formatApiHost(host?: string, isSupportedAPIVersion: boolean = true, apiVersion: string = 'v1'): string { - const normalizedHost = withoutTrailingSlash((host || '').trim()) +export function formatApiHost(host?: string, supportApiVersion: boolean = true, apiVersion: string = 'v1'): string { + const normalizedHost = withoutTrailingSlash(trim(host)) if (!normalizedHost) { return '' } - if (normalizedHost.endsWith('#') || !isSupportedAPIVersion || hasAPIVersion(normalizedHost)) { + if (normalizedHost.endsWith('#') || !supportApiVersion || hasAPIVersion(normalizedHost)) { return normalizedHost } return `${normalizedHost}/${apiVersion}` @@ -175,3 +196,50 @@ export function validateApiHost(apiHost: string): boolean { return false } } + +/** + * Extracts the trailing API version segment from a URL path. + * + * This function extracts API version patterns (e.g., `v1`, `v2beta`) from the end of a URL. + * Only versions at the end of the path are extracted, not versions in the middle. + * The returned version string does not include leading or trailing slashes. + * + * @param {string} url - The URL string to parse. + * @returns {string | undefined} The trailing API version found (e.g., 'v1', 'v2beta'), or undefined if none found. + * + * @example + * getTrailingApiVersion('https://api.example.com/v1') // 'v1' + * getTrailingApiVersion('https://api.example.com/v2beta/') // 'v2beta' + * getTrailingApiVersion('https://api.example.com/v1/chat') // undefined (version not at end) + * getTrailingApiVersion('https://gateway.ai.cloudflare.com/v1/xxx/v1beta') // 'v1beta' + * getTrailingApiVersion('https://api.example.com') // undefined + */ +export function getTrailingApiVersion(url: string): string | undefined { + const match = url.match(TRAILING_VERSION_REGEX) + + if (match) { + // Extract version without leading slash and trailing slash + return match[0].replace(/^\//, '').replace(/\/$/, '') + } + + return undefined +} + +/** + * Removes the trailing API version segment from a URL path. + * + * This function removes API version patterns (e.g., `/v1`, `/v2beta`) from the end of a URL. + * Only versions at the end of the path are removed, not versions in the middle. + * + * @param {string} url - The URL string to process. + * @returns {string} The URL with the trailing API version removed, or the original URL if no trailing version found. 
+ *
+ * @example
+ * withoutTrailingApiVersion('https://api.example.com/v1') // 'https://api.example.com'
+ * withoutTrailingApiVersion('https://api.example.com/v2beta/') // 'https://api.example.com'
+ * withoutTrailingApiVersion('https://api.example.com/v1/chat') // 'https://api.example.com/v1/chat' (no change)
+ * withoutTrailingApiVersion('https://api.example.com') // 'https://api.example.com'
+ */
+export function withoutTrailingApiVersion(url: string): string {
+  return url.replace(TRAILING_VERSION_REGEX, '')
+}
diff --git a/src/main/apiServer/services/cache.ts b/src/main/apiServer/services/cache.ts
index 39dc5b1544..9515778e16 100644
--- a/src/main/apiServer/services/cache.ts
+++ b/src/main/apiServer/services/cache.ts
@@ -54,6 +54,18 @@ export class ReasoningCache {
     return entry.details
   }
 
+  listKeys(): string[] {
+    return Array.from(this.cache.keys())
+  }
+
+  listEntries(): Array<{ key: string; entry: CacheEntry<T> }> {
+    const entries: Array<{ key: string; entry: CacheEntry<T> }> = []
+    for (const [key, entry] of this.cache.entries()) {
+      entries.push({ key, entry })
+    }
+    return entries
+  }
+
   /**
    * Clear expired entries
    */
diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts
index af97941f2b..815b1217f2 100644
--- a/src/main/apiServer/services/unified-messages.ts
+++ b/src/main/apiServer/services/unified-messages.ts
@@ -237,7 +237,6 @@ function convertAnthropicToolsToAiSdk(tools: MessageCreateParams['tools']): Reco
       inputSchema: zodSchema(schema)
     })
 
-    logger.debug('Converted Anthropic tool to AI SDK tool', aiTool)
     aiSdkTools[toolDef.name] = aiTool
   }
   return Object.keys(aiSdkTools).length > 0 ? aiSdkTools : undefined
@@ -302,8 +301,9 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage
         }
       } else if (block.type === 'tool_use') {
         const options: ProviderOptions = {}
+
         if (isGemini3ModelId(params.model)) {
-          if (reasoningCache.get('google')) {
+          if (reasoningCache.get(`google-${block.name}`)) {
             options.google = {
               thoughtSignature: MAGIC_STRING
             }
@@ -394,11 +394,6 @@ async function createAiSdkProvider(config: AiSdkConfig): Promise
   const provider = await createProviderCore(providerId, config.options)
 
-  logger.debug('AI SDK provider created', {
-    providerId,
-    hasOptions: !!config.options
-  })
-
   return provider
 }
@@ -424,7 +419,6 @@ async function prepareSpecialProviderConfig(provider: Provider, config: AiSdkCon
           ...headers,
           ...existingHeaders
         }
-        logger.debug('Copilot token retrieved successfully')
       } catch (error) {
         logger.error('Failed to get Copilot token', error as Error)
        throw new Error('Failed to get Copilot token. Please re-authorize Copilot.')
@@ -450,7 +444,6 @@ async function prepareSpecialProviderConfig(provider: Provider, config: AiSdkCon
             baseURL: 'https://api.anthropic.com/v1',
             apiKey: ''
           }
-          logger.debug('Anthropic OAuth token retrieved successfully')
         } catch (error) {
           logger.error('Failed to get Anthropic OAuth token', error as Error)
           throw new Error('Failed to get Anthropic OAuth token.
Please re-authorize.') @@ -479,7 +472,6 @@ async function prepareSpecialProviderConfig(provider: Provider, config: AiSdkCon } }) } - logger.debug('CherryAI signed fetch configured') break } } @@ -498,12 +490,6 @@ async function executeStream(config: ExecuteStreamConfig): Promise Date: Sun, 30 Nov 2025 18:35:58 +0800 Subject: [PATCH 25/53] fix: update 'anthropic-beta' header and add authorization for longcat provider --- packages/shared/anthropic/index.ts | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/packages/shared/anthropic/index.ts b/packages/shared/anthropic/index.ts index e2113eb749..78df7ff7af 100644 --- a/packages/shared/anthropic/index.ts +++ b/packages/shared/anthropic/index.ts @@ -11,7 +11,7 @@ import Anthropic from '@anthropic-ai/sdk' import type { MessageCreateParams, TextBlockParam, Tool as AnthropicTool } from '@anthropic-ai/sdk/resources' import { loggerService } from '@logger' -import type { Provider } from '@types' +import { type Provider, SystemProviderIds } from '@types' import type { ModelMessage } from 'ai' const logger = loggerService.withContext('anthropic-sdk') @@ -124,7 +124,7 @@ export function getSdkClient( baseURL, dangerouslyAllowBrowser: true, defaultHeaders: { - 'anthropic-beta': 'output-128k-2025-02-19', + 'anthropic-beta': 'interleaved-thinking-2025-05-14', 'APP-Code': 'MLTG2087', ...provider.extra_headers, ...extraHeaders @@ -139,7 +139,8 @@ export function getSdkClient( baseURL, dangerouslyAllowBrowser: true, defaultHeaders: { - 'anthropic-beta': 'output-128k-2025-02-19', + 'anthropic-beta': 'interleaved-thinking-2025-05-14', + Authorization: provider.id === SystemProviderIds.longcat ? `Bearer ${provider.apiKey}` : undefined, ...provider.extra_headers }, fetch: customFetch From 4a913fcef7fe2a559fb7c70a82e2dcf228c5961a Mon Sep 17 00:00:00 2001 From: suyao Date: Mon, 1 Dec 2025 00:36:55 +0800 Subject: [PATCH 26/53] Refactor: Remove old cache implementation and integrate new reasoning cache service - Deleted the old ReasoningCache class and its instance. - Introduced CacheService for managing reasoning caches. - Updated unified-messages service to utilize new googleReasoningCache and openRouterReasoningCache. - Added AiSdkToAnthropicSSE adapter to handle streaming events and integrate with new cache service. - Reorganized shared adapters to include the new AiSdkToAnthropicSSE adapter. - Created openrouter adapter with detailed reasoning schemas for better type safety and validation. 
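
A minimal usage sketch of the new cache wiring (the import path assumes the `@main` alias used elsewhere in this repo, and the key strings here are illustrative, not fixed API contracts):

    import { googleReasoningCache, openRouterReasoningCache } from '@main/services/CacheService'

    // Store the thought signature emitted for a tool call; CacheService applies a 30-minute TTL
    googleReasoningCache.set('google-get_weather', 'thought-signature-token')

    // On a follow-up request, read the cached values back when rebuilding provider options
    const signature = googleReasoningCache.get('google-get_weather')
    const reasoningDetails = openRouterReasoningCache.get('openrouter') ?? []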
---
 .../adapters/AiSdkToAnthropicSSE.ts           | 28 ++---
 .../main/apiServer}/adapters/index.ts         |  0
 src/main/apiServer/adapters/openrouter.ts     | 95 ++++++++++++++
 src/main/apiServer/services/cache.ts          | 119 ------------------
 .../apiServer/services/unified-messages.ts    | 21 ++--
 src/main/services/CacheService.ts             | 31 +++++
 6 files changed, 150 insertions(+), 144 deletions(-)
 rename {packages/shared => src/main/apiServer}/adapters/AiSdkToAnthropicSSE.ts (95%)
 rename {packages/shared => src/main/apiServer}/adapters/index.ts (100%)
 create mode 100644 src/main/apiServer/adapters/openrouter.ts
 delete mode 100644 src/main/apiServer/services/cache.ts

diff --git a/packages/shared/adapters/AiSdkToAnthropicSSE.ts b/src/main/apiServer/adapters/AiSdkToAnthropicSSE.ts
similarity index 95%
rename from packages/shared/adapters/AiSdkToAnthropicSSE.ts
rename to src/main/apiServer/adapters/AiSdkToAnthropicSSE.ts
index c4f2355c0a..b5b52c4e03 100644
--- a/packages/shared/adapters/AiSdkToAnthropicSSE.ts
+++ b/src/main/apiServer/adapters/AiSdkToAnthropicSSE.ts
@@ -36,9 +36,10 @@ import type {
   Usage
 } from '@anthropic-ai/sdk/resources/messages'
 import { loggerService } from '@logger'
-import type { JSONValue } from 'ai'
 import { type FinishReason, type LanguageModelUsage, type TextStreamPart, type ToolSet } from 'ai'
 
+import { googleReasoningCache, openRouterReasoningCache } from '../../services/CacheService'
+
 const logger = loggerService.withContext('AiSdkToAnthropicSSE')
 
 interface ContentBlockState {
@@ -71,20 +72,11 @@ interface AdapterState {
 
 export type SSEEventCallback = (event: RawMessageStreamEvent) => void
 
-/**
- * Interface for a simple cache that stores reasoning details
- */
-export interface ReasoningCacheInterface {
-  set(signature: string, details: JSONValue): void
-  destroy?(): void
-}
-
 export interface AiSdkToAnthropicSSEOptions {
   model: string
   messageId?: string
   inputTokens?: number
   onEvent: SSEEventCallback
-  reasoningCache?: ReasoningCacheInterface
 }
 
 /**
@@ -93,11 +85,9 @@ export interface AiSdkToAnthropicSSEOptions {
 export class AiSdkToAnthropicSSE {
   private state: AdapterState
   private onEvent: SSEEventCallback
-  private reasoningCache?: ReasoningCacheInterface
 
   constructor(options: AiSdkToAnthropicSSEOptions) {
     this.onEvent = options.onEvent
-    this.reasoningCache = options.reasoningCache
     this.state = {
       messageId: options.messageId || `msg_${Date.now()}_${Math.random().toString(36).substring(2, 11)}`,
       model: options.model,
@@ -185,16 +175,22 @@ export class AiSdkToAnthropicSSE {
     // === Tool Events ===
 
     case 'tool-call':
-        if (this.reasoningCache && chunk.providerMetadata?.google?.thoughtSignature) {
-          this.reasoningCache.set(`google-${chunk.toolName}`, chunk.providerMetadata?.google?.thoughtSignature)
+        if (googleReasoningCache && chunk.providerMetadata?.google?.thoughtSignature) {
+          googleReasoningCache.set(
+            `google-${chunk.toolName}`,
+            chunk.providerMetadata?.google?.thoughtSignature as string
+          )
         }
         // FIXME: bind by tool call id
         if (
-          this.reasoningCache &&
+          openRouterReasoningCache &&
           chunk.providerMetadata?.openrouter?.reasoning_details &&
           Array.isArray(chunk.providerMetadata.openrouter.reasoning_details)
         ) {
-          this.reasoningCache.set('openrouter', chunk.providerMetadata.openrouter.reasoning_details)
+          openRouterReasoningCache.set(
+            'openrouter',
+            JSON.parse(JSON.stringify(chunk.providerMetadata.openrouter.reasoning_details))
+          )
         }
         this.handleToolCall({
           type: 'tool-call',
diff --git a/packages/shared/adapters/index.ts b/src/main/apiServer/adapters/index.ts
similarity index 100%
rename from
packages/shared/adapters/index.ts
rename to src/main/apiServer/adapters/index.ts
diff --git a/src/main/apiServer/adapters/openrouter.ts b/src/main/apiServer/adapters/openrouter.ts
new file mode 100644
index 0000000000..3b63191781
--- /dev/null
+++ b/src/main/apiServer/adapters/openrouter.ts
@@ -0,0 +1,95 @@
+import * as z from 'zod/v4'
+
+enum ReasoningFormat {
+  Unknown = 'unknown',
+  OpenAIResponsesV1 = 'openai-responses-v1',
+  XAIResponsesV1 = 'xai-responses-v1',
+  AnthropicClaudeV1 = 'anthropic-claude-v1',
+  GoogleGeminiV1 = 'google-gemini-v1'
+}
+
+// Anthropic Claude was the first reasoning that we're
+// passing back and forth
+export const DEFAULT_REASONING_FORMAT = ReasoningFormat.AnthropicClaudeV1
+
+function isDefinedOrNotNull<T>(value: T | null | undefined): value is T {
+  return value !== null && value !== undefined
+}
+
+export enum ReasoningDetailType {
+  Summary = 'reasoning.summary',
+  Encrypted = 'reasoning.encrypted',
+  Text = 'reasoning.text'
+}
+
+export const CommonReasoningDetailSchema = z
+  .object({
+    id: z.string().nullish(),
+    format: z.enum(ReasoningFormat).nullish(),
+    index: z.number().optional()
+  })
+  .loose()
+
+export const ReasoningDetailSummarySchema = z
+  .object({
+    type: z.literal(ReasoningDetailType.Summary),
+    summary: z.string()
+  })
+  .extend(CommonReasoningDetailSchema.shape)
+export type ReasoningDetailSummary = z.infer<typeof ReasoningDetailSummarySchema>
+
+export const ReasoningDetailEncryptedSchema = z
+  .object({
+    type: z.literal(ReasoningDetailType.Encrypted),
+    data: z.string()
+  })
+  .extend(CommonReasoningDetailSchema.shape)
+
+export type ReasoningDetailEncrypted = z.infer<typeof ReasoningDetailEncryptedSchema>
+
+export const ReasoningDetailTextSchema = z
+  .object({
+    type: z.literal(ReasoningDetailType.Text),
+    text: z.string().nullish(),
+    signature: z.string().nullish()
+  })
+  .extend(CommonReasoningDetailSchema.shape)
+
+export type ReasoningDetailText = z.infer<typeof ReasoningDetailTextSchema>
+
+export const ReasoningDetailUnionSchema = z.union([
+  ReasoningDetailSummarySchema,
+  ReasoningDetailEncryptedSchema,
+  ReasoningDetailTextSchema
+])
+
+export type ReasoningDetailUnion = z.infer<typeof ReasoningDetailUnionSchema>
+
+const ReasoningDetailsWithUnknownSchema = z.union([ReasoningDetailUnionSchema, z.unknown().transform(() => null)])
+
+export const ReasoningDetailArraySchema = z
+  .array(ReasoningDetailsWithUnknownSchema)
+  .transform((d) => d.filter((d): d is ReasoningDetailUnion => !!d))
+
+export const OutputUnionToReasoningDetailsSchema = z.union([
+  z
+    .object({
+      delta: z.object({
+        reasoning_details: z.array(ReasoningDetailsWithUnknownSchema)
+      })
+    })
+    .transform((data) => data.delta.reasoning_details.filter(isDefinedOrNotNull)),
+  z
+    .object({
+      message: z.object({
+        reasoning_details: z.array(ReasoningDetailsWithUnknownSchema)
+      })
+    })
+    .transform((data) => data.message.reasoning_details.filter(isDefinedOrNotNull)),
+  z
+    .object({
+      text: z.string(),
+      reasoning_details: z.array(ReasoningDetailsWithUnknownSchema)
+    })
+    .transform((data) => data.reasoning_details.filter(isDefinedOrNotNull))
+])
diff --git a/src/main/apiServer/services/cache.ts b/src/main/apiServer/services/cache.ts
deleted file mode 100644
index 9515778e16..0000000000
--- a/src/main/apiServer/services/cache.ts
+++ /dev/null
@@ -1,119 +0,0 @@
-import { loggerService } from '@logger'
-import type { JSONValue } from 'ai'
-
-const logger = loggerService.withContext('Cache')
-/**
- * Cache entry with TTL support
- */
-interface CacheEntry<T> {
-  details: T
-  timestamp: number
-}
-
-/**
- * In-memory cache for reasoning details
- * Key: signature
- * Value: reasoning array with timestamp
- */
diff --git a/src/main/apiServer/services/cache.ts b/src/main/apiServer/services/cache.ts
deleted file mode 100644
index 9515778e16..0000000000
--- a/src/main/apiServer/services/cache.ts
+++ /dev/null
@@ -1,119 +0,0 @@
-import { loggerService } from '@logger'
-import type { JSONValue } from 'ai'
-
-const logger = loggerService.withContext('Cache')
-/**
- * Cache entry with TTL support
- */
-interface CacheEntry<T> {
-  details: T
-  timestamp: number
-}
-
-/**
- * In-memory cache for reasoning details
- * Key: signature
- * Value: reasoning array with timestamp
- */
-export class ReasoningCache<T = JSONValue> {
-  private cache = new Map<string, CacheEntry<T>>()
-  private readonly ttlMs: number
-  private cleanupInterval: ReturnType<typeof setInterval> | null = null
-
-  constructor(ttlMs: number = 30 * 60 * 1000) {
-    // Default 30 minutes TTL
-    this.ttlMs = ttlMs
-    this.startCleanup()
-  }
-
-  /**
-   * Store reasoning details by signature
-   */
-  set(signature: string, details: T): void {
-    if (!signature || !details) return
-
-    this.cache.set(signature, {
-      details,
-      timestamp: Date.now()
-    })
-  }
-
-  /**
-   * Retrieve reasoning details by signature
-   */
-  get(signature: string): T | undefined {
-    const entry = this.cache.get(signature)
-    if (!entry) return undefined
-
-    // Check TTL
-    if (Date.now() - entry.timestamp > this.ttlMs) {
-      this.cache.delete(signature)
-      return undefined
-    }
-
-    return entry.details
-  }
-
-  listKeys(): string[] {
-    return Array.from(this.cache.keys())
-  }
-
-  listEntries(): Array<{ key: string; entry: CacheEntry<T> }> {
-    const entries: Array<{ key: string; entry: CacheEntry<T> }> = []
-    for (const [key, entry] of this.cache.entries()) {
-      entries.push({ key, entry })
-    }
-    return entries
-  }
-
-  /**
-   * Clear expired entries
-   */
-  cleanup(): void {
-    const now = Date.now()
-    let cleaned = 0
-
-    for (const [key, entry] of this.cache) {
-      if (now - entry.timestamp > this.ttlMs) {
-        this.cache.delete(key)
-        cleaned++
-      }
-    }
-
-    if (cleaned > 0) {
-      logger.debug('Cleaned up expired reasoning cache entries', { cleaned, remaining: this.cache.size })
-    }
-  }
-
-  /**
-   * Start periodic cleanup
-   */
-  private startCleanup(): void {
-    // Cleanup every 5 minutes
-    this.cleanupInterval = setInterval(() => this.cleanup(), 5 * 60 * 1000)
-  }
-
-  /**
-   * Stop cleanup and clear cache
-   */
-  destroy(): void {
-    if (this.cleanupInterval) {
-      clearInterval(this.cleanupInterval)
-      this.cleanupInterval = null
-    }
-    this.cache.clear()
-  }
-
-  /**
-   * Get cache stats for debugging
-   */
-  stats(): { size: number; ttlMs: number } {
-    return {
-      size: this.cache.size,
-      ttlMs: this.ttlMs
-    }
-  }
-}
-
-// Singleton cache instance
-export const reasoningCache = new ReasoningCache()
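The deleted ReasoningCache owned its own Map plus a 5-minute sweep timer; the hunks below fold the same 30-minute TTL semantics into the app-wide CacheService behind namespaced keys. A rough before/after sketch (identifiers are taken from this patch, the key and payload are made up, and imports are omitted since the "before" class no longer exists):

// Before: dedicated cache instance with its own sweep timer
const cache = new ReasoningCache<string>()
cache.set('sig_abc', 'thought-signature-payload')
cache.get('sig_abc') // hit until the 30-minute TTL lapses

// After: a thin adapter over CacheService (see the CacheService.ts hunks below);
// the entry is namespaced by key prefix instead of living in a separate Map
googleReasoningCache.set('sig_abc', 'thought-signature-payload')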
diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts
index 815b1217f2..7c85e2d6cf 100644
--- a/src/main/apiServer/services/unified-messages.ts
+++ b/src/main/apiServer/services/unified-messages.ts
@@ -9,11 +9,11 @@ import type {
 import { type AiPlugin, createExecutor } from '@cherrystudio/ai-core'
 import { createProvider as createProviderCore } from '@cherrystudio/ai-core/provider'
 import { loggerService } from '@logger'
+import { AiSdkToAnthropicSSE, formatSSEDone, formatSSEEvent } from '@main/apiServer/adapters'
 import { generateSignature as cherryaiGenerateSignature } from '@main/integration/cherryai'
 import anthropicService from '@main/services/AnthropicService'
 import copilotService from '@main/services/CopilotService'
 import { reduxService } from '@main/services/ReduxService'
-import { AiSdkToAnthropicSSE, formatSSEDone, formatSSEEvent } from '@shared/adapters'
 import { isGemini3ModelId } from '@shared/middleware'
 import {
   type AiSdkConfig,
@@ -33,12 +33,16 @@ import { net } from 'electron'
 import type { Response } from 'express'
 import * as z from 'zod'
 
-import { reasoningCache } from './cache'
+import { googleReasoningCache, openRouterReasoningCache } from '../../services/CacheService'
 
 const logger = loggerService.withContext('UnifiedMessagesService')
 
 const MAGIC_STRING = 'skip_thought_signature_validator'
 
+function sanitizeJson(value: unknown): JSONValue {
+  return JSON.parse(JSON.stringify(value))
+}
+
 initializeSharedProviders({
   warn: (message) => logger.warn(message),
   error: (message, error) => logger.error(message, error)
@@ -303,13 +307,13 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage
           const options: ProviderOptions = {}
 
           if (isGemini3ModelId(params.model)) {
-            if (reasoningCache.get(`google-${block.name}`)) {
+            if (googleReasoningCache.get(`google-${block.name}`)) {
               options.google = {
                 thoughtSignature: MAGIC_STRING
               }
-            } else if (reasoningCache.get('openrouter')) {
+            } else if (openRouterReasoningCache.get('openrouter')) {
               options.openrouter = {
-                reasoning_details: (reasoningCache.get('openrouter') as JSONValue[]) || []
+                reasoning_details: (sanitizeJson(openRouterReasoningCache.get('openrouter')) as JSONValue[]) || []
               }
             }
           }
@@ -345,10 +349,10 @@
       const assistantContent = [...reasoningParts, ...textParts, ...toolCallParts]
       if (assistantContent.length > 0) {
         let providerOptions: ProviderOptions | undefined = undefined
-        if (reasoningCache.get('openrouter')) {
+        if (openRouterReasoningCache.get('openrouter')) {
           providerOptions = {
             openrouter: {
-              reasoning_details: (reasoningCache.get('openrouter') as JSONValue[]) || []
+              reasoning_details: (sanitizeJson(openRouterReasoningCache.get('openrouter')) as JSONValue[]) || []
             }
           }
         } else if (isGemini3ModelId(params.model)) {
@@ -510,8 +514,7 @@ async function executeStream(config: ExecuteStreamConfig): Promise {}),
-      reasoningCache
+      onEvent: onEvent || (() => {})
     })
 
     // Execute stream - pass model object instead of string
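The sanitizeJson helper added above leans on a JSON round-trip to turn whatever the cache returns into plain JSONValue data before it is attached to providerOptions. A standalone illustration of what that normalizes, and its one sharp edge (example values are made up):

const sanitizeJson = (value: unknown) => JSON.parse(JSON.stringify(value))

// undefined properties and functions are dropped, Dates collapse to ISO strings
sanitizeJson({ a: 1, b: undefined, at: new Date(0) })
// => { a: 1, at: '1970-01-01T00:00:00.000Z' }

// caveat: JSON.stringify throws on circular references, so cached values must stay tree-shaped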
diff --git a/src/main/services/CacheService.ts b/src/main/services/CacheService.ts
index d2984a9984..b9de349b7b 100644
--- a/src/main/services/CacheService.ts
+++ b/src/main/services/CacheService.ts
@@ -4,6 +4,26 @@ interface CacheItem<T> {
   duration: number
 }
 
+// Import the reasoning detail type from openrouter adapter
+type ReasoningDetailUnion = {
+  id?: string | null
+  format?: 'unknown' | 'openai-responses-v1' | 'xai-responses-v1' | 'anthropic-claude-v1' | 'google-gemini-v1' | null
+  index?: number
+  type: 'reasoning.summary' | 'reasoning.encrypted' | 'reasoning.text'
+  summary?: string
+  data?: string
+  text?: string | null
+  signature?: string | null
+}
+
+/**
+ * Interface for reasoning cache
+ */
+export interface IReasoningCache<T> {
+  set(key: string, value: T): void
+  get(key: string): T | undefined
+}
+
 export class CacheService {
   private static cache: Map<string, CacheItem<any>> = new Map()
 
@@ -72,3 +92,14 @@ export class CacheService {
     return true
   }
 }
+
+// Singleton cache instances using CacheService
+export const googleReasoningCache: IReasoningCache<string> = {
+  set: (key, value) => CacheService.set(`google-reasoning:${key}`, value, 30 * 60 * 1000),
+  get: (key) => CacheService.get(`google-reasoning:${key}`) || undefined
+}
+
+export const openRouterReasoningCache: IReasoningCache<ReasoningDetailUnion[]> = {
+  set: (key, value) => CacheService.set(`openrouter-reasoning:${key}`, value, 30 * 60 * 1000),
+  get: (key) => CacheService.get(`openrouter-reasoning:${key}`) || undefined
+}

From 874d69291fa7df53a6e473f5b2d716be8821613d Mon Sep 17 00:00:00 2001
From: suyao
Date: Mon, 1 Dec 2025 01:33:55 +0800
Subject: [PATCH 27/53] refactor: import

---
 src/main/services/CacheService.ts | 14 ++------------
 1 file changed, 2 insertions(+), 12 deletions(-)

diff --git a/src/main/services/CacheService.ts b/src/main/services/CacheService.ts
index b9de349b7b..84c6935d3d 100644
--- a/src/main/services/CacheService.ts
+++ b/src/main/services/CacheService.ts
@@ -1,21 +1,11 @@
+import type { ReasoningDetailUnion } from '@main/apiServer/adapters/openrouter'
+
 interface CacheItem<T> {
   data: T
   timestamp: number
   duration: number
 }
 
-// Import the reasoning detail type from openrouter adapter
-type ReasoningDetailUnion = {
-  id?: string | null
-  format?: 'unknown' | 'openai-responses-v1' | 'xai-responses-v1' | 'anthropic-claude-v1' | 'google-gemini-v1' | null
-  index?: number
-  type: 'reasoning.summary' | 'reasoning.encrypted' | 'reasoning.text'
-  summary?: string
-  data?: string
-  text?: string | null
-  signature?: string | null
-}
-
 /**
  * Interface for reasoning cache
 */
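With IReasoningCache generic over its value type, the two singletons document exactly what they store: thought signatures as strings, OpenRouter reasoning details as arrays. A usage sketch under the types introduced here (the key and payload are illustrative; at this point in the series the OpenRouter cache still uses a single shared key):

import { openRouterReasoningCache } from '@main/services/CacheService'

// stored under the namespaced CacheService key "openrouter-reasoning:openrouter"
openRouterReasoningCache.set('openrouter', [{ type: 'reasoning.text', text: 'step one' }])

// typed as ReasoningDetailUnion[] | undefined; expired entries surface as undefined
const details = openRouterReasoningCache.get('openrouter')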
From a23195296935dfcf1b28f46d3eee80512c184980 Mon Sep 17 00:00:00 2001
From: suyao
Date: Mon, 1 Dec 2025 01:59:41 +0800
Subject: [PATCH 28/53] feat: Add model exclusion logic for the Azure OpenAI
 provider and update the tool call model filter.

---
 src/renderer/src/config/models/tooluse.ts | 18 ++++++++++++++++++
 src/renderer/src/config/models/utils.ts   | 10 +++++++++-
 2 files changed, 27 insertions(+), 1 deletion(-)

diff --git a/src/renderer/src/config/models/tooluse.ts b/src/renderer/src/config/models/tooluse.ts
index 7f90df5f7b..db0a767346 100644
--- a/src/renderer/src/config/models/tooluse.ts
+++ b/src/renderer/src/config/models/tooluse.ts
@@ -1,6 +1,8 @@
+import { getProviderByModel } from '@renderer/services/AssistantService'
 import type { Model } from '@renderer/types'
 import { isSystemProviderId } from '@renderer/types'
 import { getLowerBaseModelName, isUserSelectedModelType } from '@renderer/utils'
+import { isAzureOpenAIProvider } from '@shared/provider'
 
 import { isEmbeddingModel, isRerankModel } from './embedding'
 import { isDeepSeekHybridInferenceModel } from './reasoning'
@@ -52,6 +54,13 @@ export const FUNCTION_CALLING_REGEX = new RegExp(
   'i'
 )
 
+const AZURE_FUNCTION_CALLING_EXCLUDED_MODELS = [
+  '(?:Meta-)?Llama-3(?:\\.\\d+)?-[\\w-]+',
+  'Phi-[34](?:\\.[\\w-]+)?(?:-[\\w-]+)?',
+  'DeepSeek-(?:R1|V3)',
+  'Codestral-2501'
+]
+
 export function isFunctionCallingModel(model?: Model): boolean {
   if (!model || isEmbeddingModel(model) || isRerankModel(model) || isTextToImageModel(model)) {
     return false
   }
@@ -67,6 +76,15 @@ export function isFunctionCallingModel(model?: Model): boolean {
     return FUNCTION_CALLING_REGEX.test(modelId) || FUNCTION_CALLING_REGEX.test(model.name)
   }
 
+  const provider = getProviderByModel(model)
+
+  if (isAzureOpenAIProvider(provider)) {
+    const azureExcludedRegex = new RegExp(`\\b(?:${AZURE_FUNCTION_CALLING_EXCLUDED_MODELS.join('|')})\\b`, 'i')
+    if (azureExcludedRegex.test(modelId)) {
+      return false
+    }
+  }
+
   if (['deepseek', 'anthropic', 'kimi', 'moonshot'].includes(model.provider)) {
     return true
   }
diff --git a/src/renderer/src/config/models/utils.ts b/src/renderer/src/config/models/utils.ts
index bd45ed224f..129dc4abfd 100644
--- a/src/renderer/src/config/models/utils.ts
+++ b/src/renderer/src/config/models/utils.ts
@@ -13,6 +13,7 @@ import {
   isOpenAIReasoningModel
 } from './openai'
 import { isQwenMTModel } from './qwen'
+import { isFunctionCallingModel } from './tooluse'
 import { isGenerateImageModel, isTextToImageModel, isVisionModel } from './vision'
 export const NOT_SUPPORTED_REGEX = /(?:^tts|whisper|speech)/i
 export const GEMINI_FLASH_MODEL_REGEX = new RegExp('gemini.*-flash.*$', 'i')
@@ -181,8 +182,15 @@ export const isGeminiModel = (model: Model) => {
 // zhipu vision reasoning models mark their reasoning output with this pair of special tokens
 export const ZHIPU_RESULT_TOKENS = ['<|begin_of_box|>', '<|end_of_box|>'] as const
 
+// TODO: support tool calling in prompt mode
 export const agentModelFilter = (model: Model): boolean => {
-  return !isEmbeddingModel(model) && !isRerankModel(model) && !isTextToImageModel(model) && !isGenerateImageModel(model)
+  return (
+    !isEmbeddingModel(model) &&
+    !isRerankModel(model) &&
+    !isTextToImageModel(model) &&
+    !isGenerateImageModel(model) &&
+    isFunctionCallingModel(model)
+  )
 }
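The Azure exclusion list above is compiled into one word-bounded, case-insensitive alternation at check time, so each entry only has to describe a model family. A quick sanity sketch of how the alternation behaves (model ids are examples):

const AZURE_FUNCTION_CALLING_EXCLUDED_MODELS = [
  '(?:Meta-)?Llama-3(?:\\.\\d+)?-[\\w-]+',
  'Phi-[34](?:\\.[\\w-]+)?(?:-[\\w-]+)?',
  'DeepSeek-(?:R1|V3)',
  'Codestral-2501'
]
const azureExcludedRegex = new RegExp(`\\b(?:${AZURE_FUNCTION_CALLING_EXCLUDED_MODELS.join('|')})\\b`, 'i')

azureExcludedRegex.test('meta-llama-3.1-70b-instruct') // true: function calling disabled
azureExcludedRegex.test('deepseek-v3')                 // true
azureExcludedRegex.test('gpt-4o')                      // false: unaffected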
From fb9a8e7ce2ce86d10c8a95edfe7eecc9eb33b0ad Mon Sep 17 00:00:00 2001
From: suyao
Date: Mon, 1 Dec 2025 02:45:27 +0800
Subject: [PATCH 29/53] fix: params map

---
 .../apiServer/services/unified-messages.ts | 68 ++++++++++++++++++-
 1 file changed, 67 insertions(+), 1 deletion(-)

diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts
index 7c85e2d6cf..63bd461f5b 100644
--- a/src/main/apiServer/services/unified-messages.ts
+++ b/src/main/apiServer/services/unified-messages.ts
@@ -1,3 +1,6 @@
+import type { AnthropicProviderOptions } from '@ai-sdk/anthropic'
+import type { GoogleGenerativeAIProviderOptions } from '@ai-sdk/google'
+import type { OpenAIResponsesProviderOptions } from '@ai-sdk/openai'
 import type { LanguageModelV2Middleware, LanguageModelV2ToolResultOutput } from '@ai-sdk/provider'
 import type { ProviderOptions, ReasoningPart, ToolCallPart, ToolResultPart } from '@ai-sdk/provider-utils'
 import type {
@@ -20,6 +23,9 @@ import {
   type AiSdkConfigContext,
   formatProviderApiHost,
   initializeSharedProviders,
+  isAnthropicProvider,
+  isGeminiProvider,
+  isOpenAIProvider,
   type ProviderFormatContext,
   providerToAiSdkConfig as sharedProviderToAiSdkConfig,
   resolveActualProvider
@@ -482,6 +488,63 @@ async function prepareSpecialProviderConfig(provider: Provider, config: AiSdkCon
   return config
 }
 
+function mapAnthropicThinkToAISdkProviderOptions(
+  provider: Provider,
+  config: MessageCreateParams['thinking']
+): ProviderOptions | undefined {
+  if (!config) return undefined
+  if (isAnthropicProvider(provider)) {
+    return {
+      anthropic: {
+        ...mapToAnthropicProviderOptions(config)
+      }
+    }
+  }
+  if (isGeminiProvider(provider)) {
+    return {
+      google: {
+        ...mapToGeminiProviderOptions(config)
+      }
+    }
+  }
+  if (isOpenAIProvider(provider)) {
+    return {
+      openai: {
+        ...mapToOpenAIProviderOptions(config)
+      }
+    }
+  }
+  return undefined
+}
+
+function mapToAnthropicProviderOptions(config: NonNullable<MessageCreateParams['thinking']>): AnthropicProviderOptions {
+  return {
+    thinking: {
+      type: config.type,
+      budgetTokens: config.type === 'enabled' ? config.budget_tokens : undefined
+    }
+  }
+}
+
+function mapToGeminiProviderOptions(
+  config: NonNullable<MessageCreateParams['thinking']>
+): GoogleGenerativeAIProviderOptions {
+  return {
+    thinkingConfig: {
+      thinkingBudget: config.type === 'enabled' ? config.budget_tokens : -1,
+      includeThoughts: config.type === 'enabled'
+    }
+  }
+}
+
+function mapToOpenAIProviderOptions(
+  config: NonNullable<MessageCreateParams['thinking']>
+): OpenAIResponsesProviderOptions {
+  return {
+    reasoningEffort: config.type === 'enabled' ? 'high' : 'none'
+  }
+}
+
 /**
  * Core stream execution function - single source of truth for AI SDK calls
  */
@@ -521,14 +584,17 @@ async function executeStream(config: ExecuteStreamConfig): Promise
Date: Mon, 1 Dec 2025 13:45:52 +0800
Subject: [PATCH 30/53] gitignore

---
 .gitignore | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/.gitignore b/.gitignore
index a8107fa93e..9322c8717e 100644
--- a/.gitignore
+++ b/.gitignore
@@ -73,3 +73,5 @@ test-results
 YOUR_MEMORY_FILE_PATH
 
 .sessions/
+.next/
+*.tsbuildinfo

From 4d77202afdf017f02650aba3c30543e986e68e66 Mon Sep 17 00:00:00 2001
From: suyao
Date: Mon, 1 Dec 2025 13:50:01 +0800
Subject: [PATCH 31/53] filter: copilot

---
 src/renderer/src/config/models/__tests__/utils.test.ts | 8 ++++++++
 src/renderer/src/config/models/utils.ts                | 7 +++++++
 2 files changed, 15 insertions(+)

diff --git a/src/renderer/src/config/models/__tests__/utils.test.ts b/src/renderer/src/config/models/__tests__/utils.test.ts
index b27ed930cd..618a9e9dfe 100644
--- a/src/renderer/src/config/models/__tests__/utils.test.ts
+++ b/src/renderer/src/config/models/__tests__/utils.test.ts
@@ -15,6 +15,7 @@ import {
   isSupportVerbosityModel
 } from '../openai'
 import { isQwenMTModel } from '../qwen'
+import { isFunctionCallingModel } from '../tooluse'
 import {
   agentModelFilter,
   getModelSupportedVerbosity,
@@ -112,6 +113,7 @@ const textToImageMock = vi.mocked(isTextToImageModel)
 const generateImageMock = vi.mocked(isGenerateImageModel)
 const reasoningMock = vi.mocked(isOpenAIReasoningModel)
 const openAIWebSearchOnlyMock = vi.mocked(isOpenAIWebSearchChatCompletionOnlyModel)
+const isFunctionCallingModelMock = vi.mocked(isFunctionCallingModel)
 
 describe('model utils', () => {
   beforeEach(() => {
@@ -457,6 +459,12 @@ describe('model utils', () => {
     expect(agentModelFilter(createModel({ id: 'rerank' }))).toBe(false)
   })
 
+  it('filters out non-function-call models', () => {
+    rerankMock.mockReturnValue(false)
+    isFunctionCallingModelMock.mockReturnValueOnce(false)
+    expect(agentModelFilter(createModel({ id: 'DeepSeek R1' }))).toBe(false)
+  })
+
   it('filters out text-to-image models', () => {
     rerankMock.mockReturnValue(false)
     textToImageMock.mockReturnValueOnce(true)
diff --git a/src/renderer/src/config/models/utils.ts b/src/renderer/src/config/models/utils.ts
index 129dc4abfd..9a7d5fedfb 100644
--- a/src/renderer/src/config/models/utils.ts
+++ b/src/renderer/src/config/models/utils.ts
@@ -1,5 +1,6 @@
 import type OpenAI from '@cherrystudio/openai'
 import { isEmbeddingModel, isRerankModel } from '@renderer/config/models/embedding'
+import { getProviderByModel } from '@renderer/services/AssistantService'
 import { type Model, SystemProviderIds } from '@renderer/types'
 import type { OpenAIVerbosity, ValidOpenAIVerbosity } from '@renderer/types/aiCoreTypes'
 import { getLowerBaseModelName } from '@renderer/utils'
@@ -184,6 +185,12 @@ export const ZHIPU_RESULT_TOKENS = ['<|begin_of_box|>', '<|end_of_box|>'] as con
 
 // TODO: support tool calling in prompt mode
 export const agentModelFilter = (model: Model): boolean => {
+  const provider = getProviderByModel(model)
+
+  // Needs adaptation, and it is easy to exceed the quota
+  if (provider.id === SystemProviderIds.copilot) {
+    return false
+  }
   return (
     !isEmbeddingModel(model) &&
     !isRerankModel(model) &&
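agentModelFilter now needs the owning provider because the new exclusion is provider-level rather than model-level: Copilot still needs adaptation and exceeds its quota easily under agent workloads. A condensed restatement of the predicate assembled by the two commits above (a sketch, not a literal excerpt; import paths follow utils.ts):

import { getProviderByModel } from '@renderer/services/AssistantService'
import { type Model, SystemProviderIds } from '@renderer/types'
import { isEmbeddingModel, isRerankModel } from '@renderer/config/models/embedding'
import { isFunctionCallingModel } from './tooluse'
import { isGenerateImageModel, isTextToImageModel } from './vision'

export const agentModelFilterSketch = (model: Model): boolean => {
  // provider-level exclusion runs first, before any capability checks
  if (getProviderByModel(model).id === SystemProviderIds.copilot) return false
  return (
    !isEmbeddingModel(model) &&
    !isRerankModel(model) &&
    !isTextToImageModel(model) &&
    !isGenerateImageModel(model) &&
    isFunctionCallingModel(model) // prompt-mode tool calling is still a TODO
  )
}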
From fd0be32ab44e4c170be09cde65104b0c2573a6fa Mon Sep 17 00:00:00 2001
From: suyao
Date: Wed, 3 Dec 2025 11:58:46 +0800
Subject: [PATCH 32/53] fix: openrouter

---
 .../apiServer/adapters/AiSdkToAnthropicSSE.ts |  3 +-
 .../apiServer/services/unified-messages.ts    | 36 ++++++++++++++-----
 2 files changed, 29 insertions(+), 10 deletions(-)

diff --git a/src/main/apiServer/adapters/AiSdkToAnthropicSSE.ts b/src/main/apiServer/adapters/AiSdkToAnthropicSSE.ts
index b5b52c4e03..f24d8304a7 100644
--- a/src/main/apiServer/adapters/AiSdkToAnthropicSSE.ts
+++ b/src/main/apiServer/adapters/AiSdkToAnthropicSSE.ts
@@ -181,14 +181,13 @@ export class AiSdkToAnthropicSSE {
             chunk.providerMetadata?.google?.thoughtSignature as string
           )
         }
-        // FIXME: bind by tool call id
         if (
           openRouterReasoningCache &&
           chunk.providerMetadata?.openrouter?.reasoning_details &&
           Array.isArray(chunk.providerMetadata.openrouter.reasoning_details)
         ) {
           openRouterReasoningCache.set(
-            'openrouter',
+            `openrouter-${chunk.toolCallId}`,
             JSON.parse(JSON.stringify(chunk.providerMetadata.openrouter.reasoning_details))
           )
         }
diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts
index 63bd461f5b..c418f8c434 100644
--- a/src/main/apiServer/services/unified-messages.ts
+++ b/src/main/apiServer/services/unified-messages.ts
@@ -17,6 +17,7 @@ import { generateSignature as cherryaiGenerateSignature } from '@main/integratio
 import anthropicService from '@main/services/AnthropicService'
 import copilotService from '@main/services/CopilotService'
 import { reduxService } from '@main/services/ReduxService'
+import type { OpenRouterProviderOptions } from '@openrouter/ai-sdk-provider'
 import { isGemini3ModelId } from '@shared/middleware'
 import {
   type AiSdkConfig,
@@ -28,7 +29,8 @@ import {
   isOpenAIProvider,
   type ProviderFormatContext,
   providerToAiSdkConfig as sharedProviderToAiSdkConfig,
-  resolveActualProvider
+  resolveActualProvider,
+  SystemProviderIds
 } from '@shared/provider'
 import { COPILOT_DEFAULT_HEADERS } from '@shared/provider/constant'
 import { defaultAppHeaders } from '@shared/utils'
@@ -311,18 +313,19 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage
             }
           }
         } else if (block.type === 'tool_use') {
           const options: ProviderOptions = {}
-
+          logger.debug('Processing tool call block', { block, msgRole: msg.role, model: params.model })
           if (isGemini3ModelId(params.model)) {
             if (googleReasoningCache.get(`google-${block.name}`)) {
               options.google = {
                 thoughtSignature: MAGIC_STRING
               }
-            } else if (openRouterReasoningCache.get('openrouter')) {
-              options.openrouter = {
-                reasoning_details: (sanitizeJson(openRouterReasoningCache.get('openrouter')) as JSONValue[]) || []
-              }
             }
           }
+          if (openRouterReasoningCache.get(`openrouter-${block.id}`)) {
+            options.openrouter = {
+              reasoning_details: (sanitizeJson(openRouterReasoningCache.get(`openrouter-${block.id}`)) as JSONValue[]) || []
+            }
+          }
           toolCallParts.push({
             type: 'tool-call',
             toolName: block.name,
@@ -514,6 +517,13 @@ function mapAnthropicThinkToAISdkProviderOptions(
       }
     }
   }
+  if (provider.id === SystemProviderIds.openrouter) {
+    return {
+      openrouter: {
+        ...mapToOpenRouterProviderOptions(config)
+      }
+    }
+  }
   return undefined
 }
 
@@ -545,6 +555,17 @@ function mapToOpenAIProviderOptions(
   }
 }
 
+function mapToOpenRouterProviderOptions(
+  config: NonNullable<MessageCreateParams['thinking']>
+): OpenRouterProviderOptions {
+  return {
+    reasoning: {
+      enabled: config.type === 'enabled',
+      effort: 'high'
+    }
+  }
+}
+
 /**
  * Core stream execution function - single source of truth for AI SDK calls
 */
@@ -580,9 +601,8 @@ async function executeStream(config: ExecuteStreamConfig): Promise {})
   })
 
-  // Execute stream - pass model object instead of string
   const result = await executor.streamText({
-    model, // Now passing LanguageModel object, not string
+    model,
     messages: coreMessages,
     // FIXME: The maxToken passed in by Claude Code can exceed some models' limits and needs special handling; this may be easier to fix in v2, and the maintenance cost is high for now
    // Known: Doubao
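Keying the cached reasoning_details by tool call id, instead of one shared 'openrouter' slot, lets interleaved tool calls round-trip their own reasoning. A sketch of the write/read pair this commit establishes (the id and payload are made up):

import { openRouterReasoningCache } from '@main/services/CacheService'

const toolCallId = 'call_abc123'

// write side (AiSdkToAnthropicSSE): one cache slot per streamed tool call
openRouterReasoningCache.set(`openrouter-${toolCallId}`, [{ type: 'reasoning.text', text: 'why this call' }])

// read side (convertAnthropicToAiMessages): rehydrated when the matching
// tool_use block is replayed in the next Anthropic-format request
const cached = openRouterReasoningCache.get(`openrouter-${toolCallId}`)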
From 08a537bfe4bfafcf1b7060557698f6c8001d191b Mon Sep 17 00:00:00 2001
From: suyao
Date: Wed, 3 Dec 2025 12:15:53 +0800
Subject: [PATCH 33/53] fix: test

---
 .../apiServer/services/unified-messages.ts    |  7 +++--
 .../config/models/__tests__/tooluse.test.ts   | 23 +++++++++++++++
 .../src/config/models/__tests__/utils.test.ts | 28 +++++++++++++++++++
 src/renderer/src/utils/api.ts                 |  1 +
 4 files changed, 56 insertions(+), 3 deletions(-)

diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts
index c418f8c434..cfcdb48393 100644
--- a/src/main/apiServer/services/unified-messages.ts
+++ b/src/main/apiServer/services/unified-messages.ts
@@ -322,9 +322,10 @@ function convertAnthropicToAiMessages(params: MessageCreateParams): ModelMessage
           }
         }
         if (openRouterReasoningCache.get(`openrouter-${block.id}`)) {
-            options.openrouter = {
-              reasoning_details: (sanitizeJson(openRouterReasoningCache.get(`openrouter-${block.id}`)) as JSONValue[]) || []
-            }
+          options.openrouter = {
+            reasoning_details:
+              (sanitizeJson(openRouterReasoningCache.get(`openrouter-${block.id}`)) as JSONValue[]) || []
+          }
         }
         toolCallParts.push({
           type: 'tool-call',
diff --git a/src/renderer/src/config/models/__tests__/tooluse.test.ts b/src/renderer/src/config/models/__tests__/tooluse.test.ts
index e147e87f2f..24653f9a2c 100644
--- a/src/renderer/src/config/models/__tests__/tooluse.test.ts
+++ b/src/renderer/src/config/models/__tests__/tooluse.test.ts
@@ -6,6 +6,29 @@ import { isDeepSeekHybridInferenceModel } from '../reasoning'
 import { isFunctionCallingModel } from '../tooluse'
 import { isPureGenerateImageModel, isTextToImageModel } from '../vision'
 
+vi.mock('@renderer/i18n', () => ({
+  __esModule: true,
+  default: {
+    t: vi.fn((key: string) => key)
+  }
+}))
+
+vi.mock('@renderer/services/AssistantService', () => ({
+  getProviderByModel: vi.fn().mockReturnValue({
+    id: 'openai',
+    type: 'openai',
+    name: 'OpenAI',
+    models: []
+  }),
+  getAssistantSettings: vi.fn(),
+  getDefaultAssistant: vi.fn().mockReturnValue({
+    id: 'default',
+    name: 'Default Assistant',
+    prompt: '',
+    settings: {}
+  })
+}))
+
 vi.mock('@renderer/hooks/useStore', () => ({
   getStoreProviders: vi.fn(() => [])
 }))
diff --git a/src/renderer/src/config/models/__tests__/utils.test.ts b/src/renderer/src/config/models/__tests__/utils.test.ts
index 618a9e9dfe..a9387cc3f7 100644
--- a/src/renderer/src/config/models/__tests__/utils.test.ts
+++ b/src/renderer/src/config/models/__tests__/utils.test.ts
@@ -68,6 +68,29 @@ vi.mock('@renderer/store/settings', () => {
   )
 })
 
+vi.mock('@renderer/i18n', () => ({
+  __esModule: true,
+  default: {
+    t: vi.fn((key: string) => key)
+  }
+}))
+
+vi.mock('@renderer/services/AssistantService', () => ({
+  getProviderByModel: vi.fn().mockReturnValue({
+    id: 'openai',
+    type: 'openai',
+    name: 'OpenAI',
+    models: []
+  }),
+  getAssistantSettings: vi.fn(),
+  getDefaultAssistant: vi.fn().mockReturnValue({
+    id: 'default',
+    name: 'Default Assistant',
+    prompt: '',
+    settings: {}
+  })
+}))
+
 vi.mock('@renderer/hooks/useSettings', () => ({
   useSettings: vi.fn(() => ({})),
   useNavbarPosition: vi.fn(() => ({ navbarPosition: 'left' })),
@@ -98,6 +121,10 @@ vi.mock('../websearch', () => ({
   isOpenAIWebSearchChatCompletionOnlyModel: vi.fn()
 }))
 
+vi.mock('../tooluse', () => ({
+  isFunctionCallingModel: vi.fn()
+}))
+
 const createModel = (overrides: Partial<Model> = {}): Model => ({
   id: 'gpt-4o',
   name: 'gpt-4o',
   provider: 'openai',
   group: 'OpenAI'
 })
@@ -125,6 +152,7 @@ describe('model utils', () => {
     generateImageMock.mockReturnValue(false)
     reasoningMock.mockReturnValue(false)
     openAIWebSearchOnlyMock.mockReturnValue(false)
+    isFunctionCallingModelMock.mockReturnValue(true)
   })
 
   describe('OpenAI model detection', () => {
diff --git a/src/renderer/src/utils/api.ts b/src/renderer/src/utils/api.ts
index 0bdb4cc999..3c9b8b0465 100644
--- a/src/renderer/src/utils/api.ts
+++ b/src/renderer/src/utils/api.ts
@@ -10,6 +10,7 @@ export {
   SUPPORTED_IMAGE_ENDPOINT_LIST,
   validateApiHost,
   withoutTrailingApiVersion,
+  withoutTrailingSharp,
   withoutTrailingSlash
 } from '@shared/api'

From 0fc901108e2e86d10c8a95edfe7eecc9eb33b0ad Mon Sep 17 00:00:00 2001
From: suyao
Date: Thu, 4 Dec 2025 22:54:50 +0800
Subject: [PATCH 34/53] fix: type check

---
 src/renderer/src/utils/api.ts | 1 +
 1 file changed, 1 insertion(+)

diff --git a/src/renderer/src/utils/api.ts b/src/renderer/src/utils/api.ts
index 3c9b8b0465..665b49c7c4 100644
--- a/src/renderer/src/utils/api.ts
+++ b/src/renderer/src/utils/api.ts
@@ -1,6 +1,7 @@
 export {
   formatApiHost,
   formatAzureOpenAIApiHost,
+  formatOllamaApiHost,
   formatVertexApiHost,
   getAiSdkBaseUrl,
   getTrailingApiVersion,

From 39d1c71819aa124ca2dda201a37d16028a240aac Mon Sep 17 00:00:00 2001
From: suyao
Date: Fri, 5 Dec 2025 13:59:00 +0800
Subject: [PATCH 35/53] fix: type check

---
 src/main/apiServer/services/unified-messages.ts | 4 ----
 1 file changed, 4 deletions(-)

diff --git a/src/main/apiServer/services/unified-messages.ts b/src/main/apiServer/services/unified-messages.ts
index cfcdb48393..27037f1a84 100644
--- a/src/main/apiServer/services/unified-messages.ts
+++ b/src/main/apiServer/services/unified-messages.ts
@@ -98,10 +98,6 @@ function getMainProcessFormatContext(): ProviderFormatContext {
 }
 
 const mainProcessSdkContext: AiSdkConfigContext = {
-  getRotatedApiKey: (provider) => {
-    const keys = provider.apiKey.split(',').map((k) => k.trim())
-    return keys[0] || provider.apiKey
-  },
   fetch: net.fetch as typeof globalThis.fetch
 }

From c0c7d2b0dff72c0772733e6cd58e54d782e0c321 Mon Sep 17 00:00:00 2001
From: suyao
Date: Thu, 11 Dec 2025 12:43:30 +0800
Subject: [PATCH 36/53] fix: test

---
 src/renderer/src/utils/api.ts | 1 +
 1 file changed, 1 insertion(+)

diff --git a/src/renderer/src/utils/api.ts b/src/renderer/src/utils/api.ts
index 665b49c7c4..f6e0c63c58 100644
--- a/src/renderer/src/utils/api.ts
+++ b/src/renderer/src/utils/api.ts
@@ -6,6 +6,7 @@ export {
   getAiSdkBaseUrl,
   getTrailingApiVersion,
   hasAPIVersion,
+  isWithTrailingSharp,
   routeToEndpoint,
   SUPPORTED_ENDPOINT_LIST,
   SUPPORTED_IMAGE_ENDPOINT_LIST,

From 03dbc52477e65acd98e992ca0c1202bde4600c91 Mon Sep 17 00:00:00 2001
From: suyao
Date: Thu, 11 Dec 2025 12:54:20 +0800
Subject: [PATCH 37/53] fix: test

---
 .../provider/__tests__/providerConfig.test.ts | 136 +++++-------------
 1 file changed, 36 insertions(+), 100 deletions(-)

diff --git a/src/renderer/src/aiCore/provider/__tests__/providerConfig.test.ts b/src/renderer/src/aiCore/provider/__tests__/providerConfig.test.ts
index 5d508f95fa..bbeedd69c9 100644
--- a/src/renderer/src/aiCore/provider/__tests__/providerConfig.test.ts
+++ b/src/renderer/src/aiCore/provider/__tests__/providerConfig.test.ts
@@ -110,6 +110,31 @@ const createWindowKeyv = () => {
   }
 }
 
+/**
+ * Create the default mock state with all required fields
+ */
+const createDefaultMockState = (overrides?: {
+  includeUsage?: boolean | undefined
+  copilotHeaders?: Record<string, string>
+}) => ({
+  copilot: { defaultHeaders: overrides?.copilotHeaders ??
{} }, + settings: { + openAI: { + streamOptions: { + includeUsage: overrides?.includeUsage + } + } + }, + llm: { + settings: { + vertexai: { + projectId: '', + location: '' + } + } + } +}) + const createCopilotProvider = (): Provider => ({ id: 'copilot', type: 'openai', @@ -153,16 +178,7 @@ describe('Copilot responses routing', () => { ...(globalThis as any).window, keyv: createWindowKeyv() } - mockGetState.mockReturnValue({ - copilot: { defaultHeaders: {} }, - settings: { - openAI: { - streamOptions: { - includeUsage: undefined - } - } - } - }) + mockGetState.mockReturnValue(createDefaultMockState()) }) it('detects official GPT-5 Codex identifiers case-insensitively', () => { @@ -198,16 +214,7 @@ describe('CherryAI provider configuration', () => { ...(globalThis as any).window, keyv: createWindowKeyv() } - mockGetState.mockReturnValue({ - copilot: { defaultHeaders: {} }, - settings: { - openAI: { - streamOptions: { - includeUsage: undefined - } - } - } - }) + mockGetState.mockReturnValue(createDefaultMockState()) vi.clearAllMocks() }) @@ -279,16 +286,7 @@ describe('Perplexity provider configuration', () => { ...(globalThis as any).window, keyv: createWindowKeyv() } - mockGetState.mockReturnValue({ - copilot: { defaultHeaders: {} }, - settings: { - openAI: { - streamOptions: { - includeUsage: undefined - } - } - } - }) + mockGetState.mockReturnValue(createDefaultMockState()) vi.clearAllMocks() }) @@ -363,6 +361,7 @@ describe('Stream options includeUsage configuration', () => { ...(globalThis as any).window, keyv: createWindowKeyv() } + mockGetState.mockReturnValue(createDefaultMockState()) vi.clearAllMocks() }) @@ -377,16 +376,7 @@ describe('Stream options includeUsage configuration', () => { }) it('uses includeUsage from settings when undefined', () => { - mockGetState.mockReturnValue({ - copilot: { defaultHeaders: {} }, - settings: { - openAI: { - streamOptions: { - includeUsage: undefined - } - } - } - }) + mockGetState.mockReturnValue(createDefaultMockState({ includeUsage: undefined })) const provider = createOpenAIProvider() const config = providerToAiSdkConfig(provider, createModel('gpt-4', 'GPT-4', 'openai')) @@ -395,16 +385,7 @@ describe('Stream options includeUsage configuration', () => { }) it('uses includeUsage from settings when set to true', () => { - mockGetState.mockReturnValue({ - copilot: { defaultHeaders: {} }, - settings: { - openAI: { - streamOptions: { - includeUsage: true - } - } - } - }) + mockGetState.mockReturnValue(createDefaultMockState({ includeUsage: true })) const provider = createOpenAIProvider() const config = providerToAiSdkConfig(provider, createModel('gpt-4', 'GPT-4', 'openai')) @@ -413,16 +394,7 @@ describe('Stream options includeUsage configuration', () => { }) it('uses includeUsage from settings when set to false', () => { - mockGetState.mockReturnValue({ - copilot: { defaultHeaders: {} }, - settings: { - openAI: { - streamOptions: { - includeUsage: false - } - } - } - }) + mockGetState.mockReturnValue(createDefaultMockState({ includeUsage: false })) const provider = createOpenAIProvider() const config = providerToAiSdkConfig(provider, createModel('gpt-4', 'GPT-4', 'openai')) @@ -431,16 +403,7 @@ describe('Stream options includeUsage configuration', () => { }) it('respects includeUsage setting for non-supporting providers', () => { - mockGetState.mockReturnValue({ - copilot: { defaultHeaders: {} }, - settings: { - openAI: { - streamOptions: { - includeUsage: true - } - } - } - }) + mockGetState.mockReturnValue(createDefaultMockState({ includeUsage: 
true })) const testProvider: Provider = { id: 'test', @@ -462,16 +425,7 @@ describe('Stream options includeUsage configuration', () => { }) it('uses includeUsage from settings for Copilot provider when set to false', () => { - mockGetState.mockReturnValue({ - copilot: { defaultHeaders: {} }, - settings: { - openAI: { - streamOptions: { - includeUsage: false - } - } - } - }) + mockGetState.mockReturnValue(createDefaultMockState({ includeUsage: false })) const provider = createCopilotProvider() const config = providerToAiSdkConfig(provider, createModel('gpt-4', 'GPT-4', 'copilot')) @@ -481,16 +435,7 @@ describe('Stream options includeUsage configuration', () => { }) it('uses includeUsage from settings for Copilot provider when set to true', () => { - mockGetState.mockReturnValue({ - copilot: { defaultHeaders: {} }, - settings: { - openAI: { - streamOptions: { - includeUsage: true - } - } - } - }) + mockGetState.mockReturnValue(createDefaultMockState({ includeUsage: true })) const provider = createCopilotProvider() const config = providerToAiSdkConfig(provider, createModel('gpt-4', 'GPT-4', 'copilot')) @@ -500,16 +445,7 @@ describe('Stream options includeUsage configuration', () => { }) it('uses includeUsage from settings for Copilot provider when undefined', () => { - mockGetState.mockReturnValue({ - copilot: { defaultHeaders: {} }, - settings: { - openAI: { - streamOptions: { - includeUsage: undefined - } - } - } - }) + mockGetState.mockReturnValue(createDefaultMockState({ includeUsage: undefined })) const provider = createCopilotProvider() const config = providerToAiSdkConfig(provider, createModel('gpt-4', 'GPT-4', 'copilot')) From dd2faa2b6a29b6c6314478745b4e00fc05608b77 Mon Sep 17 00:00:00 2001 From: suyao Date: Wed, 17 Dec 2025 18:17:26 +0800 Subject: [PATCH 38/53] chore: format --- src/main/services/agents/services/claudecode/index.ts | 1 - 1 file changed, 1 deletion(-) diff --git a/src/main/services/agents/services/claudecode/index.ts b/src/main/services/agents/services/claudecode/index.ts index 0c36a6f61e..689c177ff5 100644 --- a/src/main/services/agents/services/claudecode/index.ts +++ b/src/main/services/agents/services/claudecode/index.ts @@ -107,7 +107,6 @@ class ClaudeCodeService implements AgentServiceInterface { const customGitBashPath = validateGitBashPath(configManager.get(ConfigKeys.GitBashPath) as string | undefined) - // Route through local API Server which handles format conversion via unified adapter // This enables Claude Code Agent to work with any provider (OpenAI, Gemini, etc.) 
// The API Server converts AI SDK responses to Anthropic SSE format transparently From 905e29007118e61139fae3e8b80aa73e4ad6cec9 Mon Sep 17 00:00:00 2001 From: suyao Date: Wed, 17 Dec 2025 18:21:42 +0800 Subject: [PATCH 39/53] chore: lint --- packages/shared/provider/sdk-config.ts | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/packages/shared/provider/sdk-config.ts b/packages/shared/provider/sdk-config.ts index 006de36ba4..b87a31ed25 100644 --- a/packages/shared/provider/sdk-config.ts +++ b/packages/shared/provider/sdk-config.ts @@ -6,6 +6,7 @@ */ import { formatPrivateKey, hasProviderConfig, ProviderConfigFactory } from '@cherrystudio/ai-core/provider' +import { defaultAppHeaders } from '@shared/utils' import { isEmpty } from 'lodash' import { routeToEndpoint } from '../api' @@ -13,7 +14,6 @@ import { isOllamaProvider } from './detection' import { getAiSdkProviderId } from './mapping' import type { MinimalProvider } from './types' import { SystemProviderIds } from './types' -import { defaultAppHeaders } from '@shared/utils' /** * AI SDK configuration result From b33e5959556ff634fe64f3b99c97c4d8dd6cc8de Mon Sep 17 00:00:00 2001 From: suyao Date: Thu, 18 Dec 2025 14:10:42 +0800 Subject: [PATCH 40/53] Merge remote-tracking branch 'origin/main' into feat/proxy-api-server --- build/nsis-installer.nsh | 65 +- electron-builder.yml | 60 +- package.json | 2 +- packages/shared/IpcChannel.ts | 1 + packages/shared/config/constant.ts | 8 + packages/shared/provider/types.ts | 6 +- src/main/ipc.ts | 25 +- src/main/mcpServers/factory.ts | 2 +- src/main/mcpServers/filesystem.ts | 652 ------------------ src/main/mcpServers/filesystem/index.ts | 2 + src/main/mcpServers/filesystem/server.ts | 118 ++++ .../mcpServers/filesystem/tools/delete.ts | 93 +++ src/main/mcpServers/filesystem/tools/edit.ts | 130 ++++ src/main/mcpServers/filesystem/tools/glob.ts | 149 ++++ src/main/mcpServers/filesystem/tools/grep.ts | 266 +++++++ src/main/mcpServers/filesystem/tools/index.ts | 8 + src/main/mcpServers/filesystem/tools/ls.ts | 150 ++++ src/main/mcpServers/filesystem/tools/read.ts | 101 +++ src/main/mcpServers/filesystem/tools/write.ts | 83 +++ src/main/mcpServers/filesystem/types.ts | 627 +++++++++++++++++ src/main/services/ConfigManager.ts | 3 +- src/main/services/MCPService.ts | 20 + .../agents/services/claudecode/index.ts | 7 +- src/main/utils/__tests__/process.test.ts | 294 +++++++- src/main/utils/process.ts | 78 ++- src/preload/index.ts | 3 +- .../legacy/clients/openai/OpenAIApiClient.ts | 6 +- .../middleware/AiSdkMiddlewareBuilder.ts | 11 - .../plugins/searchOrchestrationPlugin.ts | 46 +- .../__tests__/model-parameters.test.ts | 2 +- .../aiCore/utils/__tests__/reasoning.test.ts | 107 ++- src/renderer/src/aiCore/utils/reasoning.ts | 54 +- .../src/assets/images/models/mimo.svg | 17 + .../src/assets/images/providers/mimo.svg | 17 + src/renderer/src/components/Icons/SVGIcon.tsx | 12 + .../components/Popups/agent/AgentModal.tsx | 177 +++-- .../config/models/__tests__/reasoning.test.ts | 122 +++- src/renderer/src/config/models/default.ts | 16 +- src/renderer/src/config/models/logo.ts | 4 +- src/renderer/src/config/models/reasoning.ts | 95 ++- src/renderer/src/config/models/tooluse.ts | 5 +- src/renderer/src/config/models/vision.ts | 2 +- src/renderer/src/config/providers.ts | 26 +- src/renderer/src/i18n/label.ts | 22 +- src/renderer/src/i18n/locales/en-us.json | 19 +- src/renderer/src/i18n/locales/zh-cn.json | 19 +- src/renderer/src/i18n/locales/zh-tw.json | 19 +- 
src/renderer/src/i18n/translate/de-de.json | 19 +- src/renderer/src/i18n/translate/el-gr.json | 19 +- src/renderer/src/i18n/translate/es-es.json | 19 +- src/renderer/src/i18n/translate/fr-fr.json | 19 +- src/renderer/src/i18n/translate/ja-jp.json | 19 +- src/renderer/src/i18n/translate/pt-pt.json | 19 +- src/renderer/src/i18n/translate/ru-ru.json | 19 +- .../tools/components/ThinkingButton.tsx | 44 +- .../MCPSettings/BuiltinMCPServerList.tsx | 11 +- .../ProviderSettings/ProviderSetting.tsx | 1 + src/renderer/src/services/ApiService.ts | 57 ++ src/renderer/src/services/AssistantService.ts | 5 +- src/renderer/src/services/KnowledgeService.ts | 132 ++++ .../src/services/OrchestrateService.ts | 91 --- .../src/services/StreamProcessingService.ts | 4 + .../callbacks/citationCallbacks.ts | 7 +- src/renderer/src/store/index.ts | 2 +- src/renderer/src/store/mcp.ts | 10 + src/renderer/src/store/migrate.ts | 15 + src/renderer/src/store/thunk/messageThunk.ts | 6 +- src/renderer/src/types/index.ts | 19 +- yarn.lock | 20 +- 69 files changed, 3189 insertions(+), 1119 deletions(-) delete mode 100644 src/main/mcpServers/filesystem.ts create mode 100644 src/main/mcpServers/filesystem/index.ts create mode 100644 src/main/mcpServers/filesystem/server.ts create mode 100644 src/main/mcpServers/filesystem/tools/delete.ts create mode 100644 src/main/mcpServers/filesystem/tools/edit.ts create mode 100644 src/main/mcpServers/filesystem/tools/glob.ts create mode 100644 src/main/mcpServers/filesystem/tools/grep.ts create mode 100644 src/main/mcpServers/filesystem/tools/index.ts create mode 100644 src/main/mcpServers/filesystem/tools/ls.ts create mode 100644 src/main/mcpServers/filesystem/tools/read.ts create mode 100644 src/main/mcpServers/filesystem/tools/write.ts create mode 100644 src/main/mcpServers/filesystem/types.ts create mode 100644 src/renderer/src/assets/images/models/mimo.svg create mode 100644 src/renderer/src/assets/images/providers/mimo.svg delete mode 100644 src/renderer/src/services/OrchestrateService.ts diff --git a/build/nsis-installer.nsh b/build/nsis-installer.nsh index 769ccaaa19..e644e18f3d 100644 --- a/build/nsis-installer.nsh +++ b/build/nsis-installer.nsh @@ -12,8 +12,13 @@ ; https://github.com/electron-userland/electron-builder/issues/1122 !ifndef BUILD_UNINSTALLER + ; Check VC++ Redistributable based on architecture stored in $1 Function checkVCRedist - ReadRegDWORD $0 HKLM "SOFTWARE\Microsoft\VisualStudio\14.0\VC\Runtimes\x64" "Installed" + ${If} $1 == "arm64" + ReadRegDWORD $0 HKLM "SOFTWARE\Microsoft\VisualStudio\14.0\VC\Runtimes\ARM64" "Installed" + ${Else} + ReadRegDWORD $0 HKLM "SOFTWARE\Microsoft\VisualStudio\14.0\VC\Runtimes\x64" "Installed" + ${EndIf} FunctionEnd Function checkArchitectureCompatibility @@ -97,29 +102,47 @@ Call checkVCRedist ${If} $0 != "1" - MessageBox MB_YESNO "\ - NOTE: ${PRODUCT_NAME} requires $\r$\n\ - 'Microsoft Visual C++ Redistributable'$\r$\n\ - to function properly.$\r$\n$\r$\n\ - Download and install now?" /SD IDYES IDYES InstallVCRedist IDNO DontInstall - InstallVCRedist: - inetc::get /CAPTION " " /BANNER "Downloading Microsoft Visual C++ Redistributable..." 
"https://aka.ms/vs/17/release/vc_redist.x64.exe" "$TEMP\vc_redist.x64.exe" - ExecWait "$TEMP\vc_redist.x64.exe /install /norestart" - ;IfErrors InstallError ContinueInstall ; vc_redist exit code is unreliable :( - Call checkVCRedist - ${If} $0 == "1" - Goto ContinueInstall - ${EndIf} + ; VC++ is required - install automatically since declining would abort anyway + ; Select download URL based on system architecture (stored in $1) + ${If} $1 == "arm64" + StrCpy $2 "https://aka.ms/vs/17/release/vc_redist.arm64.exe" + StrCpy $3 "$TEMP\vc_redist.arm64.exe" + ${Else} + StrCpy $2 "https://aka.ms/vs/17/release/vc_redist.x64.exe" + StrCpy $3 "$TEMP\vc_redist.x64.exe" + ${EndIf} - ;InstallError: - MessageBox MB_ICONSTOP "\ - There was an unexpected error installing$\r$\n\ - Microsoft Visual C++ Redistributable.$\r$\n\ - The installation of ${PRODUCT_NAME} cannot continue." - DontInstall: + inetc::get /CAPTION " " /BANNER "Downloading Microsoft Visual C++ Redistributable..." \ + $2 $3 /END + Pop $0 ; Get download status from inetc::get + ${If} $0 != "OK" + MessageBox MB_ICONSTOP|MB_YESNO "\ + Failed to download Microsoft Visual C++ Redistributable.$\r$\n$\r$\n\ + Error: $0$\r$\n$\r$\n\ + Would you like to open the download page in your browser?$\r$\n\ + $2" IDYES openDownloadUrl IDNO skipDownloadUrl + openDownloadUrl: + ExecShell "open" $2 + skipDownloadUrl: Abort + ${EndIf} + + ExecWait "$3 /install /quiet /norestart" + ; Note: vc_redist exit code is unreliable, verify via registry check instead + + Call checkVCRedist + ${If} $0 != "1" + MessageBox MB_ICONSTOP|MB_YESNO "\ + Microsoft Visual C++ Redistributable installation failed.$\r$\n$\r$\n\ + Would you like to open the download page in your browser?$\r$\n\ + $2$\r$\n$\r$\n\ + The installation of ${PRODUCT_NAME} cannot continue." IDYES openInstallUrl IDNO skipInstallUrl + openInstallUrl: + ExecShell "open" $2 + skipInstallUrl: + Abort + ${EndIf} ${EndIf} - ContinueInstall: Pop $4 Pop $3 Pop $2 diff --git a/electron-builder.yml b/electron-builder.yml index db1184be87..e3ab493666 100644 --- a/electron-builder.yml +++ b/electron-builder.yml @@ -134,54 +134,38 @@ artifactBuildCompleted: scripts/artifact-build-completed.js releaseInfo: releaseNotes: | - Cherry Studio 1.7.4 - New Browser MCP & Model Updates + Cherry Studio 1.7.5 - Filesystem MCP Overhaul & Topic Management - This release adds a powerful browser automation MCP server, new web search provider, and model support updates. + This release features a completely rewritten filesystem MCP server, new batch topic management, and improved assistant management. 
✨ New Features - - [MCP] Add @cherry/browser CDP MCP server with session management for browser automation - - [Web Search] Add ExaMCP free web search provider (no API key required) - - [Model] Support GPT 5.2 series models - - [Model] Add capabilities support for Doubao Seed Code models (tool calling, reasoning, vision) - - 🔧 Improvements - - [Translate] Add reasoning effort option to translate service - - [i18n] Improve zh-TW Traditional Chinese locale - - [Settings] Update MCP Settings layout and styling + - [MCP] Rewrite filesystem MCP server with improved tool set (glob, ls, grep, read, write, edit, delete) + - [Topics] Add topic manage mode for batch delete and move operations with search functionality + - [Assistants] Merge import/subscribe popups and add export to assistant management + - [Knowledge] Use prompt injection for forced knowledge base search (faster response times) + - [Settings] Add tool use mode setting (prompt/function) to default assistant settings 🐛 Bug Fixes - - [Chat] Fix line numbers being wrongly copied from code blocks - - [Translate] Fix default to first supported reasoning effort when translating - - [Chat] Fix preserve thinking block in assistant messages - - [Web Search] Fix max search result limit - - [Embedding] Fix embedding dimensions retrieval for ModernAiProvider - - [Chat] Fix token calculation in prompt tool use plugin - - [Model] Fix Ollama provider options for Qwen model support - - [UI] Fix Chat component marginRight calculation for improved layout + - [Model] Correct typo in Gemini 3 Pro Image Preview model name + - [Installer] Auto-install VC++ Redistributable without user prompt + - [Notes] Fix notes directory validation and default path reset for cross-platform restore + - [OAuth] Bind OAuth callback server to localhost (127.0.0.1) for security - Cherry Studio 1.7.4 - 新增浏览器 MCP 与模型更新 + Cherry Studio 1.7.5 - 文件系统 MCP 重构与话题管理 - 本次更新新增强大的浏览器自动化 MCP 服务器、新的网页搜索提供商以及模型支持更新。 + 本次更新完全重写了文件系统 MCP 服务器,新增批量话题管理功能,并改进了助手管理。 ✨ 新功能 - - [MCP] 新增 @cherry/browser CDP MCP 服务器,支持会话管理的浏览器自动化 - - [网页搜索] 新增 ExaMCP 免费网页搜索提供商(无需 API 密钥) - - [模型] 支持 GPT 5.2 系列模型 - - [模型] 为豆包 Seed Code 模型添加能力支持(工具调用、推理、视觉) - - 🔧 功能改进 - - [翻译] 为翻译服务添加推理强度选项 - - [国际化] 改进繁体中文(zh-TW)本地化 - - [设置] 优化 MCP 设置布局和样式 + - [MCP] 重写文件系统 MCP 服务器,提供改进的工具集(glob、ls、grep、read、write、edit、delete) + - [话题] 新增话题管理模式,支持批量删除和移动操作,带搜索功能 + - [助手] 合并导入/订阅弹窗,并在助手管理中添加导出功能 + - [知识库] 使用提示词注入进行强制知识库搜索(响应更快) + - [设置] 在默认助手设置中添加工具使用模式设置(prompt/function) 🐛 问题修复 - - [聊天] 修复代码块中行号被错误复制的问题 - - [翻译] 修复翻译时默认使用第一个支持的推理强度 - - [聊天] 修复助手消息中思考块的保留问题 - - [网页搜索] 修复最大搜索结果数限制 - - [嵌入] 修复 ModernAiProvider 嵌入维度获取问题 - - [聊天] 修复提示词工具使用插件的 token 计算问题 - - [模型] 修复 Ollama 提供商对 Qwen 模型的支持选项 - - [界面] 修复聊天组件右边距计算以改善布局 + - [模型] 修正 Gemini 3 Pro Image Preview 模型名称的拼写错误 + - [安装程序] 自动安装 VC++ 运行库,无需用户确认 + - [笔记] 修复跨平台恢复场景下的笔记目录验证和默认路径重置逻辑 + - [OAuth] 将 OAuth 回调服务器绑定到 localhost (127.0.0.1) 以提高安全性 diff --git a/package.json b/package.json index 3fd6d1741f..b894030b58 100644 --- a/package.json +++ b/package.json @@ -1,6 +1,6 @@ { "name": "CherryStudio", - "version": "1.7.4", + "version": "1.7.5", "private": true, "description": "A powerful AI assistant for producer.", "main": "./out/main/index.js", diff --git a/packages/shared/IpcChannel.ts b/packages/shared/IpcChannel.ts index 0ebe48266d..aec1d57b43 100644 --- a/packages/shared/IpcChannel.ts +++ b/packages/shared/IpcChannel.ts @@ -244,6 +244,7 @@ export enum IpcChannel { System_GetCpuName = 'system:getCpuName', System_CheckGitBash = 'system:checkGitBash', System_GetGitBashPath = 
'system:getGitBashPath',
+  System_GetGitBashPathInfo = 'system:getGitBashPathInfo',
   System_SetGitBashPath = 'system:setGitBashPath',
 
   // DevTools
diff --git a/packages/shared/config/constant.ts b/packages/shared/config/constant.ts
index 1e02ce7706..af0191f4fa 100644
--- a/packages/shared/config/constant.ts
+++ b/packages/shared/config/constant.ts
@@ -488,3 +488,11 @@ export const MACOS_TERMINALS_WITH_COMMANDS: TerminalConfigWithCommand[] = [
 // resources/scripts should be maintained manually
 
 export const HOME_CHERRY_DIR = '.cherrystudio'
+
+// Git Bash path configuration types
+export type GitBashPathSource = 'manual' | 'auto'
+
+export interface GitBashPathInfo {
+  path: string | null
+  source: GitBashPathSource | null
+}
diff --git a/packages/shared/provider/types.ts b/packages/shared/provider/types.ts
index 763ed210c4..3dd56376db 100644
--- a/packages/shared/provider/types.ts
+++ b/packages/shared/provider/types.ts
@@ -100,7 +100,8 @@ export const SystemProviderIdSchema = z.enum([
   'huggingface',
   'sophnet',
   'gateway',
-  'cerebras'
+  'cerebras',
+  'mimo'
 ])
 
 export type SystemProviderId = z.infer<typeof SystemProviderIdSchema>
@@ -169,7 +170,8 @@
   longcat: 'longcat',
   huggingface: 'huggingface',
   gateway: 'gateway',
-  cerebras: 'cerebras'
+  cerebras: 'cerebras',
+  mimo: 'mimo'
 } as const satisfies Record<SystemProviderId, SystemProviderId>
 
 export type SystemProviderIdTypeMap = typeof SystemProviderIds
diff --git a/src/main/ipc.ts b/src/main/ipc.ts
index d7e82ff875..4cb3402414 100644
--- a/src/main/ipc.ts
+++ b/src/main/ipc.ts
@@ -6,7 +6,14 @@ import { loggerService } from '@logger'
 import { isLinux, isMac, isPortable, isWin } from '@main/constant'
 import { generateSignature } from '@main/integration/cherryai'
 import anthropicService from '@main/services/AnthropicService'
-import { findGitBash, getBinaryPath, isBinaryExists, runInstallScript, validateGitBashPath } from '@main/utils/process'
+import {
+  autoDiscoverGitBash,
+  getBinaryPath,
+  getGitBashPathInfo,
+  isBinaryExists,
+  runInstallScript,
+  validateGitBashPath
+} from '@main/utils/process'
 import { handleZoomFactor } from '@main/utils/zoom'
 import type { SpanEntity, TokenUsage } from '@mcp-trace/trace-core'
 import type { UpgradeChannel } from '@shared/config/constant'
@@ -499,9 +506,8 @@ export function registerIpc(mainWindow: BrowserWindow, app: Electron.App) {
     }
 
     try {
-      const customPath = configManager.get(ConfigKeys.GitBashPath) as string | undefined
-      const bashPath = findGitBash(customPath)
-
+      // Use autoDiscoverGitBash to handle auto-discovery and persistence
+      const bashPath = autoDiscoverGitBash()
       if (bashPath) {
         logger.info('Git Bash is available', { path: bashPath })
         return true
@@ -524,13 +530,22 @@
     return customPath ??
null }) + // Returns { path, source } where source is 'manual' | 'auto' | null + ipcMain.handle(IpcChannel.System_GetGitBashPathInfo, () => { + return getGitBashPathInfo() + }) + ipcMain.handle(IpcChannel.System_SetGitBashPath, (_, newPath: string | null) => { if (!isWin) { return false } if (!newPath) { + // Clear manual setting and re-run auto-discovery configManager.set(ConfigKeys.GitBashPath, null) + configManager.set(ConfigKeys.GitBashPathSource, null) + // Re-run auto-discovery to restore auto-discovered path if available + autoDiscoverGitBash() return true } @@ -539,7 +554,9 @@ export function registerIpc(mainWindow: BrowserWindow, app: Electron.App) { return false } + // Set path with 'manual' source configManager.set(ConfigKeys.GitBashPath, validated) + configManager.set(ConfigKeys.GitBashPathSource, 'manual') return true }) diff --git a/src/main/mcpServers/factory.ts b/src/main/mcpServers/factory.ts index ce736f6843..909901c1c8 100644 --- a/src/main/mcpServers/factory.ts +++ b/src/main/mcpServers/factory.ts @@ -36,7 +36,7 @@ export function createInMemoryMCPServer( return new FetchServer().server } case BuiltinMCPServerNames.filesystem: { - return new FileSystemServer(args).server + return new FileSystemServer(envs.WORKSPACE_ROOT).server } case BuiltinMCPServerNames.difyKnowledge: { const difyKey = envs.DIFY_KEY diff --git a/src/main/mcpServers/filesystem.ts b/src/main/mcpServers/filesystem.ts deleted file mode 100644 index ba10783881..0000000000 --- a/src/main/mcpServers/filesystem.ts +++ /dev/null @@ -1,652 +0,0 @@ -// port https://github.com/modelcontextprotocol/servers/blob/main/src/filesystem/index.ts - -import { loggerService } from '@logger' -import { Server } from '@modelcontextprotocol/sdk/server/index.js' -import { CallToolRequestSchema, ListToolsRequestSchema } from '@modelcontextprotocol/sdk/types.js' -import { createTwoFilesPatch } from 'diff' -import fs from 'fs/promises' -import { minimatch } from 'minimatch' -import os from 'os' -import path from 'path' -import * as z from 'zod' - -const logger = loggerService.withContext('MCP:FileSystemServer') - -// Normalize all paths consistently -function normalizePath(p: string): string { - return path.normalize(p) -} - -function expandHome(filepath: string): string { - if (filepath.startsWith('~/') || filepath === '~') { - return path.join(os.homedir(), filepath.slice(1)) - } - return filepath -} - -// Security utilities -async function validatePath(allowedDirectories: string[], requestedPath: string): Promise { - const expandedPath = expandHome(requestedPath) - const absolute = path.isAbsolute(expandedPath) - ? 
path.resolve(expandedPath) - : path.resolve(process.cwd(), expandedPath) - - const normalizedRequested = normalizePath(absolute) - - // Check if path is within allowed directories - const isAllowed = allowedDirectories.some((dir) => normalizedRequested.startsWith(dir)) - if (!isAllowed) { - throw new Error( - `Access denied - path outside allowed directories: ${absolute} not in ${allowedDirectories.join(', ')}` - ) - } - - // Handle symlinks by checking their real path - try { - const realPath = await fs.realpath(absolute) - const normalizedReal = normalizePath(realPath) - const isRealPathAllowed = allowedDirectories.some((dir) => normalizedReal.startsWith(dir)) - if (!isRealPathAllowed) { - throw new Error('Access denied - symlink target outside allowed directories') - } - return realPath - } catch (error) { - // For new files that don't exist yet, verify parent directory - const parentDir = path.dirname(absolute) - try { - const realParentPath = await fs.realpath(parentDir) - const normalizedParent = normalizePath(realParentPath) - const isParentAllowed = allowedDirectories.some((dir) => normalizedParent.startsWith(dir)) - if (!isParentAllowed) { - throw new Error('Access denied - parent directory outside allowed directories') - } - return absolute - } catch { - throw new Error(`Parent directory does not exist: ${parentDir}`) - } - } -} - -// Schema definitions -const ReadFileArgsSchema = z.object({ - path: z.string() -}) - -const ReadMultipleFilesArgsSchema = z.object({ - paths: z.array(z.string()) -}) - -const WriteFileArgsSchema = z.object({ - path: z.string(), - content: z.string() -}) - -const EditOperation = z.object({ - oldText: z.string().describe('Text to search for - must match exactly'), - newText: z.string().describe('Text to replace with') -}) - -const EditFileArgsSchema = z.object({ - path: z.string(), - edits: z.array(EditOperation), - dryRun: z.boolean().default(false).describe('Preview changes using git-style diff format') -}) - -const CreateDirectoryArgsSchema = z.object({ - path: z.string() -}) - -const ListDirectoryArgsSchema = z.object({ - path: z.string() -}) - -const DirectoryTreeArgsSchema = z.object({ - path: z.string() -}) - -const MoveFileArgsSchema = z.object({ - source: z.string(), - destination: z.string() -}) - -const SearchFilesArgsSchema = z.object({ - path: z.string(), - pattern: z.string(), - excludePatterns: z.array(z.string()).optional().default([]) -}) - -const GetFileInfoArgsSchema = z.object({ - path: z.string() -}) - -interface FileInfo { - size: number - created: Date - modified: Date - accessed: Date - isDirectory: boolean - isFile: boolean - permissions: string -} - -// Tool implementations -async function getFileStats(filePath: string): Promise { - const stats = await fs.stat(filePath) - return { - size: stats.size, - created: stats.birthtime, - modified: stats.mtime, - accessed: stats.atime, - isDirectory: stats.isDirectory(), - isFile: stats.isFile(), - permissions: stats.mode.toString(8).slice(-3) - } -} - -async function searchFiles( - allowedDirectories: string[], - rootPath: string, - pattern: string, - excludePatterns: string[] = [] -): Promise { - const results: string[] = [] - - async function search(currentPath: string) { - const entries = await fs.readdir(currentPath, { withFileTypes: true }) - - for (const entry of entries) { - const fullPath = path.join(currentPath, entry.name) - - try { - // Validate each path before processing - await validatePath(allowedDirectories, fullPath) - - // Check if path matches any exclude pattern - 
const relativePath = path.relative(rootPath, fullPath) - const shouldExclude = excludePatterns.some((pattern) => { - const globPattern = pattern.includes('*') ? pattern : `**/${pattern}/**` - return minimatch(relativePath, globPattern, { dot: true }) - }) - - if (shouldExclude) { - continue - } - - if (entry.name.toLowerCase().includes(pattern.toLowerCase())) { - results.push(fullPath) - } - - if (entry.isDirectory()) { - await search(fullPath) - } - } catch (error) { - // Skip invalid paths during search - } - } - } - - await search(rootPath) - return results -} - -// file editing and diffing utilities -function normalizeLineEndings(text: string): string { - return text.replace(/\r\n/g, '\n') -} - -function createUnifiedDiff(originalContent: string, newContent: string, filepath: string = 'file'): string { - // Ensure consistent line endings for diff - const normalizedOriginal = normalizeLineEndings(originalContent) - const normalizedNew = normalizeLineEndings(newContent) - - return createTwoFilesPatch(filepath, filepath, normalizedOriginal, normalizedNew, 'original', 'modified') -} - -async function applyFileEdits( - filePath: string, - edits: Array<{ oldText: string; newText: string }>, - dryRun = false -): Promise { - // Read file content and normalize line endings - const content = normalizeLineEndings(await fs.readFile(filePath, 'utf-8')) - - // Apply edits sequentially - let modifiedContent = content - for (const edit of edits) { - const normalizedOld = normalizeLineEndings(edit.oldText) - const normalizedNew = normalizeLineEndings(edit.newText) - - // If exact match exists, use it - if (modifiedContent.includes(normalizedOld)) { - modifiedContent = modifiedContent.replace(normalizedOld, normalizedNew) - continue - } - - // Otherwise, try line-by-line matching with flexibility for whitespace - const oldLines = normalizedOld.split('\n') - const contentLines = modifiedContent.split('\n') - let matchFound = false - - for (let i = 0; i <= contentLines.length - oldLines.length; i++) { - const potentialMatch = contentLines.slice(i, i + oldLines.length) - - // Compare lines with normalized whitespace - const isMatch = oldLines.every((oldLine, j) => { - const contentLine = potentialMatch[j] - return oldLine.trim() === contentLine.trim() - }) - - if (isMatch) { - // Preserve original indentation of first line - const originalIndent = contentLines[i].match(/^\s*/)?.[0] || '' - const newLines = normalizedNew.split('\n').map((line, j) => { - if (j === 0) return originalIndent + line.trimStart() - // For subsequent lines, try to preserve relative indentation - const oldIndent = oldLines[j]?.match(/^\s*/)?.[0] || '' - const newIndent = line.match(/^\s*/)?.[0] || '' - if (oldIndent && newIndent) { - const relativeIndent = newIndent.length - oldIndent.length - return originalIndent + ' '.repeat(Math.max(0, relativeIndent)) + line.trimStart() - } - return line - }) - - contentLines.splice(i, oldLines.length, ...newLines) - modifiedContent = contentLines.join('\n') - matchFound = true - break - } - } - - if (!matchFound) { - throw new Error(`Could not find exact match for edit:\n${edit.oldText}`) - } - } - - // Create unified diff - const diff = createUnifiedDiff(content, modifiedContent, filePath) - - // Format diff with appropriate number of backticks - let numBackticks = 3 - while (diff.includes('`'.repeat(numBackticks))) { - numBackticks++ - } - const formattedDiff = `${'`'.repeat(numBackticks)}diff\n${diff}${'`'.repeat(numBackticks)}\n\n` - - if (!dryRun) { - await fs.writeFile(filePath, 
modifiedContent, 'utf-8') - } - - return formattedDiff -} - -class FileSystemServer { - public server: Server - private allowedDirectories: string[] - constructor(allowedDirs: string[]) { - if (!Array.isArray(allowedDirs) || allowedDirs.length === 0) { - throw new Error('No allowed directories provided, please specify at least one directory in args') - } - - this.allowedDirectories = allowedDirs.map((dir) => normalizePath(path.resolve(expandHome(dir)))) - - // Validate that all directories exist and are accessible - this.validateDirs().catch((error) => { - logger.error('Error validating allowed directories:', error) - throw new Error(`Error validating allowed directories: ${error}`) - }) - - this.server = new Server( - { - name: 'secure-filesystem-server', - version: '0.2.0' - }, - { - capabilities: { - tools: {} - } - } - ) - this.initialize() - } - - async validateDirs() { - // Validate that all directories exist and are accessible - await Promise.all( - this.allowedDirectories.map(async (dir) => { - try { - const stats = await fs.stat(expandHome(dir)) - if (!stats.isDirectory()) { - logger.error(`Error: ${dir} is not a directory`) - throw new Error(`Error: ${dir} is not a directory`) - } - } catch (error: any) { - logger.error(`Error accessing directory ${dir}:`, error) - throw new Error(`Error accessing directory ${dir}:`, error) - } - }) - ) - } - - initialize() { - // Tool handlers - this.server.setRequestHandler(ListToolsRequestSchema, async () => { - return { - tools: [ - { - name: 'read_file', - description: - 'Read the complete contents of a file from the file system. ' + - 'Handles various text encodings and provides detailed error messages ' + - 'if the file cannot be read. Use this tool when you need to examine ' + - 'the contents of a single file. Only works within allowed directories.', - inputSchema: z.toJSONSchema(ReadFileArgsSchema) - }, - { - name: 'read_multiple_files', - description: - 'Read the contents of multiple files simultaneously. This is more ' + - 'efficient than reading files one by one when you need to analyze ' + - "or compare multiple files. Each file's content is returned with its " + - "path as a reference. Failed reads for individual files won't stop " + - 'the entire operation. Only works within allowed directories.', - inputSchema: z.toJSONSchema(ReadMultipleFilesArgsSchema) - }, - { - name: 'write_file', - description: - 'Create a new file or completely overwrite an existing file with new content. ' + - 'Use with caution as it will overwrite existing files without warning. ' + - 'Handles text content with proper encoding. Only works within allowed directories.', - inputSchema: z.toJSONSchema(WriteFileArgsSchema) - }, - { - name: 'edit_file', - description: - 'Make line-based edits to a text file. Each edit replaces exact line sequences ' + - 'with new content. Returns a git-style diff showing the changes made. ' + - 'Only works within allowed directories.', - inputSchema: z.toJSONSchema(EditFileArgsSchema) - }, - { - name: 'create_directory', - description: - 'Create a new directory or ensure a directory exists. Can create multiple ' + - 'nested directories in one operation. If the directory already exists, ' + - 'this operation will succeed silently. Perfect for setting up directory ' + - 'structures for projects or ensuring required paths exist. 
Only works within allowed directories.', - inputSchema: z.toJSONSchema(CreateDirectoryArgsSchema) - }, - { - name: 'list_directory', - description: - 'Get a detailed listing of all files and directories in a specified path. ' + - 'Results clearly distinguish between files and directories with [FILE] and [DIR] ' + - 'prefixes. This tool is essential for understanding directory structure and ' + - 'finding specific files within a directory. Only works within allowed directories.', - inputSchema: z.toJSONSchema(ListDirectoryArgsSchema) - }, - { - name: 'directory_tree', - description: - 'Get a recursive tree view of files and directories as a JSON structure. ' + - "Each entry includes 'name', 'type' (file/directory), and 'children' for directories. " + - 'Files have no children array, while directories always have a children array (which may be empty). ' + - 'The output is formatted with 2-space indentation for readability. Only works within allowed directories.', - inputSchema: z.toJSONSchema(DirectoryTreeArgsSchema) - }, - { - name: 'move_file', - description: - 'Move or rename files and directories. Can move files between directories ' + - 'and rename them in a single operation. If the destination exists, the ' + - 'operation will fail. Works across different directories and can be used ' + - 'for simple renaming within the same directory. Both source and destination must be within allowed directories.', - inputSchema: z.toJSONSchema(MoveFileArgsSchema) - }, - { - name: 'search_files', - description: - 'Recursively search for files and directories matching a pattern. ' + - 'Searches through all subdirectories from the starting path. The search ' + - 'is case-insensitive and matches partial names. Returns full paths to all ' + - "matching items. Great for finding files when you don't know their exact location. " + - 'Only searches within allowed directories.', - inputSchema: z.toJSONSchema(SearchFilesArgsSchema) - }, - { - name: 'get_file_info', - description: - 'Retrieve detailed metadata about a file or directory. Returns comprehensive ' + - 'information including size, creation time, last modified time, permissions, ' + - 'and type. This tool is perfect for understanding file characteristics ' + - 'without reading the actual content. Only works within allowed directories.', - inputSchema: z.toJSONSchema(GetFileInfoArgsSchema) - }, - { - name: 'list_allowed_directories', - description: - 'Returns the list of directories that this server is allowed to access. 
' + - 'Use this to understand which directories are available before trying to access files.', - inputSchema: { - type: 'object', - properties: {}, - required: [] - } - } - ] - } - }) - - this.server.setRequestHandler(CallToolRequestSchema, async (request) => { - try { - const { name, arguments: args } = request.params - - switch (name) { - case 'read_file': { - const parsed = ReadFileArgsSchema.safeParse(args) - if (!parsed.success) { - throw new Error(`Invalid arguments for read_file: ${parsed.error}`) - } - const validPath = await validatePath(this.allowedDirectories, parsed.data.path) - const content = await fs.readFile(validPath, 'utf-8') - return { - content: [{ type: 'text', text: content }] - } - } - - case 'read_multiple_files': { - const parsed = ReadMultipleFilesArgsSchema.safeParse(args) - if (!parsed.success) { - throw new Error(`Invalid arguments for read_multiple_files: ${parsed.error}`) - } - const results = await Promise.all( - parsed.data.paths.map(async (filePath: string) => { - try { - const validPath = await validatePath(this.allowedDirectories, filePath) - const content = await fs.readFile(validPath, 'utf-8') - return `${filePath}:\n${content}\n` - } catch (error) { - const errorMessage = error instanceof Error ? error.message : String(error) - return `${filePath}: Error - ${errorMessage}` - } - }) - ) - return { - content: [{ type: 'text', text: results.join('\n---\n') }] - } - } - - case 'write_file': { - const parsed = WriteFileArgsSchema.safeParse(args) - if (!parsed.success) { - throw new Error(`Invalid arguments for write_file: ${parsed.error}`) - } - const validPath = await validatePath(this.allowedDirectories, parsed.data.path) - await fs.writeFile(validPath, parsed.data.content, 'utf-8') - return { - content: [{ type: 'text', text: `Successfully wrote to ${parsed.data.path}` }] - } - } - - case 'edit_file': { - const parsed = EditFileArgsSchema.safeParse(args) - if (!parsed.success) { - throw new Error(`Invalid arguments for edit_file: ${parsed.error}`) - } - const validPath = await validatePath(this.allowedDirectories, parsed.data.path) - const result = await applyFileEdits(validPath, parsed.data.edits, parsed.data.dryRun) - return { - content: [{ type: 'text', text: result }] - } - } - - case 'create_directory': { - const parsed = CreateDirectoryArgsSchema.safeParse(args) - if (!parsed.success) { - throw new Error(`Invalid arguments for create_directory: ${parsed.error}`) - } - const validPath = await validatePath(this.allowedDirectories, parsed.data.path) - await fs.mkdir(validPath, { recursive: true }) - return { - content: [{ type: 'text', text: `Successfully created directory ${parsed.data.path}` }] - } - } - - case 'list_directory': { - const parsed = ListDirectoryArgsSchema.safeParse(args) - if (!parsed.success) { - throw new Error(`Invalid arguments for list_directory: ${parsed.error}`) - } - const validPath = await validatePath(this.allowedDirectories, parsed.data.path) - const entries = await fs.readdir(validPath, { withFileTypes: true }) - const formatted = entries - .map((entry) => `${entry.isDirectory() ? 
'[DIR]' : '[FILE]'} ${entry.name}`) - .join('\n') - return { - content: [{ type: 'text', text: formatted }] - } - } - - case 'directory_tree': { - const parsed = DirectoryTreeArgsSchema.safeParse(args) - if (!parsed.success) { - throw new Error(`Invalid arguments for directory_tree: ${parsed.error}`) - } - - interface TreeEntry { - name: string - type: 'file' | 'directory' - children?: TreeEntry[] - } - - async function buildTree(allowedDirectories: string[], currentPath: string): Promise { - const validPath = await validatePath(allowedDirectories, currentPath) - const entries = await fs.readdir(validPath, { withFileTypes: true }) - const result: TreeEntry[] = [] - - for (const entry of entries) { - const entryData: TreeEntry = { - name: entry.name, - type: entry.isDirectory() ? 'directory' : 'file' - } - - if (entry.isDirectory()) { - const subPath = path.join(currentPath, entry.name) - entryData.children = await buildTree(allowedDirectories, subPath) - } - - result.push(entryData) - } - - return result - } - - const treeData = await buildTree(this.allowedDirectories, parsed.data.path) - return { - content: [ - { - type: 'text', - text: JSON.stringify(treeData, null, 2) - } - ] - } - } - - case 'move_file': { - const parsed = MoveFileArgsSchema.safeParse(args) - if (!parsed.success) { - throw new Error(`Invalid arguments for move_file: ${parsed.error}`) - } - const validSourcePath = await validatePath(this.allowedDirectories, parsed.data.source) - const validDestPath = await validatePath(this.allowedDirectories, parsed.data.destination) - await fs.rename(validSourcePath, validDestPath) - return { - content: [ - { type: 'text', text: `Successfully moved ${parsed.data.source} to ${parsed.data.destination}` } - ] - } - } - - case 'search_files': { - const parsed = SearchFilesArgsSchema.safeParse(args) - if (!parsed.success) { - throw new Error(`Invalid arguments for search_files: ${parsed.error}`) - } - const validPath = await validatePath(this.allowedDirectories, parsed.data.path) - const results = await searchFiles( - this.allowedDirectories, - validPath, - parsed.data.pattern, - parsed.data.excludePatterns - ) - return { - content: [{ type: 'text', text: results.length > 0 ? results.join('\n') : 'No matches found' }] - } - } - - case 'get_file_info': { - const parsed = GetFileInfoArgsSchema.safeParse(args) - if (!parsed.success) { - throw new Error(`Invalid arguments for get_file_info: ${parsed.error}`) - } - const validPath = await validatePath(this.allowedDirectories, parsed.data.path) - const info = await getFileStats(validPath) - return { - content: [ - { - type: 'text', - text: Object.entries(info) - .map(([key, value]) => `${key}: ${value}`) - .join('\n') - } - ] - } - } - - case 'list_allowed_directories': { - return { - content: [ - { - type: 'text', - text: `Allowed directories:\n${this.allowedDirectories.join('\n')}` - } - ] - } - } - - default: - throw new Error(`Unknown tool: ${name}`) - } - } catch (error) { - const errorMessage = error instanceof Error ? 
error.message : String(error) - return { - content: [{ type: 'text', text: `Error: ${errorMessage}` }], - isError: true - } - } - }) - } -} - -export default FileSystemServer diff --git a/src/main/mcpServers/filesystem/index.ts b/src/main/mcpServers/filesystem/index.ts new file mode 100644 index 0000000000..cec4c31cdf --- /dev/null +++ b/src/main/mcpServers/filesystem/index.ts @@ -0,0 +1,2 @@ +// Re-export FileSystemServer to maintain existing import pattern +export { default, FileSystemServer } from './server' diff --git a/src/main/mcpServers/filesystem/server.ts b/src/main/mcpServers/filesystem/server.ts new file mode 100644 index 0000000000..164ba0c9c4 --- /dev/null +++ b/src/main/mcpServers/filesystem/server.ts @@ -0,0 +1,118 @@ +import { Server } from '@modelcontextprotocol/sdk/server/index.js' +import { CallToolRequestSchema, ListToolsRequestSchema } from '@modelcontextprotocol/sdk/types.js' +import { app } from 'electron' +import fs from 'fs/promises' +import path from 'path' + +import { + deleteToolDefinition, + editToolDefinition, + globToolDefinition, + grepToolDefinition, + handleDeleteTool, + handleEditTool, + handleGlobTool, + handleGrepTool, + handleLsTool, + handleReadTool, + handleWriteTool, + lsToolDefinition, + readToolDefinition, + writeToolDefinition +} from './tools' +import { logger } from './types' + +export class FileSystemServer { + public server: Server + private baseDir: string + + constructor(baseDir?: string) { + if (baseDir && path.isAbsolute(baseDir)) { + this.baseDir = baseDir + logger.info(`Using provided baseDir for filesystem MCP: ${baseDir}`) + } else { + const userData = app.getPath('userData') + this.baseDir = path.join(userData, 'Data', 'Workspace') + logger.info(`Using default workspace for filesystem MCP baseDir: ${this.baseDir}`) + } + + this.server = new Server( + { + name: 'filesystem-server', + version: '2.0.0' + }, + { + capabilities: { + tools: {} + } + } + ) + + this.initialize() + } + + async initialize() { + try { + await fs.mkdir(this.baseDir, { recursive: true }) + } catch (error) { + logger.error('Failed to create filesystem MCP baseDir', { error, baseDir: this.baseDir }) + } + + // Register tool list handler + this.server.setRequestHandler(ListToolsRequestSchema, async () => { + return { + tools: [ + globToolDefinition, + lsToolDefinition, + grepToolDefinition, + readToolDefinition, + editToolDefinition, + writeToolDefinition, + deleteToolDefinition + ] + } + }) + + // Register tool call handler + this.server.setRequestHandler(CallToolRequestSchema, async (request) => { + try { + const { name, arguments: args } = request.params + + switch (name) { + case 'glob': + return await handleGlobTool(args, this.baseDir) + + case 'ls': + return await handleLsTool(args, this.baseDir) + + case 'grep': + return await handleGrepTool(args, this.baseDir) + + case 'read': + return await handleReadTool(args, this.baseDir) + + case 'edit': + return await handleEditTool(args, this.baseDir) + + case 'write': + return await handleWriteTool(args, this.baseDir) + + case 'delete': + return await handleDeleteTool(args, this.baseDir) + + default: + throw new Error(`Unknown tool: ${name}`) + } + } catch (error) { + const errorMessage = error instanceof Error ? 
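The refactored server splits each tool into a definition (name, description, JSON schema derived from the zod schema) plus a handler, then wires both through the two MCP request handlers. The same registration pattern reduced to a single hypothetical echo tool, as a sketch:

import { Server } from '@modelcontextprotocol/sdk/server/index.js'
import { CallToolRequestSchema, ListToolsRequestSchema } from '@modelcontextprotocol/sdk/types.js'
import * as z from 'zod'

const EchoSchema = z.object({ text: z.string().describe('Text to echo back') })

const echoToolDefinition = {
  name: 'echo',
  description: 'Returns the provided text unchanged.',
  inputSchema: z.toJSONSchema(EchoSchema)
}

const server = new Server({ name: 'echo-server', version: '1.0.0' }, { capabilities: { tools: {} } })

// Advertise the tool catalog.
server.setRequestHandler(ListToolsRequestSchema, async () => ({ tools: [echoToolDefinition] }))

// Dispatch calls by tool name, validating arguments with the same zod schema.
server.setRequestHandler(CallToolRequestSchema, async (request) => {
  const { name, arguments: args } = request.params
  if (name !== 'echo') throw new Error(`Unknown tool: ${name}`)
  const parsed = EchoSchema.safeParse(args)
  if (!parsed.success) throw new Error(`Invalid arguments for echo: ${parsed.error}`)
  return { content: [{ type: 'text', text: parsed.data.text }] }
})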
error.message : String(error) + logger.error(`Tool execution error for ${request.params.name}:`, { error }) + return { + content: [{ type: 'text', text: `Error: ${errorMessage}` }], + isError: true + } + } + }) + } +} + +export default FileSystemServer diff --git a/src/main/mcpServers/filesystem/tools/delete.ts b/src/main/mcpServers/filesystem/tools/delete.ts new file mode 100644 index 0000000000..83becc4f17 --- /dev/null +++ b/src/main/mcpServers/filesystem/tools/delete.ts @@ -0,0 +1,93 @@ +import fs from 'fs/promises' +import path from 'path' +import * as z from 'zod' + +import { logger, validatePath } from '../types' + +// Schema definition +export const DeleteToolSchema = z.object({ + path: z.string().describe('The path to the file or directory to delete'), + recursive: z.boolean().optional().describe('For directories, whether to delete recursively (default: false)') +}) + +// Tool definition with detailed description +export const deleteToolDefinition = { + name: 'delete', + description: `Deletes a file or directory from the filesystem. + +CAUTION: This operation cannot be undone! + +- For files: simply provide the path +- For empty directories: provide the path +- For non-empty directories: set recursive=true +- The path must be an absolute path, not a relative path +- Always verify the path before deleting to avoid data loss`, + inputSchema: z.toJSONSchema(DeleteToolSchema) +} + +// Handler implementation +export async function handleDeleteTool(args: unknown, baseDir: string) { + const parsed = DeleteToolSchema.safeParse(args) + if (!parsed.success) { + throw new Error(`Invalid arguments for delete: ${parsed.error}`) + } + + const targetPath = parsed.data.path + const validPath = await validatePath(targetPath, baseDir) + const recursive = parsed.data.recursive || false + + // Check if path exists and get stats + let stats + try { + stats = await fs.stat(validPath) + } catch (error: any) { + if (error.code === 'ENOENT') { + throw new Error(`Path not found: ${targetPath}`) + } + throw error + } + + const isDirectory = stats.isDirectory() + const relativePath = path.relative(baseDir, validPath) + + // Perform deletion + try { + if (isDirectory) { + if (recursive) { + // Delete directory recursively + await fs.rm(validPath, { recursive: true, force: true }) + } else { + // Try to delete empty directory + await fs.rmdir(validPath) + } + } else { + // Delete file + await fs.unlink(validPath) + } + } catch (error: any) { + if (error.code === 'ENOTEMPTY') { + throw new Error(`Directory not empty: ${targetPath}. Use recursive=true to delete non-empty directories.`) + } + throw new Error(`Failed to delete: ${error.message}`) + } + + // Log the operation + logger.info('Path deleted', { + path: validPath, + type: isDirectory ? 'directory' : 'file', + recursive: isDirectory ? recursive : undefined + }) + + // Format output + const itemType = isDirectory ? 'Directory' : 'File' + const recursiveNote = isDirectory && recursive ? 
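The delete handler's dispatch is worth seeing in isolation: files go through fs.unlink, empty directories through fs.rmdir, recursive removal is gated behind an explicit flag, and ENOTEMPTY is translated into an actionable message. A condensed sketch (removePath is a hypothetical name):

import fs from 'fs/promises'

// Mirrors the delete tool's dispatch: unlink files, rmdir empty directories,
// and only fall back to recursive fs.rm when explicitly requested.
async function removePath(target: string, recursive = false): Promise<void> {
  const stats = await fs.stat(target)
  if (!stats.isDirectory()) {
    await fs.unlink(target)
    return
  }
  if (recursive) {
    await fs.rm(target, { recursive: true, force: true })
    return
  }
  try {
    await fs.rmdir(target) // fails with ENOTEMPTY when the directory has entries
  } catch (error: any) {
    if (error.code === 'ENOTEMPTY') {
      throw new Error(`Directory not empty: ${target}. Pass recursive=true to delete it.`)
    }
    throw error
  }
}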
' (recursive)' : '' + + return { + content: [ + { + type: 'text', + text: `${itemType} deleted${recursiveNote}: ${relativePath}` + } + ] + } +} diff --git a/src/main/mcpServers/filesystem/tools/edit.ts b/src/main/mcpServers/filesystem/tools/edit.ts new file mode 100644 index 0000000000..c1a0e637ce --- /dev/null +++ b/src/main/mcpServers/filesystem/tools/edit.ts @@ -0,0 +1,130 @@ +import fs from 'fs/promises' +import path from 'path' +import * as z from 'zod' + +import { logger, replaceWithFuzzyMatch, validatePath } from '../types' + +// Schema definition +export const EditToolSchema = z.object({ + file_path: z.string().describe('The path to the file to modify'), + old_string: z.string().describe('The text to replace'), + new_string: z.string().describe('The text to replace it with'), + replace_all: z.boolean().optional().default(false).describe('Replace all occurrences of old_string (default false)') +}) + +// Tool definition with detailed description +export const editToolDefinition = { + name: 'edit', + description: `Performs exact string replacements in files. + +- You must use the 'read' tool at least once before editing +- The file_path must be an absolute path, not a relative path +- Preserve exact indentation from read output (after the line number prefix) +- Never include line number prefixes in old_string or new_string +- ALWAYS prefer editing existing files over creating new ones +- The edit will FAIL if old_string is not found in the file +- The edit will FAIL if old_string appears multiple times (provide more context or use replace_all) +- The edit will FAIL if old_string equals new_string +- Use replace_all to rename variables or replace all occurrences`, + inputSchema: z.toJSONSchema(EditToolSchema) +} + +// Handler implementation +export async function handleEditTool(args: unknown, baseDir: string) { + const parsed = EditToolSchema.safeParse(args) + if (!parsed.success) { + throw new Error(`Invalid arguments for edit: ${parsed.error}`) + } + + const { file_path: filePath, old_string: oldString, new_string: newString, replace_all: replaceAll } = parsed.data + + // Validate path + const validPath = await validatePath(filePath, baseDir) + + // Check if file exists + try { + const stats = await fs.stat(validPath) + if (!stats.isFile()) { + throw new Error(`Path is not a file: ${filePath}`) + } + } catch (error: any) { + if (error.code === 'ENOENT') { + // If old_string is empty, this is a create new file operation + if (oldString === '') { + // Create parent directory if needed + const parentDir = path.dirname(validPath) + await fs.mkdir(parentDir, { recursive: true }) + + // Write the new content + await fs.writeFile(validPath, newString, 'utf-8') + + logger.info('File created', { path: validPath }) + + const relativePath = path.relative(baseDir, validPath) + return { + content: [ + { + type: 'text', + text: `Created new file: ${relativePath}\nLines: ${newString.split('\n').length}` + } + ] + } + } + throw new Error(`File not found: ${filePath}`) + } + throw error + } + + // Read current content + const content = await fs.readFile(validPath, 'utf-8') + + // Handle special case: old_string is empty (create file with content) + if (oldString === '') { + await fs.writeFile(validPath, newString, 'utf-8') + + logger.info('File overwritten', { path: validPath }) + + const relativePath = path.relative(baseDir, validPath) + return { + content: [ + { + type: 'text', + text: `Overwrote file: ${relativePath}\nLines: ${newString.split('\n').length}` + } + ] + } + } + + // Perform the 
replacement with fuzzy matching + const newContent = replaceWithFuzzyMatch(content, oldString, newString, replaceAll) + + // Write the modified content + await fs.writeFile(validPath, newContent, 'utf-8') + + logger.info('File edited', { + path: validPath, + replaceAll + }) + + // Generate a simple diff summary + const oldLines = content.split('\n').length + const newLines = newContent.split('\n').length + const lineDiff = newLines - oldLines + + const relativePath = path.relative(baseDir, validPath) + let diffSummary = `Edited: ${relativePath}` + if (lineDiff > 0) { + diffSummary += `\n+${lineDiff} lines` + } else if (lineDiff < 0) { + diffSummary += `\n${lineDiff} lines` + } + + return { + content: [ + { + type: 'text', + text: diffSummary + } + ] + } +} diff --git a/src/main/mcpServers/filesystem/tools/glob.ts b/src/main/mcpServers/filesystem/tools/glob.ts new file mode 100644 index 0000000000..d6a6b4a757 --- /dev/null +++ b/src/main/mcpServers/filesystem/tools/glob.ts @@ -0,0 +1,149 @@ +import fs from 'fs/promises' +import path from 'path' +import * as z from 'zod' + +import type { FileInfo } from '../types' +import { logger, MAX_FILES_LIMIT, runRipgrep, validatePath } from '../types' + +// Schema definition +export const GlobToolSchema = z.object({ + pattern: z.string().describe('The glob pattern to match files against'), + path: z + .string() + .optional() + .describe('The directory to search in (must be absolute path). Defaults to the base directory') +}) + +// Tool definition with detailed description +export const globToolDefinition = { + name: 'glob', + description: `Fast file pattern matching tool that works with any codebase size. + +- Supports glob patterns like "**/*.js" or "src/**/*.ts" +- Returns matching absolute file paths sorted by modification time (newest first) +- Use this when you need to find files by name patterns +- Patterns without "/" (e.g., "*.txt") match files at ANY depth in the directory tree +- Patterns with "/" (e.g., "src/*.ts") match relative to the search path +- Pattern syntax: * (any chars), ** (any path), {a,b} (alternatives), ? 
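All of the edit tool's matching guarantees come from replaceWithFuzzyMatch, defined in types.ts further below: the old string must match exactly once unless replace_all is set, and a missing match fails loudly rather than guessing. A quick usage sketch of just that helper:

import { replaceWithFuzzyMatch } from '../types'

const source = ['function greet() {', "  console.log('hi')", '}'].join('\n')

// A unique occurrence is replaced via the first (exact substring) replacer.
const edited = replaceWithFuzzyMatch(source, "console.log('hi')", "console.log('hello')")
console.log(edited.includes("'hello'")) // true

// Missing matches throw instead of silently doing nothing.
try {
  replaceWithFuzzyMatch(source, 'not in the file', 'x')
} catch (error) {
  console.log((error as Error).message) // 'old_string not found in content'
}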
(single char) +- Results are limited to 100 files +- The path parameter must be an absolute path if specified +- If path is not specified, defaults to the base directory +- IMPORTANT: Omit the path field for the default directory (don't use "undefined" or "null")`, + inputSchema: z.toJSONSchema(GlobToolSchema) +} + +// Handler implementation +export async function handleGlobTool(args: unknown, baseDir: string) { + const parsed = GlobToolSchema.safeParse(args) + if (!parsed.success) { + throw new Error(`Invalid arguments for glob: ${parsed.error}`) + } + + const searchPath = parsed.data.path || baseDir + const validPath = await validatePath(searchPath, baseDir) + + // Verify the search directory exists + try { + const stats = await fs.stat(validPath) + if (!stats.isDirectory()) { + throw new Error(`Path is not a directory: ${validPath}`) + } + } catch (error: unknown) { + if (error && typeof error === 'object' && 'code' in error && error.code === 'ENOENT') { + throw new Error(`Directory not found: ${validPath}`) + } + throw error + } + + // Validate pattern + const pattern = parsed.data.pattern.trim() + if (!pattern) { + throw new Error('Pattern cannot be empty') + } + + const files: FileInfo[] = [] + let truncated = false + + // Build ripgrep arguments for file listing using --glob=pattern format + const rgArgs: string[] = [ + '--files', + '--follow', + '--hidden', + `--glob=${pattern}`, + '--glob=!.git/*', + '--glob=!node_modules/*', + '--glob=!dist/*', + '--glob=!build/*', + '--glob=!__pycache__/*', + validPath + ] + + // Use ripgrep for file listing + logger.debug('Running ripgrep with args', { rgArgs }) + const rgResult = await runRipgrep(rgArgs) + logger.debug('Ripgrep result', { + ok: rgResult.ok, + exitCode: rgResult.exitCode, + stdoutLength: rgResult.stdout.length, + stdoutPreview: rgResult.stdout.slice(0, 500) + }) + + // Process results if we have stdout content + // Exit code 2 can indicate partial errors (e.g., permission denied on some dirs) but still have valid results + if (rgResult.ok && rgResult.stdout.length > 0) { + const lines = rgResult.stdout.split('\n').filter(Boolean) + logger.debug('Parsed lines from ripgrep', { lineCount: lines.length, lines }) + + for (const line of lines) { + if (files.length >= MAX_FILES_LIMIT) { + truncated = true + break + } + + const filePath = line.trim() + if (!filePath) continue + + const absolutePath = path.isAbsolute(filePath) ? filePath : path.resolve(validPath, filePath) + + try { + const stats = await fs.stat(absolutePath) + files.push({ + path: absolutePath, + type: 'file', // ripgrep --files only returns files + size: stats.size, + modified: stats.mtime + }) + } catch (error) { + logger.debug('Failed to stat file from ripgrep output, skipping', { file: absolutePath, error }) + } + } + } + + // Sort by modification time (newest first) + files.sort((a, b) => { + const aTime = a.modified ? a.modified.getTime() : 0 + const bTime = b.modified ? b.modified.getTime() : 0 + return bTime - aTime + }) + + // Format output - always use absolute paths + const output: string[] = [] + if (files.length === 0) { + output.push(`No files found matching pattern "${parsed.data.pattern}" in ${validPath}`) + } else { + output.push(...files.map((f) => f.path)) + if (truncated) { + output.push('') + output.push(`(Results truncated to ${MAX_FILES_LIMIT} files. 
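Because ripgrep does the actual matching, the glob tool reduces to argument assembly: --files lists candidate paths, the caller's pattern rides in as a --glob, and negated globs carve out the usual noise directories. That assembly as a pure function (buildGlobArgs is a hypothetical name):

// Builds the ripgrep argv used for glob-style file listing. Negated globs
// exclude the common noise directories; the caller's pattern is passed
// through unchanged, so "*.ts" matches at any depth.
function buildGlobArgs(pattern: string, searchPath: string): string[] {
  const ignored = ['.git', 'node_modules', 'dist', 'build', '__pycache__']
  return [
    '--files', // list file paths instead of searching contents
    '--follow', // resolve symlinks
    '--hidden', // include dotfiles (the negated globs still apply)
    `--glob=${pattern}`,
    ...ignored.map((dir) => `--glob=!${dir}/*`),
    searchPath
  ]
}

// e.g. ['--files', '--follow', '--hidden', '--glob=**/*.ts', '--glob=!.git/*', ..., '/workspace']
console.log(buildGlobArgs('**/*.ts', '/workspace'))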
Consider using a more specific pattern.)`) + } + } + + return { + content: [ + { + type: 'text', + text: output.join('\n') + } + ] + } +} diff --git a/src/main/mcpServers/filesystem/tools/grep.ts b/src/main/mcpServers/filesystem/tools/grep.ts new file mode 100644 index 0000000000..d822db9d88 --- /dev/null +++ b/src/main/mcpServers/filesystem/tools/grep.ts @@ -0,0 +1,266 @@ +import fs from 'fs/promises' +import path from 'path' +import * as z from 'zod' + +import type { GrepMatch } from '../types' +import { isBinaryFile, MAX_GREP_MATCHES, MAX_LINE_LENGTH, runRipgrep, validatePath } from '../types' + +// Schema definition +export const GrepToolSchema = z.object({ + pattern: z.string().describe('The regex pattern to search for in file contents'), + path: z + .string() + .optional() + .describe('The directory to search in (must be absolute path). Defaults to the base directory'), + include: z.string().optional().describe('File pattern to include in the search (e.g. "*.js", "*.{ts,tsx}")') +}) + +// Tool definition with detailed description +export const grepToolDefinition = { + name: 'grep', + description: `Fast content search tool that works with any codebase size. + +- Searches file contents using regular expressions +- Supports full regex syntax (e.g., "log.*Error", "function\\s+\\w+") +- Filter files by pattern with include (e.g., "*.js", "*.{ts,tsx}") +- Returns absolute file paths and line numbers with matching content +- Results are limited to 100 matches +- Binary files are automatically skipped +- Common directories (node_modules, .git, dist) are excluded +- The path parameter must be an absolute path if specified +- If path is not specified, defaults to the base directory`, + inputSchema: z.toJSONSchema(GrepToolSchema) +} + +// Handler implementation +export async function handleGrepTool(args: unknown, baseDir: string) { + const parsed = GrepToolSchema.safeParse(args) + if (!parsed.success) { + throw new Error(`Invalid arguments for grep: ${parsed.error}`) + } + + const data = parsed.data + + if (!data.pattern) { + throw new Error('Pattern is required for grep') + } + + const searchPath = data.path || baseDir + const validPath = await validatePath(searchPath, baseDir) + + const matches: GrepMatch[] = [] + let truncated = false + let regex: RegExp + + // Build ripgrep arguments + const rgArgs: string[] = [ + '--no-heading', + '--line-number', + '--color', + 'never', + '--ignore-case', + '--glob', + '!.git/**', + '--glob', + '!node_modules/**', + '--glob', + '!dist/**', + '--glob', + '!build/**', + '--glob', + '!__pycache__/**' + ] + + if (data.include) { + for (const pat of data.include + .split(',') + .map((p) => p.trim()) + .filter(Boolean)) { + rgArgs.push('--glob', pat) + } + } + + rgArgs.push(data.pattern) + rgArgs.push(validPath) + + try { + regex = new RegExp(data.pattern, 'gi') + } catch (error) { + throw new Error(`Invalid regex pattern: ${data.pattern}`) + } + + async function searchFile(filePath: string): Promise { + if (matches.length >= MAX_GREP_MATCHES) { + truncated = true + return + } + + try { + // Skip binary files + if (await isBinaryFile(filePath)) { + return + } + + const content = await fs.readFile(filePath, 'utf-8') + const lines = content.split('\n') + + lines.forEach((line, index) => { + if (matches.length >= MAX_GREP_MATCHES) { + truncated = true + return + } + + if (regex.test(line)) { + // Truncate long lines + const truncatedLine = line.length > MAX_LINE_LENGTH ? line.substring(0, MAX_LINE_LENGTH) + '...' 
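One caveat in the pure-JS fallback path: the compiled pattern keeps the 'g' flag, and RegExp.prototype.test is stateful for global regexes. lastIndex carries over between calls, so testing successive lines with the same regex can silently skip matches. A minimal reproduction and two possible fixes, as a sketch:

const stateful = /foo/g

// Both inputs contain 'foo', but the second call resumes from the
// lastIndex left behind by the first and reports a false negative.
console.log(stateful.test('foo')) // true  (lastIndex is now 3)
console.log(stateful.test('foo')) // false (search resumed past the end)

// Fix 1: drop 'g' when only per-line existence is being checked.
const perLine = /foo/i
console.log(perLine.test('foo'), perLine.test('foo')) // true true

// Fix 2: keep 'g' but reset state before each line.
stateful.lastIndex = 0
console.log(stateful.test('foo')) // true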
: line + + matches.push({ + file: filePath, + line: index + 1, + content: truncatedLine.trim() + }) + } + }) + } catch (error) { + // Skip files we can't read + } + } + + async function searchDirectory(dir: string): Promise { + if (matches.length >= MAX_GREP_MATCHES) { + truncated = true + return + } + + try { + const entries = await fs.readdir(dir, { withFileTypes: true }) + + for (const entry of entries) { + if (matches.length >= MAX_GREP_MATCHES) { + truncated = true + break + } + + const fullPath = path.join(dir, entry.name) + + // Skip common ignore patterns + if (entry.name.startsWith('.') && entry.name !== '.env.example') { + continue + } + if (['node_modules', 'dist', 'build', '__pycache__', '.git'].includes(entry.name)) { + continue + } + + if (entry.isFile()) { + // Check if file matches include pattern + if (data.include) { + const includePatterns = data.include.split(',').map((p) => p.trim()) + const fileName = path.basename(fullPath) + const matchesInclude = includePatterns.some((pattern) => { + // Simple glob pattern matching + const regexPattern = pattern + .replace(/\*/g, '.*') + .replace(/\?/g, '.') + .replace(/\{([^}]+)\}/g, (_, group) => `(${group.split(',').join('|')})`) + return new RegExp(`^${regexPattern}$`).test(fileName) + }) + if (!matchesInclude) { + continue + } + } + + await searchFile(fullPath) + } else if (entry.isDirectory()) { + await searchDirectory(fullPath) + } + } + } catch (error) { + // Skip directories we can't read + } + } + + // Perform the search + let usedRipgrep = false + try { + const rgResult = await runRipgrep(rgArgs) + if (rgResult.ok && rgResult.exitCode !== null && rgResult.exitCode !== 2) { + usedRipgrep = true + const lines = rgResult.stdout.split('\n').filter(Boolean) + for (const line of lines) { + if (matches.length >= MAX_GREP_MATCHES) { + truncated = true + break + } + + const firstColon = line.indexOf(':') + const secondColon = line.indexOf(':', firstColon + 1) + if (firstColon === -1 || secondColon === -1) continue + + const filePart = line.slice(0, firstColon) + const linePart = line.slice(firstColon + 1, secondColon) + const contentPart = line.slice(secondColon + 1) + const lineNum = Number.parseInt(linePart, 10) + if (!Number.isFinite(lineNum)) continue + + const absoluteFilePath = path.isAbsolute(filePart) ? filePart : path.resolve(baseDir, filePart) + const truncatedLine = + contentPart.length > MAX_LINE_LENGTH ? contentPart.substring(0, MAX_LINE_LENGTH) + '...' : contentPart + + matches.push({ + file: absoluteFilePath, + line: lineNum, + content: truncatedLine.trim() + }) + } + } + } catch { + usedRipgrep = false + } + + if (!usedRipgrep) { + const stats = await fs.stat(validPath) + if (stats.isFile()) { + await searchFile(validPath) + } else { + await searchDirectory(validPath) + } + } + + // Format output + const output: string[] = [] + + if (matches.length === 0) { + output.push('No matches found') + } else { + // Group matches by file + const fileGroups = new Map() + matches.forEach((match) => { + if (!fileGroups.has(match.file)) { + fileGroups.set(match.file, []) + } + fileGroups.get(match.file)!.push(match) + }) + + // Format grouped matches - always use absolute paths + fileGroups.forEach((fileMatches, filePath) => { + output.push(`\n${filePath}:`) + fileMatches.forEach((match) => { + output.push(` ${match.line}: ${match.content}`) + }) + }) + + if (truncated) { + output.push('') + output.push(`(Results truncated to ${MAX_GREP_MATCHES} matches. 
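The colon-splitting above assumes the file path itself contains no ':'. On Windows an absolute path starts with a drive letter such as C:\, so taking the first two colons mis-splits every match and the parseInt guard then drops it. A drive-letter-tolerant parse, assuming ripgrep's default --no-heading path:line:content layout (parseGrepLine is a hypothetical helper; rg --json would sidestep the ambiguity entirely):

// Splits a ripgrep `--no-heading --line-number` output line into its parts.
// The lazy (.*?) group stops at the first ':<digits>:' boundary, which skips
// a leading 'C:' drive prefix because no digits follow that colon.
function parseGrepLine(line: string): { file: string; line: number; content: string } | null {
  const match = /^(.*?):(\d+):(.*)$/.exec(line)
  if (!match) return null
  return { file: match[1], line: Number(match[2]), content: match[3] }
}

console.log(parseGrepLine('C:\\work\\a.ts:12:const x = 1'))
// -> { file: 'C:\\work\\a.ts', line: 12, content: 'const x = 1' }
console.log(parseGrepLine('/srv/app/b.ts:3:TODO'))
// -> { file: '/srv/app/b.ts', line: 3, content: 'TODO' }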
Consider using a more specific pattern or path.)`) + } + } + + return { + content: [ + { + type: 'text', + text: output.join('\n') + } + ] + } +} diff --git a/src/main/mcpServers/filesystem/tools/index.ts b/src/main/mcpServers/filesystem/tools/index.ts new file mode 100644 index 0000000000..2e02d613c4 --- /dev/null +++ b/src/main/mcpServers/filesystem/tools/index.ts @@ -0,0 +1,8 @@ +// Export all tool definitions and handlers +export { deleteToolDefinition, handleDeleteTool } from './delete' +export { editToolDefinition, handleEditTool } from './edit' +export { globToolDefinition, handleGlobTool } from './glob' +export { grepToolDefinition, handleGrepTool } from './grep' +export { handleLsTool, lsToolDefinition } from './ls' +export { handleReadTool, readToolDefinition } from './read' +export { handleWriteTool, writeToolDefinition } from './write' diff --git a/src/main/mcpServers/filesystem/tools/ls.ts b/src/main/mcpServers/filesystem/tools/ls.ts new file mode 100644 index 0000000000..22672c9fb9 --- /dev/null +++ b/src/main/mcpServers/filesystem/tools/ls.ts @@ -0,0 +1,150 @@ +import fs from 'fs/promises' +import path from 'path' +import * as z from 'zod' + +import { MAX_FILES_LIMIT, validatePath } from '../types' + +// Schema definition +export const LsToolSchema = z.object({ + path: z.string().optional().describe('The directory to list (must be absolute path). Defaults to the base directory'), + recursive: z.boolean().optional().describe('Whether to list directories recursively (default: false)') +}) + +// Tool definition with detailed description +export const lsToolDefinition = { + name: 'ls', + description: `Lists files and directories in a specified path. + +- Returns a tree-like structure with icons (📁 directories, 📄 files) +- Shows the absolute directory path in the header +- Entries are sorted alphabetically with directories first +- Can list recursively with recursive=true (up to 5 levels deep) +- Common directories (node_modules, dist, .git) are excluded +- Hidden files (starting with .) 
are excluded except .env.example +- Results are limited to 100 entries +- The path parameter must be an absolute path if specified +- If path is not specified, defaults to the base directory`, + inputSchema: z.toJSONSchema(LsToolSchema) +} + +// Handler implementation +export async function handleLsTool(args: unknown, baseDir: string) { + const parsed = LsToolSchema.safeParse(args) + if (!parsed.success) { + throw new Error(`Invalid arguments for ls: ${parsed.error}`) + } + + const targetPath = parsed.data.path || baseDir + const validPath = await validatePath(targetPath, baseDir) + const recursive = parsed.data.recursive || false + + interface TreeNode { + name: string + type: 'file' | 'directory' + children?: TreeNode[] + } + + let fileCount = 0 + let truncated = false + + async function buildTree(dirPath: string, depth: number = 0): Promise { + if (fileCount >= MAX_FILES_LIMIT) { + truncated = true + return [] + } + + try { + const entries = await fs.readdir(dirPath, { withFileTypes: true }) + const nodes: TreeNode[] = [] + + // Sort entries: directories first, then files, alphabetically + entries.sort((a, b) => { + if (a.isDirectory() && !b.isDirectory()) return -1 + if (!a.isDirectory() && b.isDirectory()) return 1 + return a.name.localeCompare(b.name) + }) + + for (const entry of entries) { + if (fileCount >= MAX_FILES_LIMIT) { + truncated = true + break + } + + // Skip hidden files and common ignore patterns + if (entry.name.startsWith('.') && entry.name !== '.env.example') { + continue + } + if (['node_modules', 'dist', 'build', '__pycache__'].includes(entry.name)) { + continue + } + + fileCount++ + const node: TreeNode = { + name: entry.name, + type: entry.isDirectory() ? 'directory' : 'file' + } + + if (entry.isDirectory() && recursive && depth < 5) { + // Limit depth to prevent infinite recursion + const childPath = path.join(dirPath, entry.name) + node.children = await buildTree(childPath, depth + 1) + } + + nodes.push(node) + } + + return nodes + } catch (error) { + return [] + } + } + + // Build the tree + const tree = await buildTree(validPath) + + // Format as text output + function formatTree(nodes: TreeNode[], prefix: string = ''): string[] { + const lines: string[] = [] + + nodes.forEach((node, index) => { + const isLastNode = index === nodes.length - 1 + const connector = isLastNode ? '└── ' : '├── ' + const icon = node.type === 'directory' ? '📁 ' : '📄 ' + + lines.push(prefix + connector + icon + node.name) + + if (node.children && node.children.length > 0) { + const childPrefix = prefix + (isLastNode ? ' ' : '│ ') + lines.push(...formatTree(node.children, childPrefix)) + } + }) + + return lines + } + + // Generate output + const output: string[] = [] + output.push(`Directory: ${validPath}`) + output.push('') + + if (tree.length === 0) { + output.push('(empty directory)') + } else { + const treeLines = formatTree(tree, '') + output.push(...treeLines) + + if (truncated) { + output.push('') + output.push(`(Results truncated to ${MAX_FILES_LIMIT} files. 
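The connector logic in formatTree is the classic box-drawing recursion: '└── ' marks a last sibling, '├── ' any other, and a '│' rail continues while an ancestor still has siblings below. A condensed, icon-free variant as a sketch (renderTree is hypothetical):

interface TreeNode {
  name: string
  type: 'file' | 'directory'
  children?: TreeNode[]
}

// Renders nodes with the same connectors the ls tool uses: '└── ' for the
// last sibling, '├── ' otherwise, and a '│   ' rail for open ancestors.
function renderTree(nodes: TreeNode[], prefix = ''): string[] {
  return nodes.flatMap((node, i) => {
    const last = i === nodes.length - 1
    const line = prefix + (last ? '└── ' : '├── ') + node.name
    const childPrefix = prefix + (last ? '    ' : '│   ')
    return [line, ...renderTree(node.children ?? [], childPrefix)]
  })
}

console.log(
  renderTree([
    { name: 'src', type: 'directory', children: [{ name: 'index.ts', type: 'file' }] },
    { name: 'README.md', type: 'file' }
  ]).join('\n')
)
// ├── src
// │   └── index.ts
// └── README.md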
Consider listing a more specific directory.)`) + } + } + + return { + content: [ + { + type: 'text', + text: output.join('\n') + } + ] + } +} diff --git a/src/main/mcpServers/filesystem/tools/read.ts b/src/main/mcpServers/filesystem/tools/read.ts new file mode 100644 index 0000000000..460c88dda4 --- /dev/null +++ b/src/main/mcpServers/filesystem/tools/read.ts @@ -0,0 +1,101 @@ +import fs from 'fs/promises' +import path from 'path' +import * as z from 'zod' + +import { DEFAULT_READ_LIMIT, isBinaryFile, MAX_LINE_LENGTH, validatePath } from '../types' + +// Schema definition +export const ReadToolSchema = z.object({ + file_path: z.string().describe('The path to the file to read'), + offset: z.number().optional().describe('The line number to start reading from (1-based)'), + limit: z.number().optional().describe('The number of lines to read (defaults to 2000)') +}) + +// Tool definition with detailed description +export const readToolDefinition = { + name: 'read', + description: `Reads a file from the local filesystem. + +- Assumes this tool can read all files on the machine +- The file_path parameter must be an absolute path, not a relative path +- By default, reads up to 2000 lines starting from the beginning +- You can optionally specify a line offset and limit for long files +- Any lines longer than 2000 characters will be truncated +- Results are returned with line numbers starting at 1 +- Binary files are detected and rejected with an error +- Empty files return a warning`, + inputSchema: z.toJSONSchema(ReadToolSchema) +} + +// Handler implementation +export async function handleReadTool(args: unknown, baseDir: string) { + const parsed = ReadToolSchema.safeParse(args) + if (!parsed.success) { + throw new Error(`Invalid arguments for read: ${parsed.error}`) + } + + const filePath = parsed.data.file_path + const validPath = await validatePath(filePath, baseDir) + + // Check if file exists + try { + const stats = await fs.stat(validPath) + if (!stats.isFile()) { + throw new Error(`Path is not a file: ${filePath}`) + } + } catch (error: any) { + if (error.code === 'ENOENT') { + throw new Error(`File not found: ${filePath}`) + } + throw error + } + + // Check if file is binary + if (await isBinaryFile(validPath)) { + throw new Error(`Cannot read binary file: ${filePath}`) + } + + // Read file content + const content = await fs.readFile(validPath, 'utf-8') + const lines = content.split('\n') + + // Apply offset and limit + const offset = (parsed.data.offset || 1) - 1 // Convert to 0-based + const limit = parsed.data.limit || DEFAULT_READ_LIMIT + + if (offset < 0 || offset >= lines.length) { + throw new Error(`Invalid offset: ${offset + 1}. File has ${lines.length} lines.`) + } + + const selectedLines = lines.slice(offset, offset + limit) + + // Format output with line numbers and truncate long lines + const output: string[] = [] + const relativePath = path.relative(baseDir, validPath) + + output.push(`File: ${relativePath}`) + if (offset > 0 || limit < lines.length) { + output.push(`Lines ${offset + 1} to ${Math.min(offset + limit, lines.length)} of ${lines.length}`) + } + output.push('') + + selectedLines.forEach((line, index) => { + const lineNumber = offset + index + 1 + const truncatedLine = line.length > MAX_LINE_LENGTH ? line.substring(0, MAX_LINE_LENGTH) + '...' 
: line + output.push(`${lineNumber.toString().padStart(6)}\t${truncatedLine}`) + }) + + if (offset + limit < lines.length) { + output.push('') + output.push(`(${lines.length - (offset + limit)} more lines not shown)`) + } + + return { + content: [ + { + type: 'text', + text: output.join('\n') + } + ] + } +} diff --git a/src/main/mcpServers/filesystem/tools/write.ts b/src/main/mcpServers/filesystem/tools/write.ts new file mode 100644 index 0000000000..2898f2f874 --- /dev/null +++ b/src/main/mcpServers/filesystem/tools/write.ts @@ -0,0 +1,83 @@ +import fs from 'fs/promises' +import path from 'path' +import * as z from 'zod' + +import { logger, validatePath } from '../types' + +// Schema definition +export const WriteToolSchema = z.object({ + file_path: z.string().describe('The path to the file to write'), + content: z.string().describe('The content to write to the file') +}) + +// Tool definition with detailed description +export const writeToolDefinition = { + name: 'write', + description: `Writes a file to the local filesystem. + +- This tool will overwrite the existing file if one exists at the path +- You MUST use the read tool first to understand what you're overwriting +- ALWAYS prefer using the 'edit' tool for existing files +- NEVER proactively create documentation files unless explicitly requested +- Parent directories will be created automatically if they don't exist +- The file_path must be an absolute path, not a relative path`, + inputSchema: z.toJSONSchema(WriteToolSchema) +} + +// Handler implementation +export async function handleWriteTool(args: unknown, baseDir: string) { + const parsed = WriteToolSchema.safeParse(args) + if (!parsed.success) { + throw new Error(`Invalid arguments for write: ${parsed.error}`) + } + + const filePath = parsed.data.file_path + const validPath = await validatePath(filePath, baseDir) + + // Create parent directory if it doesn't exist + const parentDir = path.dirname(validPath) + try { + await fs.mkdir(parentDir, { recursive: true }) + } catch (error: any) { + if (error.code !== 'EEXIST') { + throw new Error(`Failed to create parent directory: ${error.message}`) + } + } + + // Check if file exists (for logging) + let isOverwrite = false + try { + await fs.stat(validPath) + isOverwrite = true + } catch { + // File doesn't exist, that's fine + } + + // Write the file + try { + await fs.writeFile(validPath, parsed.data.content, 'utf-8') + } catch (error: any) { + throw new Error(`Failed to write file: ${error.message}`) + } + + // Log the operation + logger.info('File written', { + path: validPath, + overwrite: isOverwrite, + size: parsed.data.content.length + }) + + // Format output + const relativePath = path.relative(baseDir, validPath) + const action = isOverwrite ? 
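The read tool's line format, a right-aligned 1-based number, a tab, then the possibly truncated line, is exactly the prefix the edit tool's description tells the model to strip before quoting text back. The same numbering in isolation (numberLines is a hypothetical name):

// Formats file lines the way the read tool does: 1-based numbers padded to
// six columns, separated from the content by a tab.
function numberLines(text: string, offset = 1): string {
  return text
    .split('\n')
    .map((line, i) => `${String(offset + i).padStart(6)}\t${line}`)
    .join('\n')
}

console.log(numberLines('alpha\nbeta', 10))
//     10	alpha
//     11	beta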
'Updated' : 'Created' + const lines = parsed.data.content.split('\n').length + + return { + content: [ + { + type: 'text', + text: `${action} file: ${relativePath}\n` + `Size: ${parsed.data.content.length} bytes\n` + `Lines: ${lines}` + } + ] + } +} diff --git a/src/main/mcpServers/filesystem/types.ts b/src/main/mcpServers/filesystem/types.ts new file mode 100644 index 0000000000..922fe0b23a --- /dev/null +++ b/src/main/mcpServers/filesystem/types.ts @@ -0,0 +1,627 @@ +import { loggerService } from '@logger' +import { isMac, isWin } from '@main/constant' +import { spawn } from 'child_process' +import fs from 'fs/promises' +import os from 'os' +import path from 'path' + +export const logger = loggerService.withContext('MCP:FileSystemServer') + +// Constants +export const MAX_LINE_LENGTH = 2000 +export const DEFAULT_READ_LIMIT = 2000 +export const MAX_FILES_LIMIT = 100 +export const MAX_GREP_MATCHES = 100 + +// Common types +export interface FileInfo { + path: string + type: 'file' | 'directory' + size?: number + modified?: Date +} + +export interface GrepMatch { + file: string + line: number + content: string +} + +// Utility functions for path handling +export function normalizePath(p: string): string { + return path.normalize(p) +} + +export function expandHome(filepath: string): string { + if (filepath.startsWith('~/') || filepath === '~') { + return path.join(os.homedir(), filepath.slice(1)) + } + return filepath +} + +// Security validation +export async function validatePath(requestedPath: string, baseDir?: string): Promise { + const expandedPath = expandHome(requestedPath) + const root = baseDir ?? process.cwd() + const absolute = path.isAbsolute(expandedPath) ? path.resolve(expandedPath) : path.resolve(root, expandedPath) + + // Handle symlinks by checking their real path + try { + const realPath = await fs.realpath(absolute) + return normalizePath(realPath) + } catch (error) { + // For new files that don't exist yet, verify parent directory + const parentDir = path.dirname(absolute) + try { + const realParentPath = await fs.realpath(parentDir) + normalizePath(realParentPath) + return normalizePath(absolute) + } catch { + return normalizePath(absolute) + } + } +} + +// ============================================================================ +// Edit Tool Utilities - Fuzzy matching replacers from opencode +// ============================================================================ + +export type Replacer = (content: string, find: string) => Generator + +// Similarity thresholds for block anchor fallback matching +const SINGLE_CANDIDATE_SIMILARITY_THRESHOLD = 0.0 +const MULTIPLE_CANDIDATES_SIMILARITY_THRESHOLD = 0.3 + +/** + * Levenshtein distance algorithm implementation + */ +function levenshtein(a: string, b: string): number { + if (a === '' || b === '') { + return Math.max(a.length, b.length) + } + const matrix = Array.from({ length: a.length + 1 }, (_, i) => + Array.from({ length: b.length + 1 }, (_, j) => (i === 0 ? j : j === 0 ? i : 0)) + ) + + for (let i = 1; i <= a.length; i++) { + for (let j = 1; j <= b.length; j++) { + const cost = a[i - 1] === b[j - 1] ? 
0 : 1 + matrix[i][j] = Math.min(matrix[i - 1][j] + 1, matrix[i][j - 1] + 1, matrix[i - 1][j - 1] + cost) + } + } + return matrix[a.length][b.length] +} + +export const SimpleReplacer: Replacer = function* (_content, find) { + yield find +} + +export const LineTrimmedReplacer: Replacer = function* (content, find) { + const originalLines = content.split('\n') + const searchLines = find.split('\n') + + if (searchLines[searchLines.length - 1] === '') { + searchLines.pop() + } + + for (let i = 0; i <= originalLines.length - searchLines.length; i++) { + let matches = true + + for (let j = 0; j < searchLines.length; j++) { + const originalTrimmed = originalLines[i + j].trim() + const searchTrimmed = searchLines[j].trim() + + if (originalTrimmed !== searchTrimmed) { + matches = false + break + } + } + + if (matches) { + let matchStartIndex = 0 + for (let k = 0; k < i; k++) { + matchStartIndex += originalLines[k].length + 1 + } + + let matchEndIndex = matchStartIndex + for (let k = 0; k < searchLines.length; k++) { + matchEndIndex += originalLines[i + k].length + if (k < searchLines.length - 1) { + matchEndIndex += 1 + } + } + + yield content.substring(matchStartIndex, matchEndIndex) + } + } +} + +export const BlockAnchorReplacer: Replacer = function* (content, find) { + const originalLines = content.split('\n') + const searchLines = find.split('\n') + + if (searchLines.length < 3) { + return + } + + if (searchLines[searchLines.length - 1] === '') { + searchLines.pop() + } + + const firstLineSearch = searchLines[0].trim() + const lastLineSearch = searchLines[searchLines.length - 1].trim() + const searchBlockSize = searchLines.length + + const candidates: Array<{ startLine: number; endLine: number }> = [] + for (let i = 0; i < originalLines.length; i++) { + if (originalLines[i].trim() !== firstLineSearch) { + continue + } + + for (let j = i + 2; j < originalLines.length; j++) { + if (originalLines[j].trim() === lastLineSearch) { + candidates.push({ startLine: i, endLine: j }) + break + } + } + } + + if (candidates.length === 0) { + return + } + + if (candidates.length === 1) { + const { startLine, endLine } = candidates[0] + const actualBlockSize = endLine - startLine + 1 + + let similarity = 0 + const linesToCheck = Math.min(searchBlockSize - 2, actualBlockSize - 2) + + if (linesToCheck > 0) { + for (let j = 1; j < searchBlockSize - 1 && j < actualBlockSize - 1; j++) { + const originalLine = originalLines[startLine + j].trim() + const searchLine = searchLines[j].trim() + const maxLen = Math.max(originalLine.length, searchLine.length) + if (maxLen === 0) { + continue + } + const distance = levenshtein(originalLine, searchLine) + similarity += (1 - distance / maxLen) / linesToCheck + + if (similarity >= SINGLE_CANDIDATE_SIMILARITY_THRESHOLD) { + break + } + } + } else { + similarity = 1.0 + } + + if (similarity >= SINGLE_CANDIDATE_SIMILARITY_THRESHOLD) { + let matchStartIndex = 0 + for (let k = 0; k < startLine; k++) { + matchStartIndex += originalLines[k].length + 1 + } + let matchEndIndex = matchStartIndex + for (let k = startLine; k <= endLine; k++) { + matchEndIndex += originalLines[k].length + if (k < endLine) { + matchEndIndex += 1 + } + } + yield content.substring(matchStartIndex, matchEndIndex) + } + return + } + + let bestMatch: { startLine: number; endLine: number } | null = null + let maxSimilarity = -1 + + for (const candidate of candidates) { + const { startLine, endLine } = candidate + const actualBlockSize = endLine - startLine + 1 + + let similarity = 0 + const linesToCheck = 
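The Levenshtein routine here fills the full (a.length+1) x (b.length+1) matrix, which is fine for the short trimmed lines the block-anchor scoring compares. For longer inputs, the standard two-row refinement keeps O(n*m) time at linear memory; a sketch, not a drop-in replacement:

// Two-row Levenshtein: row i depends only on row i-1, so two buffers suffice.
function levenshtein2(a: string, b: string): number {
  let prev = Array.from({ length: b.length + 1 }, (_, j) => j)
  let curr = new Array<number>(b.length + 1)
  for (let i = 1; i <= a.length; i++) {
    curr[0] = i
    for (let j = 1; j <= b.length; j++) {
      const cost = a[i - 1] === b[j - 1] ? 0 : 1
      curr[j] = Math.min(prev[j] + 1, curr[j - 1] + 1, prev[j - 1] + cost)
    }
    ;[prev, curr] = [curr, prev]
  }
  return prev[b.length]
}

console.log(levenshtein2('kitten', 'sitting')) // 3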
Math.min(searchBlockSize - 2, actualBlockSize - 2) + + if (linesToCheck > 0) { + for (let j = 1; j < searchBlockSize - 1 && j < actualBlockSize - 1; j++) { + const originalLine = originalLines[startLine + j].trim() + const searchLine = searchLines[j].trim() + const maxLen = Math.max(originalLine.length, searchLine.length) + if (maxLen === 0) { + continue + } + const distance = levenshtein(originalLine, searchLine) + similarity += 1 - distance / maxLen + } + similarity /= linesToCheck + } else { + similarity = 1.0 + } + + if (similarity > maxSimilarity) { + maxSimilarity = similarity + bestMatch = candidate + } + } + + if (maxSimilarity >= MULTIPLE_CANDIDATES_SIMILARITY_THRESHOLD && bestMatch) { + const { startLine, endLine } = bestMatch + let matchStartIndex = 0 + for (let k = 0; k < startLine; k++) { + matchStartIndex += originalLines[k].length + 1 + } + let matchEndIndex = matchStartIndex + for (let k = startLine; k <= endLine; k++) { + matchEndIndex += originalLines[k].length + if (k < endLine) { + matchEndIndex += 1 + } + } + yield content.substring(matchStartIndex, matchEndIndex) + } +} + +export const WhitespaceNormalizedReplacer: Replacer = function* (content, find) { + const normalizeWhitespace = (text: string) => text.replace(/\s+/g, ' ').trim() + const normalizedFind = normalizeWhitespace(find) + + const lines = content.split('\n') + for (let i = 0; i < lines.length; i++) { + const line = lines[i] + if (normalizeWhitespace(line) === normalizedFind) { + yield line + } else { + const normalizedLine = normalizeWhitespace(line) + if (normalizedLine.includes(normalizedFind)) { + const words = find.trim().split(/\s+/) + if (words.length > 0) { + const pattern = words.map((word) => word.replace(/[.*+?^${}()|[\]\\]/g, '\\$&')).join('\\s+') + try { + const regex = new RegExp(pattern) + const match = line.match(regex) + if (match) { + yield match[0] + } + } catch { + // Invalid regex pattern, skip + } + } + } + } + } + + const findLines = find.split('\n') + if (findLines.length > 1) { + for (let i = 0; i <= lines.length - findLines.length; i++) { + const block = lines.slice(i, i + findLines.length) + if (normalizeWhitespace(block.join('\n')) === normalizedFind) { + yield block.join('\n') + } + } + } +} + +export const IndentationFlexibleReplacer: Replacer = function* (content, find) { + const removeIndentation = (text: string) => { + const lines = text.split('\n') + const nonEmptyLines = lines.filter((line) => line.trim().length > 0) + if (nonEmptyLines.length === 0) return text + + const minIndent = Math.min( + ...nonEmptyLines.map((line) => { + const match = line.match(/^(\s*)/) + return match ? match[1].length : 0 + }) + ) + + return lines.map((line) => (line.trim().length === 0 ? 
line : line.slice(minIndent))).join('\n') + } + + const normalizedFind = removeIndentation(find) + const contentLines = content.split('\n') + const findLines = find.split('\n') + + for (let i = 0; i <= contentLines.length - findLines.length; i++) { + const block = contentLines.slice(i, i + findLines.length).join('\n') + if (removeIndentation(block) === normalizedFind) { + yield block + } + } +} + +export const EscapeNormalizedReplacer: Replacer = function* (content, find) { + const unescapeString = (str: string): string => { + return str.replace(/\\(n|t|r|'|"|`|\\|\n|\$)/g, (match, capturedChar) => { + switch (capturedChar) { + case 'n': + return '\n' + case 't': + return '\t' + case 'r': + return '\r' + case "'": + return "'" + case '"': + return '"' + case '`': + return '`' + case '\\': + return '\\' + case '\n': + return '\n' + case '$': + return '$' + default: + return match + } + }) + } + + const unescapedFind = unescapeString(find) + + if (content.includes(unescapedFind)) { + yield unescapedFind + } + + const lines = content.split('\n') + const findLines = unescapedFind.split('\n') + + for (let i = 0; i <= lines.length - findLines.length; i++) { + const block = lines.slice(i, i + findLines.length).join('\n') + const unescapedBlock = unescapeString(block) + + if (unescapedBlock === unescapedFind) { + yield block + } + } +} + +export const TrimmedBoundaryReplacer: Replacer = function* (content, find) { + const trimmedFind = find.trim() + + if (trimmedFind === find) { + return + } + + if (content.includes(trimmedFind)) { + yield trimmedFind + } + + const lines = content.split('\n') + const findLines = find.split('\n') + + for (let i = 0; i <= lines.length - findLines.length; i++) { + const block = lines.slice(i, i + findLines.length).join('\n') + + if (block.trim() === trimmedFind) { + yield block + } + } +} + +export const ContextAwareReplacer: Replacer = function* (content, find) { + const findLines = find.split('\n') + if (findLines.length < 3) { + return + } + + if (findLines[findLines.length - 1] === '') { + findLines.pop() + } + + const contentLines = content.split('\n') + + const firstLine = findLines[0].trim() + const lastLine = findLines[findLines.length - 1].trim() + + for (let i = 0; i < contentLines.length; i++) { + if (contentLines[i].trim() !== firstLine) continue + + for (let j = i + 2; j < contentLines.length; j++) { + if (contentLines[j].trim() === lastLine) { + const blockLines = contentLines.slice(i, j + 1) + const block = blockLines.join('\n') + + if (blockLines.length === findLines.length) { + let matchingLines = 0 + let totalNonEmptyLines = 0 + + for (let k = 1; k < blockLines.length - 1; k++) { + const blockLine = blockLines[k].trim() + const findLine = findLines[k].trim() + + if (blockLine.length > 0 || findLine.length > 0) { + totalNonEmptyLines++ + if (blockLine === findLine) { + matchingLines++ + } + } + } + + if (totalNonEmptyLines === 0 || matchingLines / totalNonEmptyLines >= 0.5) { + yield block + break + } + } + break + } + } + } +} + +export const MultiOccurrenceReplacer: Replacer = function* (content, find) { + let startIndex = 0 + + while (true) { + const index = content.indexOf(find, startIndex) + if (index === -1) break + + yield find + startIndex = index + find.length + } +} + +/** + * All replacers in order of specificity + */ +export const ALL_REPLACERS: Replacer[] = [ + SimpleReplacer, + LineTrimmedReplacer, + BlockAnchorReplacer, + WhitespaceNormalizedReplacer, + IndentationFlexibleReplacer, + EscapeNormalizedReplacer, + TrimmedBoundaryReplacer, 
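Each replacer is a generator that proposes candidate substrings, and replaceWithFuzzyMatch below walks them from strictest to loosest, accepting the first candidate that occurs exactly once in the content. Extending the pipeline is therefore just another generator; a hypothetical case-insensitive strategy for illustration:

type Replacer = (content: string, find: string) => Generator<string, void, unknown>

// Hypothetical extra strategy: yield the exact substring of `content` whose
// lowercased form matches `find`, so the downstream indexOf check still works.
const CaseInsensitiveReplacer: Replacer = function* (content, find) {
  const haystack = content.toLowerCase()
  const needle = find.toLowerCase()
  let from = 0
  while (true) {
    const index = haystack.indexOf(needle, from)
    if (index === -1) return
    yield content.substring(index, index + find.length)
    from = index + needle.length
  }
}

// Candidates for 'hello' in mixed-case content: ['Hello', 'HELLO']
console.log([...CaseInsensitiveReplacer('Hello world, HELLO', 'hello')])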
+
+/**
+ * Replace oldString with newString in content using fuzzy matching
+ */
+export function replaceWithFuzzyMatch(
+  content: string,
+  oldString: string,
+  newString: string,
+  replaceAll = false
+): string {
+  if (oldString === newString) {
+    throw new Error('old_string and new_string must be different')
+  }
+
+  let notFound = true
+
+  for (const replacer of ALL_REPLACERS) {
+    for (const search of replacer(content, oldString)) {
+      const index = content.indexOf(search)
+      if (index === -1) continue
+      notFound = false
+      if (replaceAll) {
+        return content.replaceAll(search, newString)
+      }
+      const lastIndex = content.lastIndexOf(search)
+      if (index !== lastIndex) continue
+      return content.substring(0, index) + newString + content.substring(index + search.length)
+    }
+  }
+
+  if (notFound) {
+    throw new Error('old_string not found in content')
+  }
+  throw new Error(
+    'Found multiple matches for old_string. Provide more surrounding lines in old_string to identify the correct match.'
+  )
+}
+
+// ============================================================================
+// Binary File Detection
+// ============================================================================
+
+// Check if a file is likely binary
+export async function isBinaryFile(filePath: string): Promise<boolean> {
+  try {
+    const buffer = Buffer.alloc(4096)
+    const fd = await fs.open(filePath, 'r')
+    const { bytesRead } = await fd.read(buffer, 0, buffer.length, 0)
+    await fd.close()
+
+    if (bytesRead === 0) return false
+
+    const view = buffer.subarray(0, bytesRead)
+
+    let zeroBytes = 0
+    let evenZeros = 0
+    let oddZeros = 0
+    let nonPrintable = 0
+
+    for (let i = 0; i < view.length; i++) {
+      const b = view[i]
+
+      if (b === 0) {
+        zeroBytes++
+        if (i % 2 === 0) evenZeros++
+        else oddZeros++
+        continue
+      }
+
+      // treat common whitespace as printable
+      if (b === 9 || b === 10 || b === 13) continue
+
+      // basic ASCII printable range
+      if (b >= 32 && b <= 126) continue
+
+      // bytes >= 128 are likely part of UTF-8 sequences; count as printable
+      if (b >= 128) continue
+
+      nonPrintable++
+    }
+
+    // If there are lots of null bytes, it's probably binary unless it looks like UTF-16 text.
+    if (zeroBytes > 0) {
+      const evenSlots = Math.ceil(view.length / 2)
+      const oddSlots = Math.floor(view.length / 2)
+      const evenZeroRatio = evenSlots > 0 ? evenZeros / evenSlots : 0
+      const oddZeroRatio = oddSlots > 0 ? oddZeros / oddSlots : 0
+
+      // UTF-16LE/BE tends to have zeros on every other byte.
+      if (evenZeroRatio > 0.7 || oddZeroRatio > 0.7) return false
+
+      if (zeroBytes / view.length > 0.05) return true
+    }
+
+    // Heuristic: too many non-printable bytes => binary.
+    return nonPrintable / view.length > 0.3
+  } catch {
+    return false
+  }
+}
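End to end, the fuzzy-replace entry point tries each replacer in order and only commits when the located match is unambiguous. A usage sketch with made-up inputs (the import path is hypothetical):

import { replaceWithFuzzyMatch } from './fuzzyReplace' // hypothetical module path

const content = ['if (ok) {', '    doWork()', '}'].join('\n')

// The caller's old_string uses 2-space indentation while the file uses 4 spaces,
// so an exact indexOf misses, but one of the looser replacers (trimmed-line
// comparison) still locates the block and the edit succeeds.
const oldString = ['if (ok) {', '  doWork()', '}'].join('\n')
const newString = ['if (ok) {', '  doWorkSafely()', '}'].join('\n')

replaceWithFuzzyMatch(content, oldString, newString)
// => 'if (ok) {\n  doWorkSafely()\n}'
// If the block occurred twice, the call would throw the multiple-matches error
// instead of guessing, unless replaceAll were passed.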
+
+// ============================================================================
+// Ripgrep Utilities
+// ============================================================================
+
+export interface RipgrepResult {
+  ok: boolean
+  stdout: string
+  exitCode: number | null
+}
+
+export function getRipgrepAddonPath(): string {
+  const pkgJsonPath = require.resolve('@anthropic-ai/claude-agent-sdk/package.json')
+  const pkgRoot = path.dirname(pkgJsonPath)
+  const platform = isMac ? 'darwin' : isWin ? 'win32' : 'linux'
+  const arch = process.arch === 'arm64' ? 'arm64' : 'x64'
+  return path.join(pkgRoot, 'vendor', 'ripgrep', `${arch}-${platform}`, 'ripgrep.node')
+}
+
+export async function runRipgrep(args: string[]): Promise<RipgrepResult> {
+  const addonPath = getRipgrepAddonPath()
+  const childScript = `const { ripgrepMain } = require(process.env.RIPGREP_ADDON_PATH); process.exit(ripgrepMain(process.argv.slice(1)));`
+
+  return new Promise((resolve) => {
+    const child = spawn(process.execPath, ['--eval', childScript, 'rg', ...args], {
+      cwd: process.cwd(),
+      env: {
+        ...process.env,
+        ELECTRON_RUN_AS_NODE: '1',
+        RIPGREP_ADDON_PATH: addonPath
+      },
+      stdio: ['ignore', 'pipe', 'pipe']
+    })
+
+    let stdout = ''
+
+    child.stdout?.on('data', (chunk) => {
+      stdout += chunk.toString('utf-8')
+    })
+
+    child.on('error', () => {
+      resolve({ ok: false, stdout: '', exitCode: null })
+    })
+
+    child.on('close', (code) => {
+      resolve({ ok: true, stdout, exitCode: code })
+    })
+  })
+}
diff --git a/src/main/services/ConfigManager.ts b/src/main/services/ConfigManager.ts
index c693d4b05a..6f2bbd44a4 100644
--- a/src/main/services/ConfigManager.ts
+++ b/src/main/services/ConfigManager.ts
@@ -32,7 +32,8 @@ export enum ConfigKeys {
   Proxy = 'proxy',
   EnableDeveloperMode = 'enableDeveloperMode',
   ClientId = 'clientId',
-  GitBashPath = 'gitBashPath'
+  GitBashPath = 'gitBashPath',
+  GitBashPathSource = 'gitBashPathSource' // 'manual' | 'auto' | null
 }
 
 export class ConfigManager {
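For callers the helper behaves like invoking rg on the command line, with ripgrep's usual exit-code convention (1 means no matches, not failure). A small consumption sketch (the arguments are illustrative; --json is ripgrep's standard structured output):

// Hypothetical caller of the runRipgrep helper above.
async function countTodos(): Promise<number> {
  const result = await runRipgrep(['--json', 'TODO', 'src'])

  if (!result.ok) return 0 // spawning the child process failed
  if (result.exitCode === 1) return 0 // ripgrep found nothing

  // `rg --json` emits one JSON object per line; count only match records.
  return result.stdout
    .split('\n')
    .filter(Boolean)
    .map((line) => JSON.parse(line))
    .filter((event) => event.type === 'match').length
}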
diff --git a/src/main/services/MCPService.ts b/src/main/services/MCPService.ts
index cc6bbaa366..ebdc2247fc 100644
--- a/src/main/services/MCPService.ts
+++ b/src/main/services/MCPService.ts
@@ -249,6 +249,26 @@ class McpService {
     StdioClientTransport | SSEClientTransport | InMemoryTransport | StreamableHTTPClientTransport
   > => {
     // Create appropriate transport based on configuration
+
+    // Special case for nowledgeMem - uses HTTP transport instead of in-memory
+    if (isBuiltinMCPServer(server) && server.name === BuiltinMCPServerNames.nowledgeMem) {
+      const nowledgeMemUrl = 'http://127.0.0.1:14242/mcp'
+      const options: StreamableHTTPClientTransportOptions = {
+        fetch: async (url, init) => {
+          return net.fetch(typeof url === 'string' ? url : url.toString(), init)
+        },
+        requestInit: {
+          headers: {
+            ...defaultAppHeaders(),
+            APP: 'Cherry Studio'
+          }
+        },
+        authProvider
+      }
+      getServerLogger(server).debug(`Using StreamableHTTPClientTransport for ${server.name}`)
+      return new StreamableHTTPClientTransport(new URL(nowledgeMemUrl), options)
+    }
+
     if (isBuiltinMCPServer(server) && server.name !== BuiltinMCPServerNames.mcpAutoInstall) {
       getServerLogger(server).debug(`Using in-memory transport`)
       const [clientTransport, serverTransport] = InMemoryTransport.createLinkedPair()
diff --git a/src/main/services/agents/services/claudecode/index.ts b/src/main/services/agents/services/claudecode/index.ts
index 689c177ff5..50dd5a6d3d 100644
--- a/src/main/services/agents/services/claudecode/index.ts
+++ b/src/main/services/agents/services/claudecode/index.ts
@@ -15,8 +15,8 @@ import { query } from '@anthropic-ai/claude-agent-sdk'
 import { loggerService } from '@logger'
 import { config as apiConfigService } from '@main/apiServer/config'
 import { validateModelId } from '@main/apiServer/utils'
-import { ConfigKeys, configManager } from '@main/services/ConfigManager'
-import { validateGitBashPath } from '@main/utils/process'
+import { isWin } from '@main/constant'
+import { autoDiscoverGitBash } from '@main/utils/process'
 import getLoginShellEnvironment from '@main/utils/shell-env'
 import { app } from 'electron'
 
@@ -105,7 +105,8 @@ class ClaudeCodeService implements AgentServiceInterface {
       Object.entries(loginShellEnv).filter(([key]) => !key.toLowerCase().endsWith('_proxy'))
     ) as Record<string, string>
 
-    const customGitBashPath = validateGitBashPath(configManager.get(ConfigKeys.GitBashPath) as string | undefined)
+    // Auto-discover Git Bash path on Windows (already logs internally)
+    const customGitBashPath = isWin ? autoDiscoverGitBash() : null
 
     // Route through local API Server which handles format conversion via unified adapter
     // This enables Claude Code Agent to work with any provider (OpenAI, Gemini, etc.)
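Both hunks above move resolution to call time: the MCP transport is chosen per server, and Git Bash is discovered only when the agent actually starts. A sketch of how the resolved pieces plausibly feed the child environment for the SDK session (the ANTHROPIC_* variable names are the standard Anthropic client overrides, and CLAUDE_CODE_GIT_BASH_PATH is the override read back by autoDiscoverGitBash later in this patch; the exact wiring in this file may differ):

// Sketch only: assembling the agent child-process environment.
function buildAgentEnv(
  loginShellEnv: Record<string, string>,
  apiHost: string,
  apiKey: string
): Record<string, string> {
  const env: Record<string, string> = {
    ...loginShellEnv,
    ANTHROPIC_BASE_URL: apiHost, // the local API server doing format conversion
    ANTHROPIC_API_KEY: apiKey
  }
  const gitBash = isWin ? autoDiscoverGitBash() : null
  if (gitBash) {
    env.CLAUDE_CODE_GIT_BASH_PATH = gitBash // Claude Code's POSIX shell on Windows
  }
  return env
}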
diff --git a/src/main/utils/__tests__/process.test.ts b/src/main/utils/__tests__/process.test.ts index 0485ec5fad..a1ac2fd9a5 100644 --- a/src/main/utils/__tests__/process.test.ts +++ b/src/main/utils/__tests__/process.test.ts @@ -1,9 +1,21 @@ +import { configManager } from '@main/services/ConfigManager' import { execFileSync } from 'child_process' import fs from 'fs' import path from 'path' import { beforeEach, describe, expect, it, vi } from 'vitest' -import { findExecutable, findGitBash, validateGitBashPath } from '../process' +import { autoDiscoverGitBash, findExecutable, findGitBash, validateGitBashPath } from '../process' + +// Mock configManager +vi.mock('@main/services/ConfigManager', () => ({ + ConfigKeys: { + GitBashPath: 'gitBashPath' + }, + configManager: { + get: vi.fn(), + set: vi.fn() + } +})) // Mock dependencies vi.mock('child_process') @@ -695,4 +707,284 @@ describe.skipIf(process.platform !== 'win32')('process utilities', () => { }) }) }) + + describe('autoDiscoverGitBash', () => { + const originalEnvVar = process.env.CLAUDE_CODE_GIT_BASH_PATH + + beforeEach(() => { + vi.mocked(configManager.get).mockReset() + vi.mocked(configManager.set).mockReset() + delete process.env.CLAUDE_CODE_GIT_BASH_PATH + }) + + afterEach(() => { + // Restore original environment variable + if (originalEnvVar !== undefined) { + process.env.CLAUDE_CODE_GIT_BASH_PATH = originalEnvVar + } else { + delete process.env.CLAUDE_CODE_GIT_BASH_PATH + } + }) + + /** + * Helper to mock fs.existsSync with a set of valid paths + */ + const mockExistingPaths = (...validPaths: string[]) => { + vi.mocked(fs.existsSync).mockImplementation((p) => validPaths.includes(p as string)) + } + + describe('with no existing config path', () => { + it('should discover and persist Git Bash path when not configured', () => { + const bashPath = 'C:\\Program Files\\Git\\bin\\bash.exe' + const gitPath = 'C:\\Program Files\\Git\\cmd\\git.exe' + + vi.mocked(configManager.get).mockReturnValue(undefined) + process.env.ProgramFiles = 'C:\\Program Files' + mockExistingPaths(gitPath, bashPath) + + const result = autoDiscoverGitBash() + + expect(result).toBe(bashPath) + expect(configManager.set).toHaveBeenCalledWith('gitBashPath', bashPath) + }) + + it('should return null and not persist when Git Bash is not found', () => { + vi.mocked(configManager.get).mockReturnValue(undefined) + vi.mocked(fs.existsSync).mockReturnValue(false) + vi.mocked(execFileSync).mockImplementation(() => { + throw new Error('Not found') + }) + + const result = autoDiscoverGitBash() + + expect(result).toBeNull() + expect(configManager.set).not.toHaveBeenCalled() + }) + }) + + describe('environment variable precedence', () => { + it('should use env var over valid config path', () => { + const envPath = 'C:\\EnvGit\\bin\\bash.exe' + const configPath = 'C:\\ConfigGit\\bin\\bash.exe' + + process.env.CLAUDE_CODE_GIT_BASH_PATH = envPath + vi.mocked(configManager.get).mockReturnValue(configPath) + mockExistingPaths(envPath, configPath) + + const result = autoDiscoverGitBash() + + // Env var should take precedence + expect(result).toBe(envPath) + // Should not persist env var path (it's a runtime override) + expect(configManager.set).not.toHaveBeenCalled() + }) + + it('should fall back to config path when env var is invalid', () => { + const envPath = 'C:\\Invalid\\bash.exe' + const configPath = 'C:\\ConfigGit\\bin\\bash.exe' + + process.env.CLAUDE_CODE_GIT_BASH_PATH = envPath + vi.mocked(configManager.get).mockReturnValue(configPath) + // Env path is invalid (doesn't 
exist), only config path exists + mockExistingPaths(configPath) + + const result = autoDiscoverGitBash() + + // Should fall back to config path + expect(result).toBe(configPath) + expect(configManager.set).not.toHaveBeenCalled() + }) + + it('should fall back to auto-discovery when both env var and config are invalid', () => { + const envPath = 'C:\\InvalidEnv\\bash.exe' + const configPath = 'C:\\InvalidConfig\\bash.exe' + const discoveredPath = 'C:\\Program Files\\Git\\bin\\bash.exe' + const gitPath = 'C:\\Program Files\\Git\\cmd\\git.exe' + + process.env.CLAUDE_CODE_GIT_BASH_PATH = envPath + process.env.ProgramFiles = 'C:\\Program Files' + vi.mocked(configManager.get).mockReturnValue(configPath) + // Both env and config paths are invalid, only standard Git exists + mockExistingPaths(gitPath, discoveredPath) + + const result = autoDiscoverGitBash() + + expect(result).toBe(discoveredPath) + expect(configManager.set).toHaveBeenCalledWith('gitBashPath', discoveredPath) + }) + }) + + describe('with valid existing config path', () => { + it('should validate and return existing path without re-discovering', () => { + const existingPath = 'C:\\CustomGit\\bin\\bash.exe' + + vi.mocked(configManager.get).mockReturnValue(existingPath) + mockExistingPaths(existingPath) + + const result = autoDiscoverGitBash() + + expect(result).toBe(existingPath) + // Should not call findGitBash or persist again + expect(configManager.set).not.toHaveBeenCalled() + // Should not call execFileSync (which findGitBash would use for discovery) + expect(execFileSync).not.toHaveBeenCalled() + }) + + it('should not override existing valid config with auto-discovery', () => { + const existingPath = 'C:\\CustomGit\\bin\\bash.exe' + const discoveredPath = 'C:\\Program Files\\Git\\bin\\bash.exe' + + vi.mocked(configManager.get).mockReturnValue(existingPath) + mockExistingPaths(existingPath, discoveredPath) + + const result = autoDiscoverGitBash() + + expect(result).toBe(existingPath) + expect(configManager.set).not.toHaveBeenCalled() + }) + }) + + describe('with invalid existing config path', () => { + it('should attempt auto-discovery when existing path does not exist', () => { + const existingPath = 'C:\\NonExistent\\bin\\bash.exe' + const discoveredPath = 'C:\\Program Files\\Git\\bin\\bash.exe' + const gitPath = 'C:\\Program Files\\Git\\cmd\\git.exe' + + vi.mocked(configManager.get).mockReturnValue(existingPath) + process.env.ProgramFiles = 'C:\\Program Files' + // Invalid path doesn't exist, but Git is installed at standard location + mockExistingPaths(gitPath, discoveredPath) + + const result = autoDiscoverGitBash() + + // Should discover and return the new path + expect(result).toBe(discoveredPath) + // Should persist the discovered path (overwrites invalid) + expect(configManager.set).toHaveBeenCalledWith('gitBashPath', discoveredPath) + }) + + it('should attempt auto-discovery when existing path is not bash.exe', () => { + const existingPath = 'C:\\CustomGit\\bin\\git.exe' + const discoveredPath = 'C:\\Program Files\\Git\\bin\\bash.exe' + const gitPath = 'C:\\Program Files\\Git\\cmd\\git.exe' + + vi.mocked(configManager.get).mockReturnValue(existingPath) + process.env.ProgramFiles = 'C:\\Program Files' + // Invalid path exists but is not bash.exe (validation will fail) + // Git is installed at standard location + mockExistingPaths(existingPath, gitPath, discoveredPath) + + const result = autoDiscoverGitBash() + + // Should discover and return the new path + expect(result).toBe(discoveredPath) + // Should persist the 
discovered path (overwrites invalid) + expect(configManager.set).toHaveBeenCalledWith('gitBashPath', discoveredPath) + }) + + it('should return null when existing path is invalid and discovery fails', () => { + const existingPath = 'C:\\NonExistent\\bin\\bash.exe' + + vi.mocked(configManager.get).mockReturnValue(existingPath) + vi.mocked(fs.existsSync).mockReturnValue(false) + vi.mocked(execFileSync).mockImplementation(() => { + throw new Error('Not found') + }) + + const result = autoDiscoverGitBash() + + // Both validation and discovery failed + expect(result).toBeNull() + // Should not persist when discovery fails + expect(configManager.set).not.toHaveBeenCalled() + }) + }) + + describe('config persistence verification', () => { + it('should persist discovered path with correct config key', () => { + const bashPath = 'C:\\Program Files\\Git\\bin\\bash.exe' + const gitPath = 'C:\\Program Files\\Git\\cmd\\git.exe' + + vi.mocked(configManager.get).mockReturnValue(undefined) + process.env.ProgramFiles = 'C:\\Program Files' + mockExistingPaths(gitPath, bashPath) + + autoDiscoverGitBash() + + // Verify the exact call to configManager.set + expect(configManager.set).toHaveBeenCalledTimes(1) + expect(configManager.set).toHaveBeenCalledWith('gitBashPath', bashPath) + }) + + it('should persist on each discovery when config remains undefined', () => { + const bashPath = 'C:\\Program Files\\Git\\bin\\bash.exe' + const gitPath = 'C:\\Program Files\\Git\\cmd\\git.exe' + + vi.mocked(configManager.get).mockReturnValue(undefined) + process.env.ProgramFiles = 'C:\\Program Files' + mockExistingPaths(gitPath, bashPath) + + autoDiscoverGitBash() + autoDiscoverGitBash() + + // Each call discovers and persists since config remains undefined (mocked) + expect(configManager.set).toHaveBeenCalledTimes(2) + }) + }) + + describe('real-world scenarios', () => { + it('should discover and persist standard Git for Windows installation', () => { + const gitPath = 'C:\\Program Files\\Git\\cmd\\git.exe' + const bashPath = 'C:\\Program Files\\Git\\bin\\bash.exe' + + vi.mocked(configManager.get).mockReturnValue(undefined) + process.env.ProgramFiles = 'C:\\Program Files' + mockExistingPaths(gitPath, bashPath) + + const result = autoDiscoverGitBash() + + expect(result).toBe(bashPath) + expect(configManager.set).toHaveBeenCalledWith('gitBashPath', bashPath) + }) + + it('should discover portable Git via where.exe and persist', () => { + const gitPath = 'D:\\PortableApps\\Git\\bin\\git.exe' + const bashPath = 'D:\\PortableApps\\Git\\bin\\bash.exe' + + vi.mocked(configManager.get).mockReturnValue(undefined) + + vi.mocked(fs.existsSync).mockImplementation((p) => { + const pathStr = p?.toString() || '' + // Common git paths don't exist + if (pathStr.includes('Program Files\\Git\\cmd\\git.exe')) return false + if (pathStr.includes('Program Files (x86)\\Git\\cmd\\git.exe')) return false + // Portable bash path exists + if (pathStr === bashPath) return true + return false + }) + + vi.mocked(execFileSync).mockReturnValue(gitPath) + + const result = autoDiscoverGitBash() + + expect(result).toBe(bashPath) + expect(configManager.set).toHaveBeenCalledWith('gitBashPath', bashPath) + }) + + it('should respect user-configured path over auto-discovery', () => { + const userConfiguredPath = 'D:\\MyGit\\bin\\bash.exe' + const systemPath = 'C:\\Program Files\\Git\\bin\\bash.exe' + + vi.mocked(configManager.get).mockReturnValue(userConfiguredPath) + mockExistingPaths(userConfiguredPath, systemPath) + + const result = autoDiscoverGitBash() + + 
expect(result).toBe(userConfiguredPath) + expect(configManager.set).not.toHaveBeenCalled() + // Verify findGitBash was not called for discovery + expect(execFileSync).not.toHaveBeenCalled() + }) + }) + }) }) diff --git a/src/main/utils/process.ts b/src/main/utils/process.ts index 7175af7e75..ccc0f66535 100644 --- a/src/main/utils/process.ts +++ b/src/main/utils/process.ts @@ -1,4 +1,5 @@ import { loggerService } from '@logger' +import type { GitBashPathInfo, GitBashPathSource } from '@shared/config/constant' import { HOME_CHERRY_DIR } from '@shared/config/constant' import { execFileSync, spawn } from 'child_process' import fs from 'fs' @@ -6,6 +7,7 @@ import os from 'os' import path from 'path' import { isWin } from '../constant' +import { ConfigKeys, configManager } from '../services/ConfigManager' import { getResourcePath } from '.' const logger = loggerService.withContext('Utils:Process') @@ -59,7 +61,7 @@ export async function getBinaryPath(name?: string): Promise { export async function isBinaryExists(name: string): Promise { const cmd = await getBinaryPath(name) - return await fs.existsSync(cmd) + return fs.existsSync(cmd) } /** @@ -225,3 +227,77 @@ export function validateGitBashPath(customPath?: string | null): string | null { logger.debug('Validated custom Git Bash path', { path: resolved }) return resolved } + +/** + * Auto-discover and persist Git Bash path if not already configured + * Only called when Git Bash is actually needed + * + * Precedence order: + * 1. CLAUDE_CODE_GIT_BASH_PATH environment variable (highest - runtime override) + * 2. Configured path from settings (manual or auto) + * 3. Auto-discovery via findGitBash (only if no valid config exists) + */ +export function autoDiscoverGitBash(): string | null { + if (!isWin) { + return null + } + + // 1. Check environment variable override first (highest priority) + const envOverride = process.env.CLAUDE_CODE_GIT_BASH_PATH + if (envOverride) { + const validated = validateGitBashPath(envOverride) + if (validated) { + logger.debug('Using CLAUDE_CODE_GIT_BASH_PATH override', { path: validated }) + return validated + } + logger.warn('CLAUDE_CODE_GIT_BASH_PATH provided but path is invalid', { path: envOverride }) + } + + // 2. Check if a path is already configured + const existingPath = configManager.get(ConfigKeys.GitBashPath) + const existingSource = configManager.get(ConfigKeys.GitBashPathSource) + + if (existingPath) { + const validated = validateGitBashPath(existingPath) + if (validated) { + return validated + } + // Existing path is invalid, try to auto-discover + logger.warn('Existing Git Bash path is invalid, attempting auto-discovery', { + path: existingPath, + source: existingSource + }) + } + + // 3. Try to find Git Bash via auto-discovery + const discoveredPath = findGitBash() + if (discoveredPath) { + // Persist the discovered path with 'auto' source + configManager.set(ConfigKeys.GitBashPath, discoveredPath) + configManager.set(ConfigKeys.GitBashPathSource, 'auto') + logger.info('Auto-discovered Git Bash path', { path: discoveredPath }) + } + + return discoveredPath +} + +/** + * Get Git Bash path info including source + * If no path is configured, triggers auto-discovery first + */ +export function getGitBashPathInfo(): GitBashPathInfo { + if (!isWin) { + return { path: null, source: null } + } + + let path = configManager.get(ConfigKeys.GitBashPath) ?? null + let source = configManager.get(ConfigKeys.GitBashPathSource) ?? 
null
+
+  // If no path configured, trigger auto-discovery (handles upgrade from old versions)
+  if (!path) {
+    path = autoDiscoverGitBash()
+    source = path ? 'auto' : null
+  }
+
+  return { path, source }
+}
diff --git a/src/preload/index.ts b/src/preload/index.ts
index 117bec3b91..dc08e9a2df 100644
--- a/src/preload/index.ts
+++ b/src/preload/index.ts
@@ -2,7 +2,7 @@ import type { PermissionUpdate } from '@anthropic-ai/claude-agent-sdk'
 import { electronAPI } from '@electron-toolkit/preload'
 import type { SpanEntity, TokenUsage } from '@mcp-trace/trace-core'
 import type { SpanContext } from '@opentelemetry/api'
-import type { TerminalConfig, UpgradeChannel } from '@shared/config/constant'
+import type { GitBashPathInfo, TerminalConfig, UpgradeChannel } from '@shared/config/constant'
 import type { LogLevel, LogSourceWithContext } from '@shared/config/logger'
 import type { FileChangeEvent, WebviewKeyEvent } from '@shared/config/types'
 import type { MCPServerLogEntry } from '@shared/config/types'
@@ -126,6 +126,7 @@ const api = {
     getCpuName: () => ipcRenderer.invoke(IpcChannel.System_GetCpuName),
     checkGitBash: (): Promise<boolean> => ipcRenderer.invoke(IpcChannel.System_CheckGitBash),
     getGitBashPath: (): Promise<string | null> => ipcRenderer.invoke(IpcChannel.System_GetGitBashPath),
+    getGitBashPathInfo: (): Promise<GitBashPathInfo> => ipcRenderer.invoke(IpcChannel.System_GetGitBashPathInfo),
     setGitBashPath: (newPath: string | null): Promise<void> =>
       ipcRenderer.invoke(IpcChannel.System_SetGitBashPath, newPath)
   },
diff --git a/src/renderer/src/aiCore/legacy/clients/openai/OpenAIApiClient.ts b/src/renderer/src/aiCore/legacy/clients/openai/OpenAIApiClient.ts
index d839da8964..73a5bed4fe 100644
--- a/src/renderer/src/aiCore/legacy/clients/openai/OpenAIApiClient.ts
+++ b/src/renderer/src/aiCore/legacy/clients/openai/OpenAIApiClient.ts
@@ -142,6 +142,10 @@ export class OpenAIAPIClient extends OpenAIBaseClient<
       return { thinking: { type: reasoningEffort ?
'enabled' : 'disabled' } } } + if (reasoningEffort === 'default') { + return {} + } + if (!reasoningEffort) { // DeepSeek hybrid inference models, v3.1 and maybe more in the future // 不同的 provider 有不同的思考控制方式,在这里统一解决 @@ -303,7 +307,7 @@ export class OpenAIAPIClient extends OpenAIBaseClient< // Grok models/Perplexity models/OpenAI models if (isSupportedReasoningEffortModel(model)) { // 检查模型是否支持所选选项 - const supportedOptions = getModelSupportedReasoningEffortOptions(model) + const supportedOptions = getModelSupportedReasoningEffortOptions(model)?.filter((option) => option !== 'default') if (supportedOptions?.includes(reasoningEffort)) { return { reasoning_effort: reasoningEffort diff --git a/src/renderer/src/aiCore/middleware/AiSdkMiddlewareBuilder.ts b/src/renderer/src/aiCore/middleware/AiSdkMiddlewareBuilder.ts index 6f1ec709b8..ae83df4f3f 100644 --- a/src/renderer/src/aiCore/middleware/AiSdkMiddlewareBuilder.ts +++ b/src/renderer/src/aiCore/middleware/AiSdkMiddlewareBuilder.ts @@ -8,14 +8,12 @@ import { isOllamaProvider, isSupportEnableThinkingProvider } from '@renderer/uti import { openrouterReasoningMiddleware, skipGeminiThoughtSignatureMiddleware } from '@shared/middleware' import type { LanguageModelMiddleware } from 'ai' import { extractReasoningMiddleware, simulateStreamingMiddleware } from 'ai' -import { isEmpty } from 'lodash' import { getAiSdkProviderId } from '../provider/factory' import { isOpenRouterGeminiGenerateImageModel } from '../utils/image' import { noThinkMiddleware } from './noThinkMiddleware' import { openrouterGenerateImageMiddleware } from './openrouterGenerateImageMiddleware' import { qwenThinkingMiddleware } from './qwenThinkingMiddleware' -import { toolChoiceMiddleware } from './toolChoiceMiddleware' const logger = loggerService.withContext('AiSdkMiddlewareBuilder') @@ -135,15 +133,6 @@ export class AiSdkMiddlewareBuilder { export function buildAiSdkMiddlewares(config: AiSdkMiddlewareConfig): LanguageModelMiddleware[] { const builder = new AiSdkMiddlewareBuilder() - // 0. 知识库强制调用中间件(必须在最前面,确保第一轮强制调用知识库) - if (!isEmpty(config.assistant?.knowledge_bases?.map((base) => base.id)) && config.knowledgeRecognition !== 'on') { - builder.add({ - name: 'force-knowledge-first', - middleware: toolChoiceMiddleware('builtin_knowledge_search') - }) - logger.debug('Added toolChoice middleware to force knowledge base search on first round') - } - // 1. 
根据provider添加特定中间件 if (config.provider) { addProviderSpecificMiddlewares(builder, config) diff --git a/src/renderer/src/aiCore/plugins/searchOrchestrationPlugin.ts b/src/renderer/src/aiCore/plugins/searchOrchestrationPlugin.ts index 6be577f194..5b095a4461 100644 --- a/src/renderer/src/aiCore/plugins/searchOrchestrationPlugin.ts +++ b/src/renderer/src/aiCore/plugins/searchOrchestrationPlugin.ts @@ -31,7 +31,7 @@ import { webSearchToolWithPreExtractedKeywords } from '../tools/WebSearchTool' const logger = loggerService.withContext('SearchOrchestrationPlugin') -const getMessageContent = (message: ModelMessage) => { +export const getMessageContent = (message: ModelMessage) => { if (typeof message.content === 'string') return message.content return message.content.reduce((acc, part) => { if (part.type === 'text') { @@ -266,14 +266,14 @@ export const searchOrchestrationPlugin = (assistant: Assistant, topicId: string) // 判断是否需要各种搜索 const knowledgeBaseIds = assistant.knowledge_bases?.map((base) => base.id) const hasKnowledgeBase = !isEmpty(knowledgeBaseIds) - const knowledgeRecognition = assistant.knowledgeRecognition || 'on' + const knowledgeRecognition = assistant.knowledgeRecognition || 'off' const globalMemoryEnabled = selectGlobalMemoryEnabled(store.getState()) const shouldWebSearch = !!assistant.webSearchProviderId const shouldKnowledgeSearch = hasKnowledgeBase && knowledgeRecognition === 'on' const shouldMemorySearch = globalMemoryEnabled && assistant.enableMemory // 执行意图分析 - if (shouldWebSearch || hasKnowledgeBase) { + if (shouldWebSearch || shouldKnowledgeSearch) { const analysisResult = await analyzeSearchIntent(lastUserMessage, assistant, { shouldWebSearch, shouldKnowledgeSearch, @@ -330,41 +330,25 @@ export const searchOrchestrationPlugin = (assistant: Assistant, topicId: string) // 📚 知识库搜索工具配置 const knowledgeBaseIds = assistant.knowledge_bases?.map((base) => base.id) const hasKnowledgeBase = !isEmpty(knowledgeBaseIds) - const knowledgeRecognition = assistant.knowledgeRecognition || 'on' + const knowledgeRecognition = assistant.knowledgeRecognition || 'off' + const shouldKnowledgeSearch = hasKnowledgeBase && knowledgeRecognition === 'on' - if (hasKnowledgeBase) { - if (knowledgeRecognition === 'off') { - // off 模式:直接添加知识库搜索工具,使用用户消息作为搜索关键词 + if (shouldKnowledgeSearch) { + // on 模式:根据意图识别结果决定是否添加工具 + const needsKnowledgeSearch = + analysisResult?.knowledge && + analysisResult.knowledge.question && + analysisResult.knowledge.question[0] !== 'not_needed' + + if (needsKnowledgeSearch && analysisResult.knowledge) { + // logger.info('📚 Adding knowledge search tool (intent-based)') const userMessage = userMessages[context.requestId] - const fallbackKeywords = { - question: [getMessageContent(userMessage) || 'search'], - rewrite: getMessageContent(userMessage) || 'search' - } - // logger.info('📚 Adding knowledge search tool (force mode)') params.tools['builtin_knowledge_search'] = knowledgeSearchTool( assistant, - fallbackKeywords, + analysisResult.knowledge, getMessageContent(userMessage), topicId ) - // params.toolChoice = { type: 'tool', toolName: 'builtin_knowledge_search' } - } else { - // on 模式:根据意图识别结果决定是否添加工具 - const needsKnowledgeSearch = - analysisResult?.knowledge && - analysisResult.knowledge.question && - analysisResult.knowledge.question[0] !== 'not_needed' - - if (needsKnowledgeSearch && analysisResult.knowledge) { - // logger.info('📚 Adding knowledge search tool (intent-based)') - const userMessage = userMessages[context.requestId] - params.tools['builtin_knowledge_search'] = 
knowledgeSearchTool( - assistant, - analysisResult.knowledge, - getMessageContent(userMessage), - topicId - ) - } } } diff --git a/src/renderer/src/aiCore/prepareParams/__tests__/model-parameters.test.ts b/src/renderer/src/aiCore/prepareParams/__tests__/model-parameters.test.ts index 70b4ac84b7..a4f345e3e5 100644 --- a/src/renderer/src/aiCore/prepareParams/__tests__/model-parameters.test.ts +++ b/src/renderer/src/aiCore/prepareParams/__tests__/model-parameters.test.ts @@ -18,7 +18,7 @@ vi.mock('@renderer/services/AssistantService', () => ({ toolUseMode: assistant.settings?.toolUseMode ?? 'prompt', defaultModel: assistant.defaultModel, customParameters: assistant.settings?.customParameters ?? [], - reasoning_effort: assistant.settings?.reasoning_effort, + reasoning_effort: assistant.settings?.reasoning_effort ?? 'default', reasoning_effort_cache: assistant.settings?.reasoning_effort_cache, qwenThinkMode: assistant.settings?.qwenThinkMode }) diff --git a/src/renderer/src/aiCore/utils/__tests__/reasoning.test.ts b/src/renderer/src/aiCore/utils/__tests__/reasoning.test.ts index fec4d197e3..df7d69d0c2 100644 --- a/src/renderer/src/aiCore/utils/__tests__/reasoning.test.ts +++ b/src/renderer/src/aiCore/utils/__tests__/reasoning.test.ts @@ -11,6 +11,7 @@ import { beforeEach, describe, expect, it, vi } from 'vitest' import { getAnthropicReasoningParams, + getAnthropicThinkingBudget, getBedrockReasoningParams, getCustomParameters, getGeminiReasoningParams, @@ -89,7 +90,8 @@ vi.mock('@renderer/config/models', async (importOriginal) => { isQwenAlwaysThinkModel: vi.fn(() => false), isSupportedThinkingTokenHunyuanModel: vi.fn(() => false), isSupportedThinkingTokenModel: vi.fn(() => false), - isGPT51SeriesModel: vi.fn(() => false) + isGPT51SeriesModel: vi.fn(() => false), + findTokenLimit: vi.fn(actual.findTokenLimit) } }) @@ -596,7 +598,7 @@ describe('reasoning utils', () => { expect(result).toEqual({}) }) - it('should return disabled thinking when no reasoning effort', async () => { + it('should return disabled thinking when reasoning effort is none', async () => { const { isReasoningModel, isSupportedThinkingTokenClaudeModel } = await import('@renderer/config/models') vi.mocked(isReasoningModel).mockReturnValue(true) @@ -611,7 +613,9 @@ describe('reasoning utils', () => { const assistant: Assistant = { id: 'test', name: 'Test', - settings: {} + settings: { + reasoning_effort: 'none' + } } as Assistant const result = getAnthropicReasoningParams(assistant, model) @@ -647,7 +651,7 @@ describe('reasoning utils', () => { expect(result).toEqual({ thinking: { type: 'enabled', - budgetTokens: 2048 + budgetTokens: 4096 } }) }) @@ -675,7 +679,7 @@ describe('reasoning utils', () => { expect(result).toEqual({}) }) - it('should disable thinking for Flash models without reasoning effort', async () => { + it('should disable thinking for Flash models when reasoning effort is none', async () => { const { isReasoningModel, isSupportedThinkingTokenGeminiModel } = await import('@renderer/config/models') vi.mocked(isReasoningModel).mockReturnValue(true) @@ -690,7 +694,9 @@ describe('reasoning utils', () => { const assistant: Assistant = { id: 'test', name: 'Test', - settings: {} + settings: { + reasoning_effort: 'none' + } } as Assistant const result = getGeminiReasoningParams(assistant, model) @@ -725,7 +731,7 @@ describe('reasoning utils', () => { const result = getGeminiReasoningParams(assistant, model) expect(result).toEqual({ thinkingConfig: { - thinkingBudget: 16448, + thinkingBudget: expect.any(Number), 
includeThoughts: true } }) @@ -889,7 +895,7 @@ describe('reasoning utils', () => { expect(result).toEqual({ reasoningConfig: { type: 'enabled', - budgetTokens: 2048 + budgetTokens: 4096 } }) }) @@ -990,4 +996,89 @@ describe('reasoning utils', () => { }) }) }) + + describe('getAnthropicThinkingBudget', () => { + it('should return undefined when reasoningEffort is undefined', async () => { + const result = getAnthropicThinkingBudget(4096, undefined, 'claude-3-7-sonnet') + expect(result).toBeUndefined() + }) + + it('should return undefined when reasoningEffort is none', async () => { + const result = getAnthropicThinkingBudget(4096, 'none', 'claude-3-7-sonnet') + expect(result).toBeUndefined() + }) + + it('should return undefined when tokenLimit is not found', async () => { + const { findTokenLimit } = await import('@renderer/config/models') + vi.mocked(findTokenLimit).mockReturnValue(undefined) + + const result = getAnthropicThinkingBudget(4096, 'medium', 'unknown-model') + expect(result).toBeUndefined() + }) + + it('should calculate budget correctly when maxTokens is provided', async () => { + const { findTokenLimit } = await import('@renderer/config/models') + vi.mocked(findTokenLimit).mockReturnValue({ min: 1024, max: 32768 }) + + const result = getAnthropicThinkingBudget(4096, 'medium', 'claude-3-7-sonnet') + // EFFORT_RATIO['medium'] = 0.5 + // budget = Math.floor((32768 - 1024) * 0.5 + 1024) + // = Math.floor(31744 * 0.5 + 1024) = Math.floor(15872 + 1024) = 16896 + // budgetTokens = Math.min(16896, 4096) = 4096 + // result = Math.max(1024, 4096) = 4096 + expect(result).toBe(4096) + }) + + it('should use tokenLimit.max when maxTokens is undefined', async () => { + const { findTokenLimit } = await import('@renderer/config/models') + vi.mocked(findTokenLimit).mockReturnValue({ min: 1024, max: 32768 }) + + const result = getAnthropicThinkingBudget(undefined, 'medium', 'claude-3-7-sonnet') + // When maxTokens is undefined, budget is not constrained by maxTokens + // EFFORT_RATIO['medium'] = 0.5 + // budget = Math.floor((32768 - 1024) * 0.5 + 1024) + // = Math.floor(31744 * 0.5 + 1024) = Math.floor(15872 + 1024) = 16896 + // result = Math.max(1024, 16896) = 16896 + expect(result).toBe(16896) + }) + + it('should enforce minimum budget of 1024', async () => { + const { findTokenLimit } = await import('@renderer/config/models') + vi.mocked(findTokenLimit).mockReturnValue({ min: 100, max: 1000 }) + + const result = getAnthropicThinkingBudget(500, 'low', 'claude-3-7-sonnet') + // EFFORT_RATIO['low'] = 0.05 + // budget = Math.floor((1000 - 100) * 0.05 + 100) + // = Math.floor(900 * 0.05 + 100) = Math.floor(45 + 100) = 145 + // budgetTokens = Math.min(145, 500) = 145 + // result = Math.max(1024, 145) = 1024 + expect(result).toBe(1024) + }) + + it('should respect effort ratio for high reasoning effort', async () => { + const { findTokenLimit } = await import('@renderer/config/models') + vi.mocked(findTokenLimit).mockReturnValue({ min: 1024, max: 32768 }) + + const result = getAnthropicThinkingBudget(8192, 'high', 'claude-3-7-sonnet') + // EFFORT_RATIO['high'] = 0.8 + // budget = Math.floor((32768 - 1024) * 0.8 + 1024) + // = Math.floor(31744 * 0.8 + 1024) = Math.floor(25395.2 + 1024) = 26419 + // budgetTokens = Math.min(26419, 8192) = 8192 + // result = Math.max(1024, 8192) = 8192 + expect(result).toBe(8192) + }) + + it('should use full token limit when maxTokens is undefined and reasoning effort is high', async () => { + const { findTokenLimit } = await import('@renderer/config/models') + 
vi.mocked(findTokenLimit).mockReturnValue({ min: 1024, max: 32768 }) + + const result = getAnthropicThinkingBudget(undefined, 'high', 'claude-3-7-sonnet') + // When maxTokens is undefined, budget is not constrained by maxTokens + // EFFORT_RATIO['high'] = 0.8 + // budget = Math.floor((32768 - 1024) * 0.8 + 1024) + // = Math.floor(31744 * 0.8 + 1024) = Math.floor(25395.2 + 1024) = 26419 + // result = Math.max(1024, 26419) = 26419 + expect(result).toBe(26419) + }) + }) }) diff --git a/src/renderer/src/aiCore/utils/reasoning.ts b/src/renderer/src/aiCore/utils/reasoning.ts index f182405714..a2364d97e1 100644 --- a/src/renderer/src/aiCore/utils/reasoning.ts +++ b/src/renderer/src/aiCore/utils/reasoning.ts @@ -10,6 +10,7 @@ import { GEMINI_FLASH_MODEL_REGEX, getModelSupportedReasoningEffortOptions, isDeepSeekHybridInferenceModel, + isDoubaoSeed18Model, isDoubaoSeedAfter251015, isDoubaoThinkingAutoModel, isGemini3ThinkingTokenModel, @@ -28,6 +29,7 @@ import { isSupportedThinkingTokenDoubaoModel, isSupportedThinkingTokenGeminiModel, isSupportedThinkingTokenHunyuanModel, + isSupportedThinkingTokenMiMoModel, isSupportedThinkingTokenModel, isSupportedThinkingTokenQwenModel, isSupportedThinkingTokenZhipuModel @@ -64,7 +66,7 @@ export function getReasoningEffort(assistant: Assistant, model: Model): Reasonin // reasoningEffort is not set, no extra reasoning setting // Generally, for every model which supports reasoning control, the reasoning effort won't be undefined. // It's for some reasoning models that don't support reasoning control, such as deepseek reasoner. - if (!reasoningEffort) { + if (!reasoningEffort || reasoningEffort === 'default') { return {} } @@ -329,7 +331,7 @@ export function getReasoningEffort(assistant: Assistant, model: Model): Reasonin // Grok models/Perplexity models/OpenAI models, use reasoning_effort if (isSupportedReasoningEffortModel(model)) { // 检查模型是否支持所选选项 - const supportedOptions = getModelSupportedReasoningEffortOptions(model) + const supportedOptions = getModelSupportedReasoningEffortOptions(model)?.filter((option) => option !== 'default') if (supportedOptions?.includes(reasoningEffort)) { return { reasoningEffort @@ -389,7 +391,7 @@ export function getReasoningEffort(assistant: Assistant, model: Model): Reasonin // Use thinking, doubao, zhipu, etc. 
 if (isSupportedThinkingTokenDoubaoModel(model)) {
-    if (isDoubaoSeedAfter251015(model)) {
+    if (isDoubaoSeedAfter251015(model) || isDoubaoSeed18Model(model)) {
       return { reasoningEffort }
     }
     if (reasoningEffort === 'high') {
@@ -408,6 +410,12 @@
     return { thinking: { type: 'enabled' } }
   }
 
+  if (isSupportedThinkingTokenMiMoModel(model)) {
+    return {
+      thinking: { type: 'enabled' }
+    }
+  }
+
   // Default case: no special thinking settings
   return {}
 }
@@ -427,7 +435,7 @@
 
   let reasoningEffort = assistant?.settings?.reasoning_effort
 
-  if (!reasoningEffort) {
+  if (!reasoningEffort || reasoningEffort === 'default') {
     return {}
   }
 
@@ -479,16 +487,14 @@
     return undefined
   }
 
-  const budgetTokens = Math.max(
-    1024,
-    Math.floor(
-      Math.min(
-        (tokenLimit.max - tokenLimit.min) * effortRatio + tokenLimit.min,
-        (maxTokens || DEFAULT_MAX_TOKENS) * effortRatio
-      )
-    )
-  )
-  return budgetTokens
+  const budget = Math.floor((tokenLimit.max - tokenLimit.min) * effortRatio + tokenLimit.min)
+
+  let budgetTokens = budget
+  if (maxTokens !== undefined) {
+    budgetTokens = Math.min(budget, maxTokens)
+  }
+
+  return Math.max(1024, budgetTokens)
 }
 
 /**
@@ -505,7 +511,11 @@
 
   const reasoningEffort = assistant?.settings?.reasoning_effort
 
-  if (reasoningEffort === undefined || reasoningEffort === 'none') {
+  if (!reasoningEffort || reasoningEffort === 'default') {
+    return {}
+  }
+
+  if (reasoningEffort === 'none') {
     return {
       thinking: {
         type: 'disabled'
@@ -560,6 +570,10 @@ export function getGeminiReasoningParams(
 
   const reasoningEffort = assistant?.settings?.reasoning_effort
 
+  if (!reasoningEffort || reasoningEffort === 'default') {
+    return {}
+  }
+
   // Gemini reasoning parameters
   if (isSupportedThinkingTokenGeminiModel(model)) {
     if (reasoningEffort === undefined || reasoningEffort === 'none') {
@@ -620,10 +634,6 @@ export function getXAIReasoningParams(assistant: Assistant, model: Model): Pick<
 
   const { reasoning_effort: reasoningEffort } = getAssistantSettings(assistant)
 
-  if (!reasoningEffort || reasoningEffort === 'none') {
-    return {}
-  }
-
   switch (reasoningEffort) {
     case 'auto':
     case 'minimal':
@@ -634,6 +644,10 @@
       return { reasoningEffort }
     case 'xhigh':
       return { reasoningEffort: 'high' }
+    case 'default':
+    case 'none':
+    default:
+      return {}
   }
 }
 
@@ -650,7 +664,7 @@ export function getBedrockReasoningParams(
 
   const reasoningEffort = assistant?.settings?.reasoning_effort
 
-  if (reasoningEffort === undefined) {
+  if (reasoningEffort === undefined || reasoningEffort === 'default') {
     return {}
   }
diff --git a/src/renderer/src/assets/images/models/mimo.svg b/src/renderer/src/assets/images/models/mimo.svg
new file mode 100644
index 0000000000..82370fece3
--- /dev/null
+++ b/src/renderer/src/assets/images/models/mimo.svg
@@ -0,0 +1,17 @@
+[17 lines of SVG markup lost in extraction]
diff --git a/src/renderer/src/assets/images/providers/mimo.svg b/src/renderer/src/assets/images/providers/mimo.svg
new file mode 100644
index 0000000000..82370fece3
--- /dev/null
+++ b/src/renderer/src/assets/images/providers/mimo.svg
@@ -0,0 +1,17 @@
+[17 lines of SVG markup lost in extraction]
diff --git a/src/renderer/src/components/Icons/SVGIcon.tsx b/src/renderer/src/components/Icons/SVGIcon.tsx
index ad503f0e38..82be6b340e 100644
--- a/src/renderer/src/components/Icons/SVGIcon.tsx
+++ b/src/renderer/src/components/Icons/SVGIcon.tsx
@@ -113,6 +113,18 @@ export function MdiLightbulbOn(props: SVGProps<SVGSVGElement>) {
   )
 }
 
+export function MdiLightbulbQuestion(props: SVGProps<SVGSVGElement>) {
+  // {/* Icon from Material Design Icons by Pictogrammers - https://github.com/Templarian/MaterialDesign/blob/master/LICENSE */}
+  return (
+    [SVG markup lost in extraction]
+  )
+}
+
 export function BingLogo(props: SVGProps<SVGSVGElement>) {
   return (
[BingLogo's SVG body, the remainder of this hunk, and the diff header plus import hunk of the agent modal component were lost in extraction]
 = ({ agent, afterSubmit, resolve }) => {
   const isEditing = (agent?: AgentWithTools) => agent !== undefined
   const [form, setForm] = useState(() => buildAgentForm(agent))
-  const [hasGitBash, setHasGitBash] = useState(true)
-  const [customGitBashPath, setCustomGitBashPath] = useState('')
+  const [gitBashPathInfo, setGitBashPathInfo] = useState<GitBashPathInfo>({ path: null, source: null })
 
   useEffect(() => {
     if (open) {
@@ -68,29 +69,15 @@
     }
   }, [agent, open])
 
-  const checkGitBash = useCallback(
-    async (showToast = false) => {
-      try {
-        const [gitBashInstalled, savedPath] = await Promise.all([
-          window.api.system.checkGitBash(),
-          window.api.system.getGitBashPath().catch(() => null)
-        ])
-        setCustomGitBashPath(savedPath ?? '')
-        setHasGitBash(gitBashInstalled)
-        if (showToast) {
-          if (gitBashInstalled) {
-            window.toast.success(t('agent.gitBash.success', 'Git Bash detected successfully!'))
-          } else {
-            window.toast.error(t('agent.gitBash.notFound', 'Git Bash not found. Please install it first.'))
-          }
-        }
-      } catch (error) {
-        logger.error('Failed to check Git Bash:', error as Error)
-        setHasGitBash(true) // Default to true on error to avoid false warnings
-      }
-    },
-    [t]
-  )
+  const checkGitBash = useCallback(async () => {
+    if (!isWin) return
+    try {
+      const pathInfo = await window.api.system.getGitBashPathInfo()
+      setGitBashPathInfo(pathInfo)
+    } catch (error) {
+      logger.error('Failed to check Git Bash:', error as Error)
+    }
+  }, [])
 
   useEffect(() => {
     checkGitBash()
@@ -119,24 +106,22 @@
         return
       }
 
-      setCustomGitBashPath(pickedPath)
-      await checkGitBash(true)
+      await checkGitBash()
     } catch (error) {
       logger.error('Failed to pick Git Bash path', error as Error)
       window.toast.error(t('agent.gitBash.pick.failed', 'Failed to set Git Bash path'))
     }
   }, [checkGitBash, t])
 
-  const handleClearGitBash = useCallback(async () => {
+  const handleResetGitBash = useCallback(async () => {
     try {
+      // Clear manual setting and re-run auto-discovery
       await window.api.system.setGitBashPath(null)
-      setCustomGitBashPath('')
-      await checkGitBash(true)
+      await checkGitBash()
     } catch (error) {
-      logger.error('Failed to clear Git Bash path', error as Error)
-      window.toast.error(t('agent.gitBash.pick.failed', 'Failed to set Git Bash path'))
+      logger.error('Failed to reset Git Bash path', error as Error)
     }
-  }, [checkGitBash, t])
+  }, [checkGitBash])
 
   const onPermissionModeChange = useCallback((value: PermissionMode) => {
     setForm((prev) => {
@@ -268,6 +253,12 @@
       return
     }
 
+    if (isWin && !gitBashPathInfo.path) {
+      window.toast.error(t('agent.gitBash.error.required', 'Git Bash path is required on Windows'))
+      loadingRef.current = false
+      return
+    }
+
     if (isEditing(agent)) {
       if (!agent) {
         loadingRef.current = false
@@ -327,7 +318,8 @@
       t,
       updateAgent,
       afterSubmit,
-      addAgent
+      addAgent,
+      gitBashPathInfo.path
     ]
   )
 
@@ -346,66 +338,6 @@ const PopupContainer: React.FC = ({ agent, afterSubmit, resolve }) => {
       footer={null}>
-        {!hasGitBash && (
-          [error Alert markup partially lost in extraction]
-                {t(
-                  'agent.gitBash.error.description',
-                  'Git Bash is required to run agents on Windows. The agent cannot function without it. Please install Git for Windows from'
-                )}{' '}
-                [link tag lost in extraction] onClick={(e) => {
-                    e.preventDefault()
-                    window.api.openWebsite('https://git-scm.com/download/win')
-                  }}
-                  style={{ textDecoration: 'underline' }}>
-                  git-scm.com
-                [closing markup lost in extraction]
-            }
-            type="error"
-            showIcon
-            style={{ marginBottom: 16 }}
-          />
-        )}
-
-        {hasGitBash && customGitBashPath && (
-          [success Alert markup partially lost in extraction]
-              {t('agent.gitBash.customPath', {
-                defaultValue: 'Using custom path: {{path}}',
-                path: customGitBashPath
-              })}
-            [action button markup lost in extraction]
-            }
-            type="success"
-            showIcon
-            style={{ marginBottom: 16 }}
-          />
-        )}
+        {isWin && (
+          [container markup partially lost in extraction]
+            {gitBashPathInfo.source === 'manual' && (
+              [reset button markup lost in extraction]
+            )}
+            {gitBashPathInfo.path && gitBashPathInfo.source === 'auto' && (
+              {t('agent.gitBash.autoDiscoveredHint', 'Auto-discovered')}
+            )}
+        )}
+
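Taken together, the main-process discovery, the new GitBashPathSource config key, and the preload bridge give the renderer a single call that answers with both the path and how it was obtained. A minimal consumption sketch (the hook name is illustrative; window.api.system is the bridge registered in the preload hunk above):

import { useCallback, useEffect, useState } from 'react'
import type { GitBashPathInfo } from '@shared/config/constant'

// Illustrative hook mirroring what the agent modal above does inline.
export function useGitBashPathInfo() {
  const [info, setInfo] = useState<GitBashPathInfo>({ path: null, source: null })

  const refresh = useCallback(async () => {
    // Triggers auto-discovery in the main process if nothing is configured yet.
    setInfo(await window.api.system.getGitBashPathInfo())
  }, [])

  useEffect(() => {
    refresh()
  }, [refresh])

  return { ...info, refresh }
}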