From 8e1ebf29b21b0cb62216fdb7694beeb26dfd4e14 Mon Sep 17 00:00:00 2001 From: 1600822305 <1600822305@qq.com> Date: Fri, 11 Apr 2025 00:43:13 +0800 Subject: [PATCH] =?UTF-8?q?=E6=B7=BB=E5=8A=A0=E4=BA=86=20TTS=20=E7=9B=B8?= =?UTF-8?q?=E5=85=B3=E6=9C=8D=E5=8A=A1=E5=B9=B6=E6=9B=B4=E6=96=B0=E4=BA=86?= =?UTF-8?q?=E8=AE=BE=E7=BD=AE?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- package.json | 1 + packages/shared/IpcChannel.ts | 4 + src/main/index.ts | 4 + src/main/ipc.ts | 9 + src/main/services/FileService.ts | 9 +- src/main/services/MsEdgeTTSService.ts | 93 ++ src/main/services/MsTTSIpcHandler.ts | 18 + src/main/services/MsTTSService.ts | 236 ++++ src/preload/index.ts | 7 +- src/renderer/src/components/TTSButton.tsx | 1 + src/renderer/src/i18n/locales/en-us.json | 28 +- src/renderer/src/i18n/locales/zh-cn.json | 30 +- .../pages/home/Messages/MessageMenubar.tsx | 5 +- .../src/pages/home/Messages/TTSStopButton.tsx | 2 +- .../settings/TTSSettings/ASRSettings.tsx | 1 - .../settings/TTSSettings/TTSSettings.tsx | 405 ++++-- src/renderer/src/services/TTSService.ts | 1197 +---------------- .../src/services/tts/EdgeTTSService.ts | 270 ++++ src/renderer/src/services/tts/MsTTSService.ts | 58 + .../src/services/tts/OpenAITTSService.ts | 92 ++ .../src/services/tts/SiliconflowTTSService.ts | 116 ++ src/renderer/src/services/tts/TTSService.ts | 240 ++++ .../src/services/tts/TTSServiceFactory.ts | 70 + .../src/services/tts/TTSServiceInterface.ts | 12 + .../src/services/tts/TTSTextFilter.ts | 148 ++ src/renderer/src/services/tts/index.ts | 7 + src/renderer/src/store/settings.ts | 56 +- yarn.lock | 16 +- 28 files changed, 1859 insertions(+), 1276 deletions(-) create mode 100644 src/main/services/MsEdgeTTSService.ts create mode 100644 src/main/services/MsTTSIpcHandler.ts create mode 100644 src/main/services/MsTTSService.ts create mode 100644 src/renderer/src/services/tts/EdgeTTSService.ts create mode 100644 src/renderer/src/services/tts/MsTTSService.ts create mode 100644 src/renderer/src/services/tts/OpenAITTSService.ts create mode 100644 src/renderer/src/services/tts/SiliconflowTTSService.ts create mode 100644 src/renderer/src/services/tts/TTSService.ts create mode 100644 src/renderer/src/services/tts/TTSServiceFactory.ts create mode 100644 src/renderer/src/services/tts/TTSServiceInterface.ts create mode 100644 src/renderer/src/services/tts/TTSTextFilter.ts create mode 100644 src/renderer/src/services/tts/index.ts diff --git a/package.json b/package.json index 36002abd87..406960c2c1 100644 --- a/package.json +++ b/package.json @@ -87,6 +87,7 @@ "got-scraping": "^4.1.1", "jsdom": "^26.0.0", "markdown-it": "^14.1.0", + "node-edge-tts": "^1.2.8", "officeparser": "^4.1.1", "proxy-agent": "^6.5.0", "tar": "^7.4.3", diff --git a/packages/shared/IpcChannel.ts b/packages/shared/IpcChannel.ts index 0946491bb6..5975737b0c 100644 --- a/packages/shared/IpcChannel.ts +++ b/packages/shared/IpcChannel.ts @@ -22,6 +22,10 @@ export enum IpcChannel { Asr_StartServer = 'start-asr-server', Asr_StopServer = 'stop-asr-server', + // MsTTS + MsTTS_GetVoices = 'mstts:get-voices', + MsTTS_Synthesize = 'mstts:synthesize', + // Open Open_Path = 'open:path', Open_Website = 'open:website', diff --git a/src/main/index.ts b/src/main/index.ts index 816695bb2d..127518b648 100644 --- a/src/main/index.ts +++ b/src/main/index.ts @@ -7,6 +7,7 @@ import installExtension, { REACT_DEVELOPER_TOOLS, REDUX_DEVTOOLS } from 'electro import { registerIpc } from './ipc' import { configManager } from 
'./services/ConfigManager' import { CHERRY_STUDIO_PROTOCOL, handleProtocolUrl, registerProtocolClient } from './services/ProtocolClient' +import { registerMsTTSIpcHandlers } from './services/MsTTSIpcHandler' import { registerShortcuts } from './services/ShortcutService' import { TrayService } from './services/TrayService' import { windowService } from './services/WindowService' @@ -46,6 +47,9 @@ if (!app.requestSingleInstanceLock()) { registerIpc(mainWindow, app) + // 注册MsTTS IPC处理程序 + registerMsTTSIpcHandlers() + replaceDevtoolsFont(mainWindow) if (process.env.NODE_ENV === 'development') { diff --git a/src/main/ipc.ts b/src/main/ipc.ts index 1bd7318dbd..f2df60fe0e 100644 --- a/src/main/ipc.ts +++ b/src/main/ipc.ts @@ -23,6 +23,7 @@ import ObsidianVaultService from './services/ObsidianVaultService' import { ProxyConfig, proxyManager } from './services/ProxyManager' import { asrServerService } from './services/ASRServerService' import { searchService } from './services/SearchService' +import * as MsTTSService from './services/MsTTSService' import { registerShortcuts, unregisterAllShortcuts } from './services/ShortcutService' import { TrayService } from './services/TrayService' import { windowService } from './services/WindowService' @@ -309,4 +310,12 @@ export function registerIpc(mainWindow: BrowserWindow, app: Electron.App) { // 注册ASR服务器IPC处理程序 asrServerService.registerIpcHandlers() + + // 注册MsTTS IPC处理程序 + ipcMain.handle(IpcChannel.MsTTS_GetVoices, MsTTSService.getVoices) + ipcMain.handle( + IpcChannel.MsTTS_Synthesize, + (_, text: string, voice: string, outputFormat: string) => + MsTTSService.synthesize(text, voice, outputFormat) + ) } diff --git a/src/main/services/FileService.ts b/src/main/services/FileService.ts index 39255e15f7..01837fe382 100644 --- a/src/main/services/FileService.ts +++ b/src/main/services/FileService.ts @@ -1,7 +1,12 @@ import fs from 'node:fs' export default class FileService { - public static async readFile(_: Electron.IpcMainInvokeEvent, path: string) { - return fs.readFileSync(path, 'utf8') + public static async readFile(_: Electron.IpcMainInvokeEvent, path: string, encoding?: BufferEncoding) { + // 如果指定了编码,则返回字符串,否则返回二进制数据 + if (encoding) { + return fs.readFileSync(path, encoding) + } else { + return fs.readFileSync(path) + } } } diff --git a/src/main/services/MsEdgeTTSService.ts b/src/main/services/MsEdgeTTSService.ts new file mode 100644 index 0000000000..fdf31e2edb --- /dev/null +++ b/src/main/services/MsEdgeTTSService.ts @@ -0,0 +1,93 @@ +import { EdgeTTS } from 'node-edge-tts'; +import fs from 'node:fs'; +import path from 'node:path'; +import { app } from 'electron'; +import log from 'electron-log'; + +/** + * Microsoft Edge TTS服务 + * 使用Microsoft Edge的在线TTS服务,不需要API密钥 + */ +class MsEdgeTTSService { + private static instance: MsEdgeTTSService; + private tts: EdgeTTS; + private tempDir: string; + + private constructor() { + this.tts = new EdgeTTS(); + this.tempDir = path.join(app.getPath('temp'), 'cherry-tts'); + + // 确保临时目录存在 + if (!fs.existsSync(this.tempDir)) { + fs.mkdirSync(this.tempDir, { recursive: true }); + } + } + + /** + * 获取单例实例 + */ + public static getInstance(): MsEdgeTTSService { + if (!MsEdgeTTSService.instance) { + MsEdgeTTSService.instance = new MsEdgeTTSService(); + } + return MsEdgeTTSService.instance; + } + + /** + * 获取可用的语音列表 + * @returns 语音列表 + */ + public async getVoices(): Promise { + try { + // 返回预定义的中文语音列表 + return [ + { name: 'zh-CN-XiaoxiaoNeural', locale: 'zh-CN', gender: 'Female' }, + { name: 'zh-CN-YunxiNeural', locale: 
'zh-CN', gender: 'Male' }, + { name: 'zh-CN-YunyangNeural', locale: 'zh-CN', gender: 'Male' }, + { name: 'zh-CN-XiaohanNeural', locale: 'zh-CN', gender: 'Female' }, + { name: 'zh-CN-XiaomoNeural', locale: 'zh-CN', gender: 'Female' }, + { name: 'zh-CN-XiaoxuanNeural', locale: 'zh-CN', gender: 'Female' }, + { name: 'zh-CN-XiaoruiNeural', locale: 'zh-CN', gender: 'Female' }, + { name: 'zh-CN-YunfengNeural', locale: 'zh-CN', gender: 'Male' }, + ]; + } catch (error) { + log.error('获取Microsoft Edge TTS语音列表失败:', error); + throw error; + } + } + + /** + * 合成语音 + * @param text 要合成的文本 + * @param voice 语音 + * @param outputFormat 输出格式 + * @returns 音频文件路径 + */ + public async synthesize(text: string, voice: string, outputFormat: string): Promise { + try { + // 设置TTS参数 + await this.tts.setMetadata(voice, outputFormat); + + // 生成临时文件路径 + const timestamp = Date.now(); + const outputPath = path.join(this.tempDir, `tts_${timestamp}.mp3`); + + // 合成语音 + await this.tts.toFile(outputPath, text); + + return outputPath; + } catch (error) { + log.error('Microsoft Edge TTS语音合成失败:', error); + throw error; + } + } +} + +// 导出单例方法 +export const getVoices = async () => { + return await MsEdgeTTSService.getInstance().getVoices(); +}; + +export const synthesize = async (text: string, voice: string, outputFormat: string) => { + return await MsEdgeTTSService.getInstance().synthesize(text, voice, outputFormat); +}; diff --git a/src/main/services/MsTTSIpcHandler.ts b/src/main/services/MsTTSIpcHandler.ts new file mode 100644 index 0000000000..24a31f8e23 --- /dev/null +++ b/src/main/services/MsTTSIpcHandler.ts @@ -0,0 +1,18 @@ +import { IpcChannel } from '@shared/IpcChannel'; +import { ipcMain } from 'electron'; +import * as MsTTSService from './MsTTSService'; + +/** + * 注册MsTTS相关的IPC处理程序 + */ +export function registerMsTTSIpcHandlers(): void { + // 获取可用的语音列表 + ipcMain.handle(IpcChannel.MsTTS_GetVoices, MsTTSService.getVoices); + + // 合成语音 + ipcMain.handle( + IpcChannel.MsTTS_Synthesize, + (_, text: string, voice: string, outputFormat: string) => + MsTTSService.synthesize(text, voice, outputFormat) + ); +} diff --git a/src/main/services/MsTTSService.ts b/src/main/services/MsTTSService.ts new file mode 100644 index 0000000000..1d7fcf42f3 --- /dev/null +++ b/src/main/services/MsTTSService.ts @@ -0,0 +1,236 @@ +import { EdgeTTS } from 'node-edge-tts'; // listVoices is no longer needed here +import fs from 'node:fs'; +import path from 'node:path'; +import { app } from 'electron'; +import log from 'electron-log'; + +// --- START OF HARDCODED VOICE LIST --- +// WARNING: This list is static and may become outdated. +// It's generally recommended to use listVoices() for the most up-to-date list. 
+const hardcodedVoices = [ + { Name: 'Microsoft Server Speech Text to Speech Voice (af-ZA, AdriNeural)', ShortName: 'af-ZA-AdriNeural', Gender: 'Female', Locale: 'af-ZA' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (am-ET, MekdesNeural)', ShortName: 'am-ET-MekdesNeural', Gender: 'Female', Locale: 'am-ET' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (ar-AE, FatimaNeural)', ShortName: 'ar-AE-FatimaNeural', Gender: 'Female', Locale: 'ar-AE' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (ar-AE, HamdanNeural)', ShortName: 'ar-AE-HamdanNeural', Gender: 'Male', Locale: 'ar-AE' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (ar-BH, AliNeural)', ShortName: 'ar-BH-AliNeural', Gender: 'Male', Locale: 'ar-BH' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (ar-BH, LailaNeural)', ShortName: 'ar-BH-LailaNeural', Gender: 'Female', Locale: 'ar-BH' }, + // ... (Many other Arabic locales/voices) ... + { Name: 'Microsoft Server Speech Text to Speech Voice (ar-SA, ZariyahNeural)', ShortName: 'ar-SA-ZariyahNeural', Gender: 'Female', Locale: 'ar-SA' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (az-AZ, BabekNeural)', ShortName: 'az-AZ-BabekNeural', Gender: 'Male', Locale: 'az-AZ' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (az-AZ, BanuNeural)', ShortName: 'az-AZ-BanuNeural', Gender: 'Female', Locale: 'az-AZ' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (bg-BG, BorislavNeural)', ShortName: 'bg-BG-BorislavNeural', Gender: 'Male', Locale: 'bg-BG' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (bg-BG, KalinaNeural)', ShortName: 'bg-BG-KalinaNeural', Gender: 'Female', Locale: 'bg-BG' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (bn-BD, NabanitaNeural)', ShortName: 'bn-BD-NabanitaNeural', Gender: 'Female', Locale: 'bn-BD' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (bn-BD, PradeepNeural)', ShortName: 'bn-BD-PradeepNeural', Gender: 'Male', Locale: 'bn-BD' }, + // ... (Catalan, Czech, Welsh, Danish, German, Greek, English variants) ... 
+ { Name: 'Microsoft Server Speech Text to Speech Voice (en-AU, NatashaNeural)', ShortName: 'en-AU-NatashaNeural', Gender: 'Female', Locale: 'en-AU' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-AU, WilliamNeural)', ShortName: 'en-AU-WilliamNeural', Gender: 'Male', Locale: 'en-AU' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-CA, ClaraNeural)', ShortName: 'en-CA-ClaraNeural', Gender: 'Female', Locale: 'en-CA' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-CA, LiamNeural)', ShortName: 'en-CA-LiamNeural', Gender: 'Male', Locale: 'en-CA' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-GB, LibbyNeural)', ShortName: 'en-GB-LibbyNeural', Gender: 'Female', Locale: 'en-GB' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-GB, MaisieNeural)', ShortName: 'en-GB-MaisieNeural', Gender: 'Female', Locale: 'en-GB' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-GB, RyanNeural)', ShortName: 'en-GB-RyanNeural', Gender: 'Male', Locale: 'en-GB' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-GB, SoniaNeural)', ShortName: 'en-GB-SoniaNeural', Gender: 'Female', Locale: 'en-GB' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-GB, ThomasNeural)', ShortName: 'en-GB-ThomasNeural', Gender: 'Male', Locale: 'en-GB' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-HK, SamNeural)', ShortName: 'en-HK-SamNeural', Gender: 'Male', Locale: 'en-HK' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-HK, YanNeural)', ShortName: 'en-HK-YanNeural', Gender: 'Female', Locale: 'en-HK' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-IE, ConnorNeural)', ShortName: 'en-IE-ConnorNeural', Gender: 'Male', Locale: 'en-IE' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-IE, EmilyNeural)', ShortName: 'en-IE-EmilyNeural', Gender: 'Female', Locale: 'en-IE' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-IN, NeerjaNeural)', ShortName: 'en-IN-NeerjaNeural', Gender: 'Female', Locale: 'en-IN' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-IN, PrabhatNeural)', ShortName: 'en-IN-PrabhatNeural', Gender: 'Male', Locale: 'en-IN' }, + // ... (Many more English variants: KE, NG, NZ, PH, SG, TZ, US, ZA) ... 
+ { Name: 'Microsoft Server Speech Text to Speech Voice (en-US, AriaNeural)', ShortName: 'en-US-AriaNeural', Gender: 'Female', Locale: 'en-US' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-US, AnaNeural)', ShortName: 'en-US-AnaNeural', Gender: 'Female', Locale: 'en-US' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-US, ChristopherNeural)', ShortName: 'en-US-ChristopherNeural', Gender: 'Male', Locale: 'en-US' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-US, EricNeural)', ShortName: 'en-US-EricNeural', Gender: 'Male', Locale: 'en-US' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-US, GuyNeural)', ShortName: 'en-US-GuyNeural', Gender: 'Male', Locale: 'en-US' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-US, JennyNeural)', ShortName: 'en-US-JennyNeural', Gender: 'Female', Locale: 'en-US' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-US, MichelleNeural)', ShortName: 'en-US-MichelleNeural', Gender: 'Female', Locale: 'en-US' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-US, RogerNeural)', ShortName: 'en-US-RogerNeural', Gender: 'Male', Locale: 'en-US' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (en-US, SteffanNeural)', ShortName: 'en-US-SteffanNeural', Gender: 'Male', Locale: 'en-US' }, + // ... (Spanish variants) ... + { Name: 'Microsoft Server Speech Text to Speech Voice (es-MX, DaliaNeural)', ShortName: 'es-MX-DaliaNeural', Gender: 'Female', Locale: 'es-MX' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (es-MX, JorgeNeural)', ShortName: 'es-MX-JorgeNeural', Gender: 'Male', Locale: 'es-MX' }, + // ... (Estonian, Basque, Persian, Finnish, Filipino, French, Irish, Galician, Gujarati, Hebrew, Hindi, Croatian, Hungarian, Indonesian, Icelandic, Italian, Japanese) ... + { Name: 'Microsoft Server Speech Text to Speech Voice (ja-JP, KeitaNeural)', ShortName: 'ja-JP-KeitaNeural', Gender: 'Male', Locale: 'ja-JP' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (ja-JP, NanamiNeural)', ShortName: 'ja-JP-NanamiNeural', Gender: 'Female', Locale: 'ja-JP' }, + // ... (Javanese, Georgian, Kazakh, Khmer, Kannada, Korean) ... + { Name: 'Microsoft Server Speech Text to Speech Voice (ko-KR, InJoonNeural)', ShortName: 'ko-KR-InJoonNeural', Gender: 'Male', Locale: 'ko-KR' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (ko-KR, SunHiNeural)', ShortName: 'ko-KR-SunHiNeural', Gender: 'Female', Locale: 'ko-KR' }, + // ... (Lao, Lithuanian, Latvian, Macedonian, Malayalam, Mongolian, Marathi, Malay, Maltese, Burmese, Norwegian, Dutch, Polish, Pashto, Portuguese) ... + { Name: 'Microsoft Server Speech Text to Speech Voice (pt-BR, AntonioNeural)', ShortName: 'pt-BR-AntonioNeural', Gender: 'Male', Locale: 'pt-BR' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (pt-BR, FranciscaNeural)', ShortName: 'pt-BR-FranciscaNeural', Gender: 'Female', Locale: 'pt-BR' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (pt-PT, DuarteNeural)', ShortName: 'pt-PT-DuarteNeural', Gender: 'Male', Locale: 'pt-PT' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (pt-PT, RaquelNeural)', ShortName: 'pt-PT-RaquelNeural', Gender: 'Female', Locale: 'pt-PT' }, + // ... (Romanian, Russian, Sinhala, Slovak, Slovenian, Somali, Albanian, Serbian, Sundanese, Swedish, Swahili, Tamil, Telugu, Thai) ... 
+ { Name: 'Microsoft Server Speech Text to Speech Voice (th-TH, NiwatNeural)', ShortName: 'th-TH-NiwatNeural', Gender: 'Male', Locale: 'th-TH' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (th-TH, PremwadeeNeural)', ShortName: 'th-TH-PremwadeeNeural', Gender: 'Female', Locale: 'th-TH' }, + // ... (Turkish, Ukrainian, Urdu, Uzbek, Vietnamese) ... + { Name: 'Microsoft Server Speech Text to Speech Voice (vi-VN, HoaiMyNeural)', ShortName: 'vi-VN-HoaiMyNeural', Gender: 'Female', Locale: 'vi-VN' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (vi-VN, NamMinhNeural)', ShortName: 'vi-VN-NamMinhNeural', Gender: 'Male', Locale: 'vi-VN' }, + // ... (Chinese variants) ... + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-CN, XiaoxiaoNeural)', ShortName: 'zh-CN-XiaoxiaoNeural', Gender: 'Female', Locale: 'zh-CN' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-CN, YunxiNeural)', ShortName: 'zh-CN-YunxiNeural', Gender: 'Male', Locale: 'zh-CN' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-CN, YunjianNeural)', ShortName: 'zh-CN-YunjianNeural', Gender: 'Male', Locale: 'zh-CN' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-CN, YunxiaNeural)', ShortName: 'zh-CN-YunxiaNeural', Gender: 'Male', Locale: 'zh-CN' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-CN, YunyangNeural)', ShortName: 'zh-CN-YunyangNeural', Gender: 'Male', Locale: 'zh-CN' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-CN-liaoning, XiaobeiNeural)', ShortName: 'zh-CN-liaoning-XiaobeiNeural', Gender: 'Female', Locale: 'zh-CN-liaoning' }, + // { Name: 'Microsoft Server Speech Text to Speech Voice (zh-CN-shaanxi, XiaoniNeural)', ShortName: 'zh-CN-shaanxi-XiaoniNeural', Gender: 'Female', Locale: 'zh-CN-shaanxi' }, // Example regional voice + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-HK, HiuGaaiNeural)', ShortName: 'zh-HK-HiuGaaiNeural', Gender: 'Female', Locale: 'zh-HK' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-HK, HiuMaanNeural)', ShortName: 'zh-HK-HiuMaanNeural', Gender: 'Female', Locale: 'zh-HK' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-HK, WanLungNeural)', ShortName: 'zh-HK-WanLungNeural', Gender: 'Male', Locale: 'zh-HK' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-TW, HsiaoChenNeural)', ShortName: 'zh-TW-HsiaoChenNeural', Gender: 'Female', Locale: 'zh-TW' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-TW, HsiaoYuNeural)', ShortName: 'zh-TW-HsiaoYuNeural', Gender: 'Female', Locale: 'zh-TW' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (zh-TW, YunJheNeural)', ShortName: 'zh-TW-YunJheNeural', Gender: 'Male', Locale: 'zh-TW' }, + // ... (Zulu) ... 
+ { Name: 'Microsoft Server Speech Text to Speech Voice (zu-ZA, ThandoNeural)', ShortName: 'zu-ZA-ThandoNeural', Gender: 'Female', Locale: 'zu-ZA' }, + { Name: 'Microsoft Server Speech Text to Speech Voice (zu-ZA, ThembaNeural)', ShortName: 'zu-ZA-ThembaNeural', Gender: 'Male', Locale: 'zu-ZA' }, +]; +// --- END OF HARDCODED VOICE LIST --- + + +/** + * 免费在线TTS服务 + * 使用免费的在线TTS服务,不需要API密钥 + */ +class MsTTSService { + private static instance: MsTTSService; + private tempDir: string; + + private constructor() { + this.tempDir = path.join(app.getPath('temp'), 'cherry-tts'); + if (!fs.existsSync(this.tempDir)) { + fs.mkdirSync(this.tempDir, { recursive: true }); + } + log.info('初始化免费在线TTS服务 (使用硬编码语音列表)'); + } + + public static getInstance(): MsTTSService { + if (!MsTTSService.instance) { + MsTTSService.instance = new MsTTSService(); + } + return MsTTSService.instance; + } + + /** + * 获取可用的语音列表 (返回硬编码列表) + * @returns 语音列表 + */ + public async getVoices(): Promise { + try { + log.info(`返回硬编码的 ${hardcodedVoices.length} 个语音列表`); + // 直接返回硬编码的列表 + // 注意:保持 async 是为了接口兼容性,虽然这里没有实际的异步操作 + return hardcodedVoices; + } catch (error) { + // 这个 try/catch 在这里意义不大了,因为返回静态数据不会出错 + // 但保留结构以防未来改动 + log.error('获取硬编码语音列表时出错 (理论上不应发生):', error); + return []; // 返回空列表以防万一 + } + } + + /** + * 合成语音 + * @param text 要合成的文本 + * @param voice 语音的 ShortName (例如 'zh-CN-XiaoxiaoNeural') + * @param outputFormat 输出格式 (例如 'audio-24khz-48kbitrate-mono-mp3') + * @returns 音频文件路径 + */ + public async synthesize(text: string, voice: string, outputFormat: string): Promise { + try { + // 记录详细的请求信息 + log.info(`微软在线TTS合成语音: 文本="${text.substring(0, 30)}...", 语音=${voice}, 格式=${outputFormat}`); + + // 验证输入参数 + if (!text || text.trim() === '') { + throw new Error('要合成的文本不能为空'); + } + + if (!voice || voice.trim() === '') { + throw new Error('语音名称不能为空'); + } + + // 创建一个新的EdgeTTS实例,并设置参数 + // 添加超时设置,默认为30秒 + const tts = new EdgeTTS({ + voice: voice, + outputFormat: outputFormat, + timeout: 30000, // 30秒超时 + rate: '+0%', // 正常语速 + pitch: '+0Hz', // 正常音调 + volume: '+0%' // 正常音量 + }); + + // 生成临时文件路径 + const timestamp = Date.now(); + const fileExtension = outputFormat.includes('mp3') ? 
'mp3' : outputFormat.split('-').pop() || 'audio'; + const outputPath = path.join(this.tempDir, `tts_${timestamp}.${fileExtension}`); + + log.info(`开始生成语音文件: ${outputPath}`); + + // 使用ttsPromise方法生成文件 + await tts.ttsPromise(text, outputPath); + + // 验证生成的文件是否存在且大小大于0 + if (!fs.existsSync(outputPath)) { + throw new Error(`生成的语音文件不存在: ${outputPath}`); + } + + const stats = fs.statSync(outputPath); + if (stats.size === 0) { + throw new Error(`生成的语音文件大小为0: ${outputPath}`); + } + + log.info(`微软在线TTS合成成功: ${outputPath}, 文件大小: ${stats.size} 字节`); + return outputPath; + } catch (error: any) { + // 记录详细的错误信息 + log.error(`微软在线TTS语音合成失败 (语音=${voice}):`, error); + + // 尝试提供更有用的错误信息 + if (error.message && typeof error.message === 'string') { + if (error.message.includes('Timed out')) { + throw new Error(`语音合成超时,请检查网络连接或尝试其他语音`); + } else if (error.message.includes('ENOTFOUND')) { + throw new Error(`无法连接到微软语音服务,请检查网络连接`); + } else if (error.message.includes('ECONNREFUSED')) { + throw new Error(`连接被拒绝,请检查网络设置或代理配置`); + } + } + + throw error; + } + } + + /** + * (可选) 清理临时文件目录 + */ + public async cleanupTempDir(): Promise { + // (Cleanup method remains the same) + try { + const files = await fs.promises.readdir(this.tempDir); + for (const file of files) { + if (file.startsWith('tts_')) { + await fs.promises.unlink(path.join(this.tempDir, file)); + } + } + log.info('TTS 临时文件已清理'); + } catch (error) { + log.error('清理 TTS 临时文件失败:', error); + } + } +} + +// 导出单例方法 (保持不变) +export const getVoices = async () => { + return await MsTTSService.getInstance().getVoices(); +}; + +export const synthesize = async (text: string, voice: string, outputFormat: string) => { + return await MsTTSService.getInstance().synthesize(text, voice, outputFormat); +}; + +export const cleanupTtsTempFiles = async () => { + await MsTTSService.getInstance().cleanupTempDir(); +}; \ No newline at end of file diff --git a/src/preload/index.ts b/src/preload/index.ts index b2b72f5b71..50b922c917 100644 --- a/src/preload/index.ts +++ b/src/preload/index.ts @@ -64,7 +64,7 @@ const api = { binaryFile: (fileId: string) => ipcRenderer.invoke(IpcChannel.File_BinaryFile, fileId) }, fs: { - read: (path: string) => ipcRenderer.invoke(IpcChannel.Fs_Read, path) + read: (path: string, encoding?: BufferEncoding) => ipcRenderer.invoke(IpcChannel.Fs_Read, path, encoding) }, export: { toWord: (markdown: string, fileName: string) => ipcRenderer.invoke(IpcChannel.Export_Word, markdown, fileName) @@ -119,6 +119,11 @@ const api = { toggle: () => ipcRenderer.invoke(IpcChannel.MiniWindow_Toggle), setPin: (isPinned: boolean) => ipcRenderer.invoke(IpcChannel.MiniWindow_SetPin, isPinned) }, + msTTS: { + getVoices: () => ipcRenderer.invoke(IpcChannel.MsTTS_GetVoices), + synthesize: (text: string, voice: string, outputFormat: string) => + ipcRenderer.invoke(IpcChannel.MsTTS_Synthesize, text, voice, outputFormat) + }, aes: { encrypt: (text: string, secretKey: string, iv: string) => ipcRenderer.invoke(IpcChannel.Aes_Encrypt, text, secretKey, iv), diff --git a/src/renderer/src/components/TTSButton.tsx b/src/renderer/src/components/TTSButton.tsx index 58e4c2039a..aa6592f372 100644 --- a/src/renderer/src/components/TTSButton.tsx +++ b/src/renderer/src/components/TTSButton.tsx @@ -23,6 +23,7 @@ const TTSButton: React.FC = ({ message, className }) => { setIsSpeaking(true) try { + console.log('点击TTS按钮,开始播放消息') await TTSService.speakFromMessage(message) // 监听播放结束 diff --git a/src/renderer/src/i18n/locales/en-us.json b/src/renderer/src/i18n/locales/en-us.json index 
c2f6aeb6c8..aa2686a43a 100644 --- a/src/renderer/src/i18n/locales/en-us.json +++ b/src/renderer/src/i18n/locales/en-us.json @@ -1350,8 +1350,21 @@ "service_type": "Service Type", "service_type.openai": "OpenAI", "service_type.edge": "Browser TTS", + "service_type.siliconflow": "SiliconFlow", "service_type.refresh": "Refresh TTS service type settings", "service_type.refreshed": "TTS service type settings refreshed", + "siliconflow_api_key": "SiliconFlow API Key", + "siliconflow_api_key.placeholder": "Enter SiliconFlow API key", + "siliconflow_api_url": "SiliconFlow API URL", + "siliconflow_api_url.placeholder": "Example: https://api.siliconflow.cn/v1/audio/speech", + "siliconflow_voice": "SiliconFlow Voice", + "siliconflow_voice.placeholder": "Select a voice", + "siliconflow_model": "SiliconFlow Model", + "siliconflow_model.placeholder": "Select a model", + "siliconflow_response_format": "Response Format", + "siliconflow_response_format.placeholder": "Default is mp3", + "siliconflow_speed": "Speech Speed", + "siliconflow_speed.placeholder": "Default is 1.0", "api_key": "API Key", "api_key.placeholder": "Enter OpenAI API key", "api_url": "API URL", @@ -1381,10 +1394,17 @@ "learn_more": "Learn more", "tab_title": "[to be translated]:语音合成", "error": { - "not_enabled": "[to be translated]:语音合成功能未启用", - "no_api_key": "[to be translated]:未设置API密钥", - "no_edge_voice": "[to be translated]:未选择浏览器 TTS音色", - "browser_not_support": "[to be translated]:浏览器不支持语音合成" + "not_enabled": "Text-to-speech feature is not enabled", + "no_api_key": "API key is not set", + "no_voice": "Voice is not selected", + "no_model": "Model is not selected", + "no_edge_voice": "Browser TTS voice is not selected", + "browser_not_support": "Browser does not support speech synthesis", + "synthesis_failed": "Speech synthesis failed", + "play_failed": "Speech playback failed", + "empty_text": "Text is empty", + "general": "An error occurred during speech synthesis", + "unsupported_service_type": "Unsupported service type: {{serviceType}}" } }, "asr": { diff --git a/src/renderer/src/i18n/locales/zh-cn.json b/src/renderer/src/i18n/locales/zh-cn.json index 160dcc55c9..08cb46fd05 100644 --- a/src/renderer/src/i18n/locales/zh-cn.json +++ b/src/renderer/src/i18n/locales/zh-cn.json @@ -1356,8 +1356,22 @@ "service_type": "服务类型", "service_type.openai": "OpenAI", "service_type.edge": "浏览器 TTS", + "service_type.siliconflow": "硅基流动", + "service_type.mstts": "免费在线 TTS", "service_type.refresh": "刷新TTS服务类型设置", "service_type.refreshed": "已刷新TTS服务类型设置", + "siliconflow_api_key": "硅基流动API密钥", + "siliconflow_api_key.placeholder": "请输入硅基流动API密钥", + "siliconflow_api_url": "硅基流动API地址", + "siliconflow_api_url.placeholder": "例如:https://api.siliconflow.cn/v1/audio/speech", + "siliconflow_voice": "硅基流动音色", + "siliconflow_voice.placeholder": "请选择音色", + "siliconflow_model": "硅基流动模型", + "siliconflow_model.placeholder": "请选择模型", + "siliconflow_response_format": "响应格式", + "siliconflow_response_format.placeholder": "默认为mp3", + "siliconflow_speed": "语速", + "siliconflow_speed.placeholder": "默认为1.0", "api_key": "API密钥", "api_key.placeholder": "请输入OpenAI API密钥", "api_url": "API地址", @@ -1366,6 +1380,13 @@ "edge_voice.loading": "加载中...", "edge_voice.refresh": "刷新可用音色列表", "edge_voice.not_found": "未找到匹配的音色", + "edge_voice.available_count": "可用语音: {{count}}个", + "edge_voice.refreshing": "正在刷新语音列表...", + "edge_voice.refreshed": "语音列表已刷新", + "mstts.voice": "免费在线 TTS音色", + "mstts.output_format": "输出格式", + "mstts.info": "免费在线TTS服务不需要API密钥,完全免费使用。", + "error.no_mstts_voice": 
"未设置免费在线 TTS音色", "voice": "音色", "voice.placeholder": "请选择音色", "voice_input_placeholder": "输入音色", @@ -1388,8 +1409,15 @@ "error": { "not_enabled": "语音合成功能未启用", "no_api_key": "未设置API密钥", + "no_voice": "未选择音色", + "no_model": "未选择模型", "no_edge_voice": "未选择浏览器 TTS音色", - "browser_not_support": "浏览器不支持语音合成" + "browser_not_support": "浏览器不支持语音合成", + "synthesis_failed": "语音合成失败", + "play_failed": "语音播放失败", + "empty_text": "文本为空", + "general": "语音合成出现错误", + "unsupported_service_type": "不支持的服务类型: {{serviceType}}" } }, "asr": { diff --git a/src/renderer/src/pages/home/Messages/MessageMenubar.tsx b/src/renderer/src/pages/home/Messages/MessageMenubar.tsx index e5189732da..006a1d495a 100644 --- a/src/renderer/src/pages/home/Messages/MessageMenubar.tsx +++ b/src/renderer/src/pages/home/Messages/MessageMenubar.tsx @@ -407,7 +407,10 @@ const MessageMenubar: FC = (props) => { )} {isAssistantMessage && ttsEnabled && ( - TTSService.speakFromMessage(message)}> + { + console.log('点击MessageMenubar中的TTS按钮,开始播放消息') + TTSService.speakFromMessage(message) + }}> diff --git a/src/renderer/src/pages/home/Messages/TTSStopButton.tsx b/src/renderer/src/pages/home/Messages/TTSStopButton.tsx index 82b6f921eb..f5065b2821 100644 --- a/src/renderer/src/pages/home/Messages/TTSStopButton.tsx +++ b/src/renderer/src/pages/home/Messages/TTSStopButton.tsx @@ -57,7 +57,7 @@ const TTSStopButton: React.FC = () => { const StopButtonContainer = styled.div` position: fixed; - bottom: 100px; + bottom: 150px; /* 从100px改为150px,向上移动50px */ right: 20px; z-index: 1000; ` diff --git a/src/renderer/src/pages/settings/TTSSettings/ASRSettings.tsx b/src/renderer/src/pages/settings/TTSSettings/ASRSettings.tsx index dc44dbb3e8..eb3e7f7e51 100644 --- a/src/renderer/src/pages/settings/TTSSettings/ASRSettings.tsx +++ b/src/renderer/src/pages/settings/TTSSettings/ASRSettings.tsx @@ -34,7 +34,6 @@ const ASRSettings: FC = () => { // 服务类型选项 const serviceTypeOptions = [ { label: 'OpenAI', value: 'openai' }, - { label: t('settings.asr.service_type.browser'), value: 'browser' }, { label: t('settings.asr.service_type.local'), value: 'local' } ] diff --git a/src/renderer/src/pages/settings/TTSSettings/TTSSettings.tsx b/src/renderer/src/pages/settings/TTSSettings/TTSSettings.tsx index 3e105bcf4f..4fea657369 100644 --- a/src/renderer/src/pages/settings/TTSSettings/TTSSettings.tsx +++ b/src/renderer/src/pages/settings/TTSSettings/TTSSettings.tsx @@ -15,10 +15,18 @@ import { setTtsFilterOptions, setTtsModel, setTtsServiceType, - setTtsVoice + setTtsVoice, + setTtsSiliconflowApiKey, + setTtsSiliconflowApiUrl, + setTtsSiliconflowVoice, + setTtsSiliconflowModel, + setTtsSiliconflowResponseFormat, + setTtsSiliconflowSpeed, + setTtsMsVoice, + setTtsMsOutputFormat } from '@renderer/store/settings' -import { Button, Form, Input, message, Select, Space, Switch, Tabs, Tag } from 'antd' -import { FC, useEffect, useState } from 'react' +import { Button, Form, Input, InputNumber, message, Select, Space, Switch, Tabs, Tag } from 'antd' +import { FC, useEffect, useState, useCallback } from 'react' import { useTranslation } from 'react-i18next' import { useSelector } from 'react-redux' import styled from 'styled-components' @@ -34,6 +42,36 @@ import { } from '..' 
import ASRSettings from './ASRSettings' +// 预定义的浏览器 TTS音色列表 +const PREDEFINED_VOICES = [ + { label: '小晓 (女声, 中文)', value: 'zh-CN-XiaoxiaoNeural' }, + { label: '云扬 (男声, 中文)', value: 'zh-CN-YunyangNeural' }, + { label: '晓晓 (女声, 中文)', value: 'zh-CN-XiaoxiaoNeural' }, + { label: '晓涵 (女声, 中文)', value: 'zh-CN-XiaohanNeural' }, + { label: '晓诗 (女声, 中文)', value: 'zh-CN-XiaoshuangNeural' }, + { label: '晓瑞 (女声, 中文)', value: 'zh-CN-XiaoruiNeural' }, + { label: '晓墨 (女声, 中文)', value: 'zh-CN-XiaomoNeural' }, + { label: '晓然 (男声, 中文)', value: 'zh-CN-XiaoranNeural' }, + { label: '晓坤 (男声, 中文)', value: 'zh-CN-XiaokunNeural' }, + { label: 'Aria (Female, English)', value: 'en-US-AriaNeural' }, + { label: 'Guy (Male, English)', value: 'en-US-GuyNeural' }, + { label: 'Jenny (Female, English)', value: 'en-US-JennyNeural' }, + { label: 'Ana (Female, Spanish)', value: 'es-ES-ElviraNeural' }, + { label: 'Ichiro (Male, Japanese)', value: 'ja-JP-KeitaNeural' }, + { label: 'Nanami (Female, Japanese)', value: 'ja-JP-NanamiNeural' }, + // 添加更多常用的语音 + { label: 'Microsoft David (en-US)', value: 'Microsoft David Desktop - English (United States)' }, + { label: 'Microsoft Zira (en-US)', value: 'Microsoft Zira Desktop - English (United States)' }, + { label: 'Microsoft Mark (en-US)', value: 'Microsoft Mark Online (Natural) - English (United States)' }, + { label: 'Microsoft Aria (en-US)', value: 'Microsoft Aria Online (Natural) - English (United States)' }, + { label: 'Google US English', value: 'Google US English' }, + { label: 'Google UK English Female', value: 'Google UK English Female' }, + { label: 'Google UK English Male', value: 'Google UK English Male' }, + { label: 'Google 日本語', value: 'Google 日本語' }, + { label: 'Google 普通话(中国大陆)', value: 'Google 普通话(中国大陆)' }, + { label: 'Google 粤語(香港)', value: 'Google 粤語(香港)' } +] + const CustomVoiceInput = styled.div` display: flex; flex-direction: column; @@ -81,6 +119,12 @@ const LoadingText = styled.div` color: #999; ` +const InfoText = styled.div` + margin-top: 8px; + font-size: 12px; + color: #888; +` + const VoiceSelectContainer = styled.div` display: flex; gap: 8px; @@ -93,25 +137,34 @@ const TTSSettings: FC = () => { const dispatch = useAppDispatch() // 从Redux获取TTS设置 - const ttsEnabled = useSelector((state: any) => state.settings.ttsEnabled) - const ttsServiceType = useSelector((state: any) => state.settings.ttsServiceType || 'openai') - const ttsApiKey = useSelector((state: any) => state.settings.ttsApiKey) - const ttsApiUrl = useSelector((state: any) => state.settings.ttsApiUrl) - const ttsVoice = useSelector((state: any) => state.settings.ttsVoice) - const ttsModel = useSelector((state: any) => state.settings.ttsModel) - const ttsEdgeVoice = useSelector((state: any) => state.settings.ttsEdgeVoice || 'zh-CN-XiaoxiaoNeural') - const ttsCustomVoices = useSelector((state: any) => state.settings.ttsCustomVoices || []) - const ttsCustomModels = useSelector((state: any) => state.settings.ttsCustomModels || []) - const ttsFilterOptions = useSelector( - (state: any) => - state.settings.ttsFilterOptions || { - filterThinkingProcess: true, - filterMarkdown: true, - filterCodeBlocks: true, - filterHtmlTags: true, - maxTextLength: 4000 - } - ) + const settings = useSelector((state: any) => state.settings) + const ttsEnabled = settings.ttsEnabled + const ttsServiceType = settings.ttsServiceType || 'openai' + const ttsApiKey = settings.ttsApiKey + const ttsApiUrl = settings.ttsApiUrl + const ttsVoice = settings.ttsVoice + const ttsModel = settings.ttsModel + const ttsEdgeVoice = 
settings.ttsEdgeVoice || 'zh-CN-XiaoxiaoNeural' + const ttsCustomVoices = settings.ttsCustomVoices || [] + const ttsCustomModels = settings.ttsCustomModels || [] + // 免费在线TTS设置 + const ttsMsVoice = settings.ttsMsVoice || 'zh-CN-XiaoxiaoNeural' + const ttsMsOutputFormat = settings.ttsMsOutputFormat || 'audio-24khz-48kbitrate-mono-mp3' + const ttsFilterOptions = settings.ttsFilterOptions || { + filterThinkingProcess: true, + filterMarkdown: true, + filterCodeBlocks: true, + filterHtmlTags: true, + maxTextLength: 4000 + } + + // 硅基流动TTS设置 + const ttsSiliconflowApiKey = settings.ttsSiliconflowApiKey + const ttsSiliconflowApiUrl = settings.ttsSiliconflowApiUrl + const ttsSiliconflowVoice = settings.ttsSiliconflowVoice + const ttsSiliconflowModel = settings.ttsSiliconflowModel + const ttsSiliconflowResponseFormat = settings.ttsSiliconflowResponseFormat + const ttsSiliconflowSpeed = settings.ttsSiliconflowSpeed // 新增自定义音色和模型的状态 const [newVoice, setNewVoice] = useState('') @@ -120,38 +173,51 @@ const TTSSettings: FC = () => { // 浏览器可用的语音列表 const [availableVoices, setAvailableVoices] = useState<{ label: string; value: string }[]>([]) - // 预定义的浏览器 TTS音色列表 - const predefinedVoices = [ - { label: '小晓 (女声, 中文)', value: 'zh-CN-XiaoxiaoNeural' }, - { label: '云扬 (男声, 中文)', value: 'zh-CN-YunyangNeural' }, - { label: '晓晓 (女声, 中文)', value: 'zh-CN-XiaoxiaoNeural' }, - { label: '晓涵 (女声, 中文)', value: 'zh-CN-XiaohanNeural' }, - { label: '晓诗 (女声, 中文)', value: 'zh-CN-XiaoshuangNeural' }, - { label: '晓瑞 (女声, 中文)', value: 'zh-CN-XiaoruiNeural' }, - { label: '晓墨 (女声, 中文)', value: 'zh-CN-XiaomoNeural' }, - { label: '晓然 (男声, 中文)', value: 'zh-CN-XiaoranNeural' }, - { label: '晓坤 (男声, 中文)', value: 'zh-CN-XiaokunNeural' }, - { label: 'Aria (Female, English)', value: 'en-US-AriaNeural' }, - { label: 'Guy (Male, English)', value: 'en-US-GuyNeural' }, - { label: 'Jenny (Female, English)', value: 'en-US-JennyNeural' }, - { label: 'Ana (Female, Spanish)', value: 'es-ES-ElviraNeural' }, - { label: 'Ichiro (Male, Japanese)', value: 'ja-JP-KeitaNeural' }, - { label: 'Nanami (Female, Japanese)', value: 'ja-JP-NanamiNeural' }, - // 添加更多常用的语音 - { label: 'Microsoft David (en-US)', value: 'Microsoft David Desktop - English (United States)' }, - { label: 'Microsoft Zira (en-US)', value: 'Microsoft Zira Desktop - English (United States)' }, - { label: 'Microsoft Mark (en-US)', value: 'Microsoft Mark Online (Natural) - English (United States)' }, - { label: 'Microsoft Aria (en-US)', value: 'Microsoft Aria Online (Natural) - English (United States)' }, - { label: 'Google US English', value: 'Google US English' }, - { label: 'Google UK English Female', value: 'Google UK English Female' }, - { label: 'Google UK English Male', value: 'Google UK English Male' }, - { label: 'Google 日本語', value: 'Google 日本語' }, - { label: 'Google 普通话(中国大陆)', value: 'Google 普通话(中国大陆)' }, - { label: 'Google 粤語(香港)', value: 'Google 粤語(香港)' } - ] + // 免费在线TTS可用的语音列表 + const [msTtsVoices, setMsTtsVoices] = useState<{ label: string; value: string }[]>([]) + + + + // 获取免费在线TTS可用的语音列表 + const getMsTtsVoices = useCallback(async () => { + try { + // 调用API获取免费在线TTS语音列表 + const response = await window.api.msTTS.getVoices(); + console.log('获取到的免费在线TTS语音列表:', response); + + // 转换为选项格式 + const voices = response.map((voice: any) => ({ + label: `${voice.ShortName} (${voice.Gender === 'Female' ? 
'女声' : '男声'})`, + value: voice.ShortName + })); + + // 按语言和性别排序 + voices.sort((a: any, b: any) => { + const localeA = a.value.split('-')[0] + a.value.split('-')[1]; + const localeB = b.value.split('-')[0] + b.value.split('-')[1]; + if (localeA !== localeB) return localeA.localeCompare(localeB); + return a.label.localeCompare(b.label); + }); + + setMsTtsVoices(voices); + } catch (error) { + console.error('获取免费在线TTS语音列表失败:', error); + // 如果获取失败,设置一些默认的中文语音 + setMsTtsVoices([ + { label: 'zh-CN-XiaoxiaoNeural (女声)', value: 'zh-CN-XiaoxiaoNeural' }, + { label: 'zh-CN-YunxiNeural (男声)', value: 'zh-CN-YunxiNeural' }, + { label: 'zh-CN-YunyangNeural (男声)', value: 'zh-CN-YunyangNeural' }, + { label: 'zh-CN-XiaohanNeural (女声)', value: 'zh-CN-XiaohanNeural' }, + { label: 'zh-CN-XiaomoNeural (女声)', value: 'zh-CN-XiaomoNeural' }, + { label: 'zh-CN-XiaoxuanNeural (女声)', value: 'zh-CN-XiaoxuanNeural' }, + { label: 'zh-CN-XiaoruiNeural (女声)', value: 'zh-CN-XiaoruiNeural' }, + { label: 'zh-CN-YunfengNeural (男声)', value: 'zh-CN-YunfengNeural' }, + ]); + } + }, []); // 获取浏览器可用的语音列表 - const getVoices = () => { + const getVoices = useCallback(() => { if (typeof window !== 'undefined' && 'speechSynthesis' in window) { // 先触发一下语音合成引擎,确保它已经初始化 window.speechSynthesis.cancel() @@ -170,18 +236,22 @@ const TTSSettings: FC = () => { })) // 添加语言信息到预定义语音 - const enhancedPredefinedVoices = predefinedVoices.map((voice) => ({ + const enhancedPredefinedVoices = PREDEFINED_VOICES.map((voice) => ({ ...voice, lang: voice.value.split('-').slice(0, 2).join('-'), isNative: false // 标记为非浏览器原生语音 })) // 合并所有语音列表 + // 只使用浏览器原生语音,因为预定义语音实际不可用 let allVoices = [...browserVoices] - // 如果浏览器语音少于5个,添加预定义语音 - if (browserVoices.length < 5) { - allVoices = [...browserVoices, ...enhancedPredefinedVoices] + // 如果浏览器没有可用语音,才使用预定义语音 + if (browserVoices.length === 0) { + allVoices = [...enhancedPredefinedVoices] + console.log('浏览器没有可用语音,使用预定义语音') + } else { + console.log('使用浏览器原生语音,共' + browserVoices.length + '个') } // 去除重复项,优先保留浏览器原生语音 @@ -210,12 +280,12 @@ const TTSSettings: FC = () => { } else { // 如果浏览器不支持Web Speech API,使用预定义的语音列表 console.log('浏览器不支持Web Speech API,使用预定义的语音列表') - setAvailableVoices(predefinedVoices) + setAvailableVoices(PREDEFINED_VOICES) } - } + }, []) // 刷新语音列表 - const refreshVoices = () => { + const refreshVoices = useCallback(() => { console.log('手动刷新语音列表') message.loading({ content: t('settings.tts.edge_voice.refreshing', { defaultValue: '正在刷新语音列表...' 
}), @@ -242,13 +312,19 @@ const TTSSettings: FC = () => { }, 500) } else { // 如果浏览器不支持Web Speech API,使用预定义的语音列表 - setAvailableVoices(predefinedVoices) + setAvailableVoices(PREDEFINED_VOICES) message.success({ content: t('settings.tts.edge_voice.refreshed', { defaultValue: '语音列表已刷新' }), key: 'refresh-voices' }) } - } + }, [getVoices, t]) + + // 获取免费在线TTS语音列表 + useEffect(() => { + // 获取免费在线TTS语音列表 + getMsTtsVoices(); + }, [getMsTtsVoices]); useEffect(() => { // 初始化语音合成引擎 @@ -283,10 +359,10 @@ const TTSSettings: FC = () => { } } else { // 如果浏览器不支持Web Speech API,使用预定义的语音列表 - setAvailableVoices(predefinedVoices) + setAvailableVoices(PREDEFINED_VOICES) return () => {} } - }, [getVoices, predefinedVoices]) + }, [getVoices]) // 测试TTS功能 const testTTS = async () => { @@ -295,6 +371,11 @@ const TTSSettings: FC = () => { return } + // 强制刷新状态,确保使用最新的设置 + // 先获取当前的服务类型 + const currentType = store.getState().settings.ttsServiceType || 'openai' + console.log('测试前当前的TTS服务类型:', currentType) + // 获取最新的服务类型设置 const latestSettings = store.getState().settings const currentServiceType = latestSettings.ttsServiceType || 'openai' @@ -305,7 +386,12 @@ const TTSSettings: FC = () => { ttsApiKey: latestSettings.ttsApiKey ? '已设置' : '未设置', ttsVoice: latestSettings.ttsVoice, ttsModel: latestSettings.ttsModel, - ttsEdgeVoice: latestSettings.ttsEdgeVoice + ttsEdgeVoice: latestSettings.ttsEdgeVoice, + ttsSiliconflowApiKey: latestSettings.ttsSiliconflowApiKey ? '已设置' : '未设置', + ttsSiliconflowVoice: latestSettings.ttsSiliconflowVoice, + ttsSiliconflowModel: latestSettings.ttsSiliconflowModel, + ttsSiliconflowResponseFormat: latestSettings.ttsSiliconflowResponseFormat, + ttsSiliconflowSpeed: latestSettings.ttsSiliconflowSpeed }) // 根据服务类型检查必要的参数 @@ -329,6 +415,25 @@ const TTSSettings: FC = () => { window.message.error({ content: t('settings.tts.error.no_edge_voice'), key: 'tts-test' }) return } + } else if (currentServiceType === 'siliconflow') { + const ttsSiliconflowApiKey = latestSettings.ttsSiliconflowApiKey + const ttsSiliconflowVoice = latestSettings.ttsSiliconflowVoice + const ttsSiliconflowModel = latestSettings.ttsSiliconflowModel + + if (!ttsSiliconflowApiKey) { + window.message.error({ content: t('settings.tts.error.no_api_key'), key: 'tts-test' }) + return + } + + if (!ttsSiliconflowVoice) { + window.message.error({ content: t('settings.tts.error.no_voice'), key: 'tts-test' }) + return + } + + if (!ttsSiliconflowModel) { + window.message.error({ content: t('settings.tts.error.no_model'), key: 'tts-test' }) + return + } } await TTSService.speak('这是一段测试语音,用于测试TTS功能是否正常工作。') @@ -430,25 +535,14 @@ const TTSSettings: FC = () => { value={ttsServiceType} onChange={(value: string) => { console.log('切换TTS服务类型为:', value) - // 先将新的服务类型写入Redux状态 + // 直接将新的服务类型写入Redux状态 dispatch(setTtsServiceType(value)) - - // 等待一下,确保状态已更新 - setTimeout(() => { - // 验证状态是否正确更新 - const currentType = store.getState().settings.ttsServiceType - console.log('更新后的TTS服务类型:', currentType) - - // 如果状态没有正确更新,再次尝试 - if (currentType !== value) { - console.log('状态未正确更新,再次尝试') - dispatch(setTtsServiceType(value)) - } - }, 100) }} options={[ { label: t('settings.tts.service_type.openai'), value: 'openai' }, - { label: t('settings.tts.service_type.edge'), value: 'edge' } + { label: t('settings.tts.service_type.edge'), value: 'edge' }, + { label: t('settings.tts.service_type.siliconflow'), value: 'siliconflow' }, + { label: t('settings.tts.service_type.mstts'), value: 'mstts' } ]} disabled={!ttsEnabled} style={{ flex: 1 }} @@ -495,6 +589,92 @@ const 
TTSSettings: FC = () => { )} + {/* 硅基流动 TTS设置 */} + {ttsServiceType === 'siliconflow' && ( + <> + + dispatch(setTtsSiliconflowApiKey(e.target.value))} + placeholder={t('settings.tts.siliconflow_api_key.placeholder')} + disabled={!ttsEnabled} + /> + + + dispatch(setTtsSiliconflowApiUrl(e.target.value))} + placeholder={t('settings.tts.siliconflow_api_url.placeholder')} + disabled={!ttsEnabled} + /> + + + dispatch(setTtsSiliconflowModel(value))} + options={[ + { label: 'FunAudioLLM/CosyVoice2-0.5B', value: 'FunAudioLLM/CosyVoice2-0.5B' } + ]} + disabled={!ttsEnabled} + style={{ width: '100%' }} + placeholder={t('settings.tts.siliconflow_model.placeholder')} + showSearch + optionFilterProp="label" + allowClear + /> + + + dispatch(setTtsMsVoice(value))} + disabled={!ttsEnabled} + style={{ width: '100%' }} + options={msTtsVoices.length > 0 ? msTtsVoices : [ + { label: 'zh-CN-XiaoxiaoNeural (女声)', value: 'zh-CN-XiaoxiaoNeural' }, + { label: 'zh-CN-YunxiNeural (男声)', value: 'zh-CN-YunxiNeural' }, + { label: 'zh-CN-YunyangNeural (男声)', value: 'zh-CN-YunyangNeural' }, + { label: 'zh-CN-XiaohanNeural (女声)', value: 'zh-CN-XiaohanNeural' }, + { label: 'zh-CN-XiaomoNeural (女声)', value: 'zh-CN-XiaomoNeural' }, + { label: 'zh-CN-XiaoxuanNeural (女声)', value: 'zh-CN-XiaoxuanNeural' }, + { label: 'zh-CN-XiaoruiNeural (女声)', value: 'zh-CN-XiaoruiNeural' }, + { label: 'zh-CN-YunfengNeural (男声)', value: 'zh-CN-YunfengNeural' }, + ]} + showSearch + optionFilterProp="label" + placeholder={t('settings.tts.voice.placeholder', { defaultValue: '请选择音色' })} + notFoundContent={t('settings.tts.voice.not_found', { defaultValue: '未找到音色' })} + /> +
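
---

Reviewer note — a minimal, hypothetical renderer-side sketch (not part of the patch) showing how the pieces added above are meant to fit together: the `window.api.msTTS` bridge exposed in `src/preload/index.ts`, the temp-file path returned by `MsTTSService.synthesize` in the main process, and the binary read path enabled by the `FileService.readFile` encoding change. The helper name `playWithMsTts` and the chosen voice/output-format values are illustrative assumptions; only the bridge calls themselves (`msTTS.synthesize`, `fs.read`) mirror the patch.

```ts
// Hypothetical sketch, assuming the preload bridge added in this patch.
const api = (window as any).api // exposed by src/preload/index.ts

async function playWithMsTts(text: string): Promise<HTMLAudioElement> {
  // Main process synthesizes via node-edge-tts and returns a temp-file path
  // (see MsTTSService.synthesize above).
  const filePath: string = await api.msTTS.synthesize(
    text,
    'zh-CN-XiaoxiaoNeural',            // a ShortName from api.msTTS.getVoices()
    'audio-24khz-48kbitrate-mono-mp3'  // outputFormat passed through to EdgeTTS
  )

  // Omitting the encoding argument makes FileService.readFile take the
  // Buffer branch added in this patch, so raw bytes come back instead of
  // a UTF-8 string.
  const bytes: Uint8Array = await api.fs.read(filePath)

  // Wrap the bytes in a Blob and hand them to an audio element for playback.
  const blob = new Blob([bytes], { type: 'audio/mpeg' })
  const audio = new Audio(URL.createObjectURL(blob))
  await audio.play()
  return audio
}
```

Presumably a flow along these lines sits behind `src/renderer/src/services/tts/MsTTSService.ts`, whose hunk is not included in this excerpt.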