From ad277bc1aa63d12faef0faf15facfb0be5aa4ef2 Mon Sep 17 00:00:00 2001
From: Megghy <megghy@qq.com>
Date: Mon, 13 Oct 2025 18:25:20 +0800
Subject: [PATCH] feat: Enhance TTS functionality with Azure support and UI
 improvements

- Updated component declarations to include new Naive UI components.
- Refactored environment variable access to use import.meta.env.
- Added TTS_API_URL constant for Azure TTS integration.
- Expanded SpeechSettings interface to support Azure voice and language options.
- Implemented Azure TTS voice selection and loading mechanism in ReadDanmaku.vue.
- Added loading timeout for audio playback and improved error handling.
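- Enhanced UI to allow users to select Azure voices and configure speech settings.
- Reduced ClientReadDanmaku.vue to a small component that imports ReadDanmaku.vue instead of keeping its own implementation.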
---
 src/client/ClientReadDanmaku.vue    | 1244 +--------------------------
 src/components.d.ts                 |    9 +-
 src/data/constants.ts               |    5 +-
 src/store/useSpeechService.ts       |   86 +-
 src/views/open_live/ReadDanmaku.vue |  240 +++++-
 5 files changed, 318 insertions(+), 1266 deletions(-)
diff --git a/src/client/ClientReadDanmaku.vue b/src/client/ClientReadDanmaku.vue
index c90f65d..ba52a2a 100644
--- a/src/client/ClientReadDanmaku.vue
+++ b/src/client/ClientReadDanmaku.vue
@@ -1,1246 +1,8 @@
 <script setup lang="ts">
-import type { EventModel } from '@/api/api-models'
-import {
-  CheckmarkCircle20Filled,
-  Dismiss20Filled,
-  Info24Filled,
-  Mic24Filled,
-  MicOff24Filled,
-  Play20Filled,
-  Settings20Filled,
-  Speaker124Filled,
-} from '@vicons/fluent'
-import {
-  NAlert,
-  NButton,
-  NCard,
-  NCheckbox,
-  NCollapse,
-  NCollapseItem,
-  NDivider,
-  NEmpty,
-  NGrid,
-  NGi,
-  NIcon,
-  NInput,
-  NInputGroup,
-  NInputGroupLabel,
-  NInputNumber,
-  NList,
-  NListItem,
-  NPopconfirm,
-  NRadioButton,
-  NRadioGroup,
-  NScrollbar,
-  NSelect,
-  NSlider,
-  NSpace,
-  NSpin,
-  NStatistic,
-  NTag,
-  NText,
-  NTooltip,
-  useMessage,
-} from 'naive-ui'
-import { computed, onMounted, onUnmounted, ref, watch } from 'vue'
-import { useAccount } from '@/api/account'
-import { EventDataTypes } from '@/api/api-models'
-import { copyToClipboard } from '@/Utils'
-import { useDanmakuClient } from '@/store/useDanmakuClient'
-import { templateConstants, useSpeechService } from '@/store/useSpeechService'
+import ReadDanmaku from '@/views/open_live/ReadDanmaku.vue';
 
-const message = useMessage()
-const accountInfo = useAccount()
-const client = await useDanmakuClient().initOpenlive()
-const speechService = useSpeechService()
-
-const {
-  settings,
-  speechState,
-  speakQueue,
-  readedDanmaku,
-  speechSynthesisInfo,
-  apiAudio,
-} = speechService
-
-// 音频输出设备相关
-const availableDevices = ref<MediaDeviceInfo[]>([])
-const selectedDeviceId = ref<string>('default')
-const isLoadingDevices = ref(false)
-
-// 计算属性
-const isVtsuruVoiceAPI = computed(() => {
-  return (
-    settings.value.voiceType == 'api'
-    && settings.value.voiceAPI?.toLowerCase().trim().startsWith('voice.vtsuru.live')
-  )
-})
-
-const voiceOptions = computed(() => {
-  return speechService.getAvailableVoices()
-})
-
-const queueStats = computed(() => {
-  const total = speakQueue.value.length
-  const gifts = speakQueue.value.filter(item => item.data.type === EventDataTypes.Gift).length
-  const messages = speakQueue.value.filter(item => item.data.type === EventDataTypes.Message).length
-  const waiting = speakQueue.value.filter(
-    item =>
-      item.data.type === EventDataTypes.Gift
-      && settings.value.combineGiftDelay
-      && item.updateAt > Date.now() - settings.value.combineGiftDelay * 1000,
-  ).length
-
-  return { total, gifts, messages, waiting }
-})
-
-const deviceOptions = computed(() => {
-  return [
-    { label: '默认设备', value: 'default' },
-    ...availableDevices.value.map(device => ({
-      label: device.label || `设备 ${device.deviceId.substring(0, 8)}`,
-      value: device.deviceId,
-    })),
-  ]
-})
-
-// 获取音频输出设备列表
-async function loadAudioDevices() {
-  try {
-    isLoadingDevices.value = true
-
-    // 请求权限
-    await navigator.mediaDevices.getUserMedia({ audio: true })
-
-    // 获取设备列表
-    const devices = await navigator.mediaDevices.enumerateDevices()
-    availableDevices.value = devices.filter(device => device.kind === 'audiooutput')
-
-    console.log('[TTS] 已加载音频输出设备:', availableDevices.value.length)
-  } catch (error) {
-    console.error('[TTS] 获取音频设备失败:', error)
-    message.warning('无法获取音频设备列表，将使用默认设备')
-  } finally {
-    isLoadingDevices.value = false
-  }
-}
-
-// 切换音频输出设备
-async function changeAudioDevice(deviceId: string) {
-  if (!apiAudio.value) return
-
-  try {
-    // @ts-ignore - setSinkId 可能在某些浏览器中不可用
-    if (typeof apiAudio.value.setSinkId === 'function') {
-      // @ts-ignore
-      await apiAudio.value.setSinkId(deviceId)
-      message.success(`已切换到: ${deviceOptions.value.find(d => d.value === deviceId)?.label}`)
-      console.log('[TTS] 音频输出设备已切换:', deviceId)
-    } else {
-      message.warning('当前浏览器不支持切换音频输出设备')
-    }
-  } catch (error) {
-    console.error('[TTS] 切换音频设备失败:', error)
-    message.error('切换音频设备失败')
-  }
-}
-
-// 监听设备选择变化
-watch(selectedDeviceId, (newDeviceId) => {
-  changeAudioDevice(newDeviceId)
-})
-
-// 方法
-function onGetEvent(data: EventModel) {
-  speechService.addToQueue(data)
-}
-
-function startSpeech() {
-  speechService.startSpeech()
-}
-
-function stopSpeech() {
-  speechService.stopSpeech()
-}
-
-function cancelSpeech() {
-  speechService.cancelSpeech()
-}
-
-function forceSpeak(data: EventModel) {
-  speechService.forceSpeak(data)
-}
-
-function removeFromQueue(item: any) {
-  speechService.removeFromQueue(item)
-}
-
-function clearQueue() {
-  speakQueue.value = []
-  message.success('队列已清空')
-}
-
-async function uploadConfig() {
-  await speechService.uploadConfig()
-}
-
-async function downloadConfig() {
-  await speechService.downloadConfig()
-}
-
-/**
- * 创建测试事件数据
- */
-function createTestEventData(type: EventDataTypes, overrides: Partial<EventModel>): EventModel {
-  const baseData = {
-    type,
-    uname: accountInfo.value?.name ?? '测试用户',
-    uid: accountInfo.value?.biliId ?? 0,
-    msg: '',
-    price: 0,
-    num: 0,
-    time: Date.now(),
-    guard_level: 0,
-    fans_medal_level: 1,
-    fans_medal_name: '',
-    fans_medal_wearing_status: false,
-    emoji: undefined,
-    uface: '',
-    open_id: '00000000-0000-0000-0000-000000000000',
-    ouid: '00000000-0000-0000-0000-000000000000',
-  }
-  return { ...baseData, ...overrides }
-}
-
-/**
- * 测试不同类型的事件
- */
-function test(type: EventDataTypes) {
-  let testData: EventModel
-  switch (type) {
-    case EventDataTypes.Message:
-      testData = createTestEventData(EventDataTypes.Message, { msg: '测试弹幕' })
-      break
-    case EventDataTypes.Enter:
-      testData = createTestEventData(EventDataTypes.Enter, {})
-      break
-    case EventDataTypes.SC:
-      testData = createTestEventData(EventDataTypes.SC, { msg: '测试留言', price: 30, num: 1 })
-      break
-    case EventDataTypes.Guard:
-      testData = createTestEventData(EventDataTypes.Guard, { msg: '舰长', num: 1, guard_level: 3 })
-      break
-    case EventDataTypes.Gift:
-      testData = createTestEventData(EventDataTypes.Gift, { msg: '测试礼物', price: 5, num: 5 })
-      break
-    default:
-      return
-  }
-
-  if (speechState.canSpeech) {
-    onGetEvent(testData)
-  } else {
-    forceSpeak(testData)
-  }
-}
-
-function testAPI() {
-  const url = speechService.buildApiUrl('这是一条测试弹幕')
-  if (url) {
-    speechState.isSpeaking = true
-    speechState.isApiAudioLoading = true
-    speechState.apiAudioSrc = url
-  }
-}
-
-function getEventTypeTag(type: EventDataTypes) {
-  switch (type) {
-    case EventDataTypes.Message:
-      return { text: '弹幕', type: 'info' as const }
-    case EventDataTypes.Gift:
-      return { text: '礼物', type: 'success' as const }
-    case EventDataTypes.Guard:
-      return { text: '舰长', type: 'warning' as const }
-    case EventDataTypes.SC:
-      return { text: 'SC', type: 'error' as const }
-    case EventDataTypes.Enter:
-      return { text: '进入', type: 'default' as const }
-    default:
-      return { text: '未知', type: 'default' as const }
-  }
-}
-
-function onAPIError(_e: Event) {
-  if (!speechState.apiAudioSrc) return
-  message.error('音频加载失败, 请检查API是否可用以及网络连接')
-  cancelSpeech()
-}
-
-// 生命周期
-onMounted(async () => {
-  await speechService.initialize()
-  await loadAudioDevices()
-
-  client.onEvent('danmaku', onGetEvent)
-  client.onEvent('sc', onGetEvent)
-  client.onEvent('guard', onGetEvent)
-  client.onEvent('gift', onGetEvent)
-  client.onEvent('enter', onGetEvent)
-
-  // 监听设备变化
-  navigator.mediaDevices.addEventListener('devicechange', loadAudioDevices)
-})
-
-onUnmounted(() => {
-  client.offEvent('danmaku', onGetEvent)
-  client.offEvent('sc', onGetEvent)
-  client.offEvent('guard', onGetEvent)
-  client.offEvent('gift', onGetEvent)
-  client.offEvent('enter', onGetEvent)
-
-  speechService.stopSpeech()
-
-  // 移除设备变化监听
-  navigator.mediaDevices.removeEventListener('devicechange', loadAudioDevices)
-})
 </script>
 
 <template>
-  <div class="read-danmaku-container">
-    <NAlert
-      v-if="!speechSynthesisInfo || !speechSynthesisInfo.speechSynthesis"
-      type="error"
-      title="不支持语音功能"
-    >
-      你的浏览器不支持语音功能，请使用现代浏览器如 Chrome、Edge 等
-    </NAlert>
-
-    <template v-else>
-      <!-- 顶部提示区域 -->
-      <NSpace
-        vertical
-        :size="12"
-      >
-        <NAlert
-          v-if="settings.voiceType == 'local'"
-          type="info"
-          closable
-        >
-          <template #icon>
-            <NIcon :component="Info24Filled" />
-          </template>
-          建议在 Edge 浏览器使用
-          <NTooltip>
-            <template #trigger>
-              <NText
-                strong
-                type="primary"
-                style="cursor: help"
-              >
-                Microsoft 某某 Online (Natural)
-              </NText>
-            </template>
-            例如 Microsoft Xiaoxiao Online (Natural) - Chinese (Mainland)，各种营销号就用的这些配音
-          </NTooltip>
-          系列语音，效果<NText strong>好很多</NText>
-        </NAlert>
-
-        <NAlert
-          type="warning"
-          closable
-        >
-          <template #icon>
-            <NIcon :component="Info24Filled" />
-          </template>
-          <NText strong>重要：</NText> 当在后台运行时请关闭浏览器的页面休眠/内存节省功能
-          <NDivider vertical />
-          <NButton
-            tag="a"
-            type="info"
-            href="https://support.google.com/chrome/answer/12929150?hl=zh-Hans"
-            target="_blank"
-            text
-            size="small"
-          >
-            Chrome 设置
-          </NButton>
-          <NButton
-            tag="a"
-            type="info"
-            href="https://support.microsoft.com/zh-cn/topic/%E4%BA%86%E8%A7%A3-microsoft-edge-%E4%B8%AD%E7%9A%84%E6%80%A7%E8%83%BD%E5%8A%9F%E8%83%BD-7b36f363-2119-448a-8de6-375cfd88ab25"
-            target="_blank"
-            text
-            size="small"
-          >
-            Edge 设置
-          </NButton>
-        </NAlert>
-      </NSpace>
-
-      <!-- 主控制区域 -->
-      <NCard
-        :bordered="false"
-        style="margin-top: 16px"
-      >
-        <NSpace
-          vertical
-          :size="16"
-        >
-          <NSpace
-            align="center"
-            justify="space-between"
-            :wrap="false"
-          >
-            <NSpace align="center">
-              <NButton
-                :type="speechState.canSpeech ? 'error' : 'primary'"
-                size="large"
-                :loading="speechState.isApiAudioLoading"
-                data-umami-event="Use TTS"
-                :data-umami-event-uid="accountInfo?.id"
-                @click="speechState.canSpeech ? stopSpeech() : startSpeech()"
-              >
-                <template #icon>
-                  <NIcon :component="speechState.canSpeech ? MicOff24Filled : Mic24Filled" />
-                </template>
-                {{ speechState.canSpeech ? '停止监听' : '开始监听' }}
-              </NButton>
-
-              <NDivider vertical />
-
-              <NButton
-                :type="speechState.isSpeaking ? 'error' : 'default'"
-                :disabled="!speechState.isSpeaking"
-                @click="cancelSpeech"
-              >
-                <template #icon>
-                  <NIcon :component="Dismiss20Filled" />
-                </template>
-                取消当前
-              </NButton>
-
-              <NButton
-                type="warning"
-                secondary
-                :disabled="speakQueue.length === 0"
-                @click="clearQueue"
-              >
-                <template #icon>
-                  <NIcon :component="Dismiss20Filled" />
-                </template>
-                清空队列
-              </NButton>
-            </NSpace>
-
-            <NSpace align="center">
-              <NPopconfirm @positive-click="downloadConfig">
-                <template #trigger>
-                  <NButton
-                    type="primary"
-                    secondary
-                    size="small"
-                    :disabled="!accountInfo"
-                  >
-                    <template #icon>
-                      <NIcon :component="Settings20Filled" />
-                    </template>
-                    获取配置
-                  </NButton>
-                </template>
-                这将覆盖当前设置，确定？
-              </NPopconfirm>
-
-              <NButton
-                type="primary"
-                secondary
-                size="small"
-                :disabled="!accountInfo"
-                @click="uploadConfig"
-              >
-                <template #icon>
-                  <NIcon :component="CheckmarkCircle20Filled" />
-                </template>
-                保存配置
-              </NButton>
-            </NSpace>
-          </NSpace>
-
-          <!-- 音频输出设备选择 -->
-          <NDivider style="margin: 8px 0">
-            音频输出设置
-          </NDivider>
-          <NSpace
-            align="center"
-            :size="12"
-          >
-            <NIcon
-              :component="Speaker124Filled"
-              :size="20"
-            />
-            <NText>输出设备：</NText>
-            <NSelect
-              v-model:value="selectedDeviceId"
-              :options="deviceOptions"
-              :loading="isLoadingDevices"
-              style="min-width: 250px; flex: 1"
-              :disabled="availableDevices.length === 0"
-            />
-            <NButton
-              :loading="isLoadingDevices"
-              @click="loadAudioDevices"
-            >
-              刷新设备
-            </NButton>
-          </NSpace>
-          <NAlert
-            v-if="availableDevices.length === 0 && !isLoadingDevices"
-            type="warning"
-            :bordered="false"
-          >
-            <template #icon>
-              <NIcon :component="Info24Filled" />
-            </template>
-            未检测到音频输出设备或浏览器不支持设备选择功能
-          </NAlert>
-        </NSpace>
-      </NCard>
-
-      <!-- 状态统计区域 -->
-      <NCard
-        v-if="speechState.canSpeech"
-        title="实时状态"
-        :bordered="false"
-        style="margin-top: 16px"
-      >
-        <NGrid
-          :cols="4"
-          :x-gap="12"
-          :y-gap="12"
-          responsive="screen"
-        >
-          <NGi>
-            <NStatistic label="当前状态">
-              <template #prefix>
-                <NTooltip v-if="speechState.isApiAudioLoading">
-                  <template #trigger>
-                    <NSpin :size="20" />
-                  </template>
-                  加载中
-                </NTooltip>
-                <NIcon
-                  v-else
-                  :component="Mic24Filled"
-                  :color="speechState.isSpeaking ? '#18a058' : '#d0d0d0'"
-                  :size="20"
-                  :style="`animation: ${speechState.isSpeaking ? 'pulse 2s infinite' : 'none'}`"
-                />
-              </template>
-              <NText :type="speechState.isSpeaking ? 'success' : 'default'">
-                {{ speechState.isSpeaking ? '朗读中' : '待机' }}
-              </NText>
-            </NStatistic>
-            <NText
-              v-if="speechState.isSpeaking"
-              depth="3"
-              style="font-size: 12px; display: block; margin-top: 4px"
-            >
-              {{ speechState.speakingText }}
-            </NText>
-          </NGi>
-
-          <NGi>
-            <NStatistic
-              label="队列长度"
-              :value="queueStats.total"
-            >
-              <template #suffix>
-                <NText depth="3">
-                  条
-                </NText>
-              </template>
-            </NStatistic>
-          </NGi>
-
-          <NGi>
-            <NStatistic
-              label="已读取"
-              :value="readedDanmaku"
-            >
-              <template #suffix>
-                <NText depth="3">
-                  条
-                </NText>
-              </template>
-            </NStatistic>
-          </NGi>
-
-          <NGi>
-            <NStatistic label="队列分布">
-              <NSpace
-                :size="8"
-                style="margin-top: 4px"
-              >
-                <NTooltip v-if="queueStats.messages > 0">
-                  <template #trigger>
-                    <NTag
-                      :bordered="false"
-                      type="info"
-                      size="small"
-                    >
-                      弹幕 {{ queueStats.messages }}
-                    </NTag>
-                  </template>
-                  弹幕消息数量
-                </NTooltip>
-                <NTooltip v-if="queueStats.gifts > 0">
-                  <template #trigger>
-                    <NTag
-                      :bordered="false"
-                      type="success"
-                      size="small"
-                    >
-                      礼物 {{ queueStats.gifts }}
-                    </NTag>
-                  </template>
-                  礼物消息数量
-                </NTooltip>
-                <NTooltip v-if="queueStats.waiting > 0">
-                  <template #trigger>
-                    <NTag
-                      :bordered="false"
-                      type="warning"
-                      size="small"
-                      style="animation: pulse 2s infinite"
-                    >
-                      等待 {{ queueStats.waiting }}
-                    </NTag>
-                  </template>
-                  等待合并的礼物
-                </NTooltip>
-              </NSpace>
-            </NStatistic>
-          </NGi>
-        </NGrid>
-
-        <!-- 队列详情 -->
-        <NDivider style="margin: 16px 0" />
-        <NCollapse>
-          <NCollapseItem
-            title="队列详情"
-            name="queue"
-          >
-            <template #header-extra>
-              <NTag
-                :bordered="false"
-                size="small"
-              >
-                {{ speakQueue.length }} 项
-              </NTag>
-            </template>
-
-            <NEmpty
-              v-if="speakQueue.length === 0"
-              description="队列为空"
-              size="small"
-            />
-
-            <NScrollbar
-              v-else
-              style="max-height: 300px"
-            >
-              <NList
-                size="small"
-                bordered
-              >
-                <NListItem
-                  v-for="(item, index) in speakQueue"
-                  :key="`${item.data.time}-${index}`"
-                >
-                  <NSpace
-                    align="center"
-                    :size="8"
-                  >
-                    <NButton
-                      type="primary"
-                      size="tiny"
-                      circle
-                      @click="forceSpeak(item.data)"
-                    >
-                      <template #icon>
-                        <NIcon :component="Play20Filled" />
-                      </template>
-                    </NButton>
-
-                    <NButton
-                      type="error"
-                      size="tiny"
-                      circle
-                      @click="removeFromQueue(item)"
-                    >
-                      <template #icon>
-                        <NIcon :component="Dismiss20Filled" />
-                      </template>
-                    </NButton>
-
-                    <NTag
-                      v-if="item.data.type == EventDataTypes.Gift && item.combineCount"
-                      type="info"
-                      size="small"
-                      :bordered="false"
-                      style="animation: pulse 2s infinite"
-                    >
-                      连续赠送中
-                    </NTag>
-                    <NTag
-                      v-else-if="item.data.type == EventDataTypes.Gift && settings.combineGiftDelay"
-                      type="success"
-                      size="small"
-                      :bordered="false"
-                    >
-                      等待合并
-                    </NTag>
-
-                    <NTag
-                      :type="getEventTypeTag(item.data.type).type"
-                      size="small"
-                      :bordered="false"
-                    >
-                      {{ getEventTypeTag(item.data.type).text }}
-                    </NTag>
-
-                    <NText strong>
-                      {{ item.data.uname }}
-                    </NText>
-
-                    <NText depth="3">
-                      {{ speechService.getTextFromDanmaku(item.data) }}
-                    </NText>
-                  </NSpace>
-                </NListItem>
-              </NList>
-            </NScrollbar>
-          </NCollapseItem>
-        </NCollapse>
-      </NCard>
-
-      <!-- 语音设置区域 -->
-      <NCard
-        title="语音设置"
-        :bordered="false"
-        style="margin-top: 16px"
-      >
-        <NSpace
-          vertical
-          :size="16"
-        >
-          <NRadioGroup
-            v-model:value="settings.voiceType"
-            size="large"
-          >
-            <NRadioButton value="local">
-              <NSpace :size="4">
-                <span>本地语音</span>
-                <NTooltip>
-                  <template #trigger>
-                    <NIcon
-                      :component="Info24Filled"
-                      :size="16"
-                    />
-                  </template>
-                  使用浏览器内置的语音合成功能
-                </NTooltip>
-              </NSpace>
-            </NRadioButton>
-
-            <NRadioButton value="api">
-              <NSpace :size="4">
-                <span>API 语音</span>
-                <NTooltip>
-                  <template #trigger>
-                    <NIcon
-                      :component="Info24Filled"
-                      :size="16"
-                    />
-                  </template>
-                  自定义语音API，可以播放自己训练的模型或其他TTS
-                </NTooltip>
-              </NSpace>
-            </NRadioButton>
-          </NRadioGroup>
-
-          <Transition
-            name="fade"
-            mode="out-in"
-          >
-            <!-- 本地语音设置 -->
-            <NSpace
-              v-if="settings.voiceType === 'local'"
-              vertical
-              :size="16"
-            >
-              <div>
-                <NText strong>选择语音</NText>
-                <NSelect
-                  v-model:value="settings.speechInfo.voice"
-                  :options="voiceOptions"
-                  :fallback-option="() => ({
-                    label: settings.speechInfo.voice ? `已选择: ${settings.speechInfo.voice}` : '未选择, 将使用默认语音',
-                    value: settings.speechInfo.voice || '',
-                  })"
-                  style="margin-top: 8px"
-                  filterable
-                />
-              </div>
-
-              <div>
-                <NSpace
-                  justify="space-between"
-                  align="center"
-                >
-                  <NText>音量</NText>
-                  <NText depth="3">
-                    {{ (settings.speechInfo.volume * 100).toFixed(0) }}%
-                  </NText>
-                </NSpace>
-                <NSlider
-                  v-model:value="settings.speechInfo.volume"
-                  :min="0"
-                  :max="1"
-                  :step="0.01"
-                  style="margin-top: 8px"
-                />
-              </div>
-
-              <div>
-                <NSpace
-                  justify="space-between"
-                  align="center"
-                >
-                  <NText>音调</NText>
-                  <NText depth="3">
-                    {{ settings.speechInfo.pitch.toFixed(2) }}
-                  </NText>
-                </NSpace>
-                <NSlider
-                  v-model:value="settings.speechInfo.pitch"
-                  :min="0"
-                  :max="2"
-                  :step="0.01"
-                  style="margin-top: 8px"
-                />
-              </div>
-
-              <div>
-                <NSpace
-                  justify="space-between"
-                  align="center"
-                >
-                  <NText>语速</NText>
-                  <NText depth="3">
-                    {{ settings.speechInfo.rate.toFixed(2) }}
-                  </NText>
-                </NSpace>
-                <NSlider
-                  v-model:value="settings.speechInfo.rate"
-                  :min="0"
-                  :max="2"
-                  :step="0.01"
-                  style="margin-top: 8px"
-                />
-              </div>
-            </NSpace>
-
-            <!-- API 语音设置 -->
-            <NSpace
-              v-else
-              vertical
-              :size="16"
-            >
-              <NCollapse>
-                <NCollapseItem
-                  title="📖 使用说明"
-                  name="requirements"
-                >
-                  <NSpace
-                    vertical
-                    :size="8"
-                  >
-                    <NText>API 要求：</NText>
-                    <ul style="margin: 0; padding-left: 24px">
-                      <li>直接返回音频数据（wav, mp3, m4a 等）</li>
-                      <li>建议使用 HTTPS（HTTP 将通过 Cloudflare Workers 代理，会较慢）</li>
-                      <li>确保 API 可以被外部访问</li>
-                    </ul>
-                    <NDivider style="margin: 8px 0" />
-                    <NText>推荐项目（可本地部署）：</NText>
-                    <NButton
-                      text
-                      type="info"
-                      tag="a"
-                      href="https://github.com/fishaudio/Bert-VITS2"
-                      target="_blank"
-                    >
-                      Bert-VITS2
-                    </NButton>
-                  </NSpace>
-                </NCollapseItem>
-              </NCollapse>
-
-              <NAlert
-                v-if="isVtsuruVoiceAPI"
-                type="success"
-                closable
-              >
-                <template #icon>
-                  <NIcon :component="Info24Filled" />
-                </template>
-                你正在使用本站提供的测试 API (voice.vtsuru.live)，仅用于测试，不保证可用性
-              </NAlert>
-
-              <NAlert type="info">
-                地址中的
-                <NButton
-                  size="tiny"
-                  type="primary"
-                  text
-                  @click="copyToClipboard('{{text}}')"
-                  v-text="'{{ text }}'"
-                />
-                将被替换为要念的文本
-              </NAlert>
-
-              <div>
-                <NText strong>API 地址</NText>
-                <NInputGroup style="margin-top: 8px">
-                  <NSelect
-                    v-model:value="settings.voiceAPISchemeType"
-                    :options="[
-                      { label: 'https://', value: 'https' },
-                      { label: 'http://', value: 'http' },
-                    ]"
-                    style="width: 110px"
-                  />
-                  <NInput
-                    v-model:value="settings.voiceAPI"
-                    placeholder="例如: xxx.com/voice/bert-vits2?text={{text}}&id=0"
-                    :status="/^(?:https?:\/\/)/.test(settings.voiceAPI?.toLowerCase() ?? '') ? 'error' : undefined"
-                  />
-                  <NButton
-                    type="info"
-                    :loading="speechState.isApiAudioLoading"
-                    @click="testAPI"
-                  >
-                    测试
-                  </NButton>
-                </NInputGroup>
-              </div>
-
-              <NAlert
-                v-if="settings.voiceAPISchemeType === 'http'"
-                type="warning"
-              >
-                <template #icon>
-                  <NIcon :component="Info24Filled" />
-                </template>
-                <NSpace
-                  vertical
-                  :size="8"
-                >
-                  <NText>不使用 HTTPS 将通过 Cloudflare Workers 代理，速度会慢很多</NText>
-                  <NCheckbox v-model:checked="settings.useAPIDirectly">
-                    不使用代理（需要了解可能产生的影响）
-                  </NCheckbox>
-                </NSpace>
-              </NAlert>
-
-              <div>
-                <NSpace
-                  justify="space-between"
-                  align="center"
-                >
-                  <NText>音量</NText>
-                  <NText depth="3">
-                    {{ (settings.speechInfo.volume * 100).toFixed(0) }}%
-                  </NText>
-                </NSpace>
-                <NSlider
-                  v-model:value="settings.speechInfo.volume"
-                  :min="0"
-                  :max="1"
-                  :step="0.01"
-                  style="margin-top: 8px"
-                />
-              </div>
-
-              <!-- 隐藏的音频元素 -->
-              <audio
-                ref="apiAudio"
-                :src="speechState.apiAudioSrc"
-                :volume="settings.speechInfo.volume"
-                style="display: none"
-                @ended="cancelSpeech"
-                @canplay="speechState.isApiAudioLoading = false"
-                @error="onAPIError"
-              />
-            </NSpace>
-          </Transition>
-        </NSpace>
-      </NCard>
-
-      <!-- 模板设置区域 -->
-      <NCard
-        title="消息模板"
-        :bordered="false"
-        style="margin-top: 16px"
-      >
-        <NSpace
-          vertical
-          :size="16"
-        >
-          <NAlert
-            type="info"
-            :bordered="false"
-          >
-            <template #icon>
-              <NIcon :component="Info24Filled" />
-            </template>
-            <NText>支持的变量（点击复制）：</NText>
-            <NDivider style="margin: 8px 0" />
-            <NSpace :size="8">
-              <NButton
-                v-for="item in Object.values(templateConstants)"
-                :key="item.name"
-                size="tiny"
-                secondary
-                @click="copyToClipboard(item.words)"
-              >
-                {{ item.words }}
-                <NDivider vertical />
-                {{ item.name }}
-              </NButton>
-            </NSpace>
-          </NAlert>
-
-          <NText depth="3" style="font-size: 12px; margin-bottom: 8px;">
-            提示：模板留空则不播报对应类型的事件
-          </NText>
-
-          <div>
-            <NInputGroup>
-              <NInputGroupLabel style="min-width: 120px">
-                弹幕模板
-              </NInputGroupLabel>
-              <NInput
-                v-model:value="settings.danmakuTemplate"
-              />
-              <NButton
-                type="info"
-                :loading="speechState.isApiAudioLoading"
-                @click="test(EventDataTypes.Message)"
-              >
-                测试
-              </NButton>
-            </NInputGroup>
-          </div>
-
-          <div>
-            <NInputGroup>
-              <NInputGroupLabel style="min-width: 120px">
-                礼物模板
-              </NInputGroupLabel>
-              <NInput
-                v-model:value="settings.giftTemplate"
-              />
-              <NButton
-                type="info"
-                :loading="speechState.isApiAudioLoading"
-                @click="test(EventDataTypes.Gift)"
-              >
-                测试
-              </NButton>
-            </NInputGroup>
-          </div>
-
-          <div>
-            <NInputGroup>
-              <NInputGroupLabel style="min-width: 120px">
-                SC 模板
-              </NInputGroupLabel>
-              <NInput
-                v-model:value="settings.scTemplate"
-              />
-              <NButton
-                type="info"
-                :loading="speechState.isApiAudioLoading"
-                @click="test(EventDataTypes.SC)"
-              >
-                测试
-              </NButton>
-            </NInputGroup>
-          </div>
-
-          <div>
-            <NInputGroup>
-              <NInputGroupLabel style="min-width: 120px">
-                上舰模板
-              </NInputGroupLabel>
-              <NInput
-                v-model:value="settings.guardTemplate"
-              />
-              <NButton
-                type="info"
-                :loading="speechState.isApiAudioLoading"
-                @click="test(EventDataTypes.Guard)"
-              >
-                测试
-              </NButton>
-            </NInputGroup>
-          </div>
-
-          <div>
-            <NInputGroup>
-              <NInputGroupLabel style="min-width: 120px">
-                进入直播间模板
-              </NInputGroupLabel>
-              <NInput
-                v-model:value="settings.enterTemplate"
-              />
-              <NButton
-                type="info"
-                :loading="speechState.isApiAudioLoading"
-                @click="test(EventDataTypes.Enter)"
-              >
-                测试
-              </NButton>
-            </NInputGroup>
-          </div>
-        </NSpace>
-      </NCard>
-
-      <!-- 高级设置区域 -->
-      <NCard
-        title="高级设置"
-        :bordered="false"
-        style="margin-top: 16px"
-      >
-        <NSpace
-          vertical
-          :size="16"
-        >
-          <NSpace align="center">
-            <NCheckbox
-              :checked="settings.combineGiftDelay !== undefined"
-              @update:checked="(checked: boolean) => {
-                settings.combineGiftDelay = checked ? 2 : undefined
-              }"
-            >
-              <NSpace
-                :size="4"
-                align="center"
-              >
-                <span>礼物合并</span>
-                <NTooltip>
-                  <template #trigger>
-                    <NIcon
-                      :component="Info24Filled"
-                      :size="16"
-                    />
-                  </template>
-                  在指定时间内连续送相同礼物会等停止送礼物之后才会念。
-                  <br>
-                  这也会导致送的礼物会等待指定时间之后才会念，即使没有连续赠送。
-                </NTooltip>
-              </NSpace>
-            </NCheckbox>
-
-            <NInputGroup
-              v-if="settings.combineGiftDelay !== undefined"
-              style="width: 200px"
-            >
-              <NInputGroupLabel>延迟（秒）</NInputGroupLabel>
-              <NInputNumber
-                v-model:value="settings.combineGiftDelay"
-                :min="1"
-                :max="10"
-                @update:value="(value) => {
-                  if (!value || value <= 0) settings.combineGiftDelay = undefined
-                }"
-              />
-            </NInputGroup>
-          </NSpace>
-
-          <NCheckbox v-model:checked="settings.splitText">
-            <NSpace
-              :size="4"
-              align="center"
-            >
-              <span>启用句子拆分</span>
-              <NTooltip>
-                <template #trigger>
-                  <NIcon
-                    :component="Info24Filled"
-                    :size="16"
-                  />
-                </template>
-                仅 API 方式可用，为英文用户名用引号包裹起来，并将所有大写单词拆分成单个单词，以防止部分单词念不出来。
-                <br>
-                例：原文: Megghy 说: UPPERCASE单词
-                <br>
-                结果: 'Megghy' 说: U P P E R C A S E 单词
-              </NTooltip>
-            </NSpace>
-          </NCheckbox>
-        </NSpace>
-      </NCard>
-    </template>
-  </div>
-</template>
-
-<style scoped>
-.read-danmaku-container {
-  width: 100%;
-  padding: 16px;
-  background: var(--n-color);
-  border-radius: 8px;
-}
-
-@keyframes pulse {
-  0%, 100% {
-    opacity: 1;
-    transform: scale(1);
-  }
-  50% {
-    opacity: 0.7;
-    transform: scale(0.95);
-  }
-}
-
-.fade-enter-active,
-.fade-leave-active {
-  transition: opacity 0.3s ease, transform 0.3s ease;
-}
-
-.fade-enter-from {
-  opacity: 0;
-  transform: translateY(-10px);
-}
-
-.fade-leave-to {
-  opacity: 0;
-  transform: translateY(10px);
-}
-
-/* 响应式设计 */
-@media (max-width: 768px) {
-  .read-danmaku-container {
-    padding: 12px;
-  }
-}
-
-/* 暗色模式优化 */
-@media (prefers-color-scheme: dark) {
-  .read-danmaku-container {
-    background: var(--n-color);
-  }
-}
-</style>
+ <ReadDanmaku />
+</template>
\ No newline at end of file
diff --git a/src/components.d.ts b/src/components.d.ts
index 986dd56..923672d 100644
--- a/src/components.d.ts
+++ b/src/components.d.ts
@@ -18,13 +18,18 @@ declare module 'vue' {
     LabelItem: typeof import('./components/LabelItem.vue')['default']
     LiveInfoContainer: typeof import('./components/LiveInfoContainer.vue')['default']
     MonacoEditorComponent: typeof import('./components/MonacoEditorComponent.vue')['default']
-    NEllipsis: typeof import('naive-ui')['NEllipsis']
-    NEmpty: typeof import('naive-ui')['NEmpty']
+    NAvatar: typeof import('naive-ui')['NAvatar']
+    NButton: typeof import('naive-ui')['NButton']
+    NCard: typeof import('naive-ui')['NCard']
     NFlex: typeof import('naive-ui')['NFlex']
     NFormItemGi: typeof import('naive-ui')['NFormItemGi']
     NGridItem: typeof import('naive-ui')['NGridItem']
     NIcon: typeof import('naive-ui')['NIcon']
+    NImage: typeof import('naive-ui')['NImage']
+    NPopconfirm: typeof import('naive-ui')['NPopconfirm']
     NScrollbar: typeof import('naive-ui')['NScrollbar']
+    NSpace: typeof import('naive-ui')['NSpace']
+    NSwitch: typeof import('naive-ui')['NSwitch']
     NTag: typeof import('naive-ui')['NTag']
     NText: typeof import('naive-ui')['NText']
     PointGoodsItem: typeof import('./components/manage/PointGoodsItem.vue')['default']
diff --git a/src/data/constants.ts b/src/data/constants.ts
index 7df8ff0..48201ce 100644
--- a/src/data/constants.ts
+++ b/src/data/constants.ts
@@ -19,7 +19,7 @@ export const THINGS_URL = `${FILE_BASE_URL}/things/`
 export const apiFail = ref(false)
 
 export const BASE_URL
-  = process.env.NODE_ENV === 'development'
+  = import.meta.env.MODE === 'development' // import.meta.env exposes MODE; NODE_ENV is not a built-in key there
     ? debugAPI
     : apiFail.value
       ? failoverAPI
@@ -27,7 +27,7 @@ export const BASE_URL
 export const BASE_API_URL = `${BASE_URL}api/`
 export const FETCH_API = 'https://fetch.vtsuru.live/'
 export const BASE_HUB_URL
-  = `${process.env.NODE_ENV === 'development'
+  = `${import.meta.env.MODE === 'development'
     ? debugAPI
     : apiFail.value
       ? failoverAPI
@@ -65,6 +65,7 @@ export const CHECKIN_API_URL = `${BASE_API_URL}checkin/`
 export const USER_CONFIG_API_URL = `${BASE_API_URL}user-config/`
 export const FILE_API_URL = `${BASE_API_URL}files/`
 export const VOTE_API_URL = `${BASE_API_URL}vote/`
+export const TTS_API_URL = `${BASE_API_URL}tts/`
 
 export interface TemplateMapType {
   [key: string]: {
diff --git a/src/store/useSpeechService.ts b/src/store/useSpeechService.ts
index a47b55b..3f5ad44 100644
--- a/src/store/useSpeechService.ts
+++ b/src/store/useSpeechService.ts
@@ -7,7 +7,7 @@ import { clearInterval, setInterval } from 'worker-timers'
 import type { EventModel } from '@/api/api-models'
 import { DownloadConfig, UploadConfig, useAccount } from '@/api/account'
 import { EventDataTypes } from '@/api/api-models'
-import { FETCH_API } from '@/data/constants'
+import { FETCH_API, TTS_API_URL } from '@/data/constants'
 
 export interface SpeechSettings {
   speechInfo: SpeechInfo
@@ -16,12 +16,14 @@ export interface SpeechSettings {
   guardTemplate: string
   giftTemplate: string
   enterTemplate: string
-  voiceType: 'local' | 'api'
+  voiceType: 'local' | 'api' | 'azure'
   voiceAPISchemeType: 'http' | 'https'
   voiceAPI: string
   splitText: boolean
   useAPIDirectly: boolean
   combineGiftDelay: number | undefined
+  azureVoice: string
+  azureLanguage: string
 }
 
 export interface SpeechInfo {
@@ -65,6 +67,8 @@ const DEFAULT_SETTINGS: SpeechSettings = {
   useAPIDirectly: false,
   splitText: false,
   combineGiftDelay: 2,
+  azureVoice: 'zh-CN-XiaoxiaoNeural',
+  azureLanguage: 'zh-CN',
 }
 
 export const templateConstants = {
@@ -134,6 +138,7 @@ function createSpeechService() {
 
   const apiAudio = ref<HTMLAudioElement>()
   let checkTimer: number | undefined
+  let loadingTimeoutTimer: number | undefined // Timer handle for the API-audio loading timeout
   let speechQueueTimer: number | undefined
 
   const speechSynthesisInfo = ref<{
@@ -204,6 +209,11 @@ function createSpeechService() {
       checkTimer = undefined
     }
 
+    if (loadingTimeoutTimer) {
+      clearInterval(loadingTimeoutTimer)
+      loadingTimeoutTimer = undefined
+    }
+
     cancelSpeech()
     giftCombineMap.clear()
     speakQueue.value = []
@@ -294,10 +304,7 @@ function createSpeechService() {
       text = text.replace(templateConstants.guard_num.regex, (data.num ?? 0).toString())
     }
 
-    text = fullWidthToHalfWidth(text)
-      .replace(/[^0-9a-z\u4E00-\u9FFF\u3400-\u4DBF\uF900-\uFAFF,.:'"\s]/gi, '')
-      .normalize('NFKC')
-
+    // Returned as built: no character filtering or normalization is applied at this point.
     return text
   }
 
@@ -359,6 +366,13 @@ function createSpeechService() {
    * 构建API请求URL
    */
   function buildApiUrl(text: string): string | null {
+    // Azure TTS
+    if (settings.value.voiceType === 'azure') {
+      const apiUrl = `${TTS_API_URL}azure?text=${encodeURIComponent(text)}`
+      return apiUrl
+    }
+
+    // 自定义 API
     if (!settings.value.voiceAPI) {
       message.error('未设置语音API')
       return null
@@ -400,15 +414,47 @@ function createSpeechService() {
    * 使用API TTS朗读
    */
   function speakFromAPI(text: string) {
-    const url = buildApiUrl(text)
+    let url = buildApiUrl(text)
     if (!url) {
       cancelSpeech()
       return
     }
 
+    // For Azure TTS, append the extra query parameters (voice, language, rate, pitch, streaming)
+    if (settings.value.voiceType === 'azure') {
+      const azureUrl = new URL(url)
+      azureUrl.searchParams.set('voice', settings.value.azureVoice)
+      azureUrl.searchParams.set('language', settings.value.azureLanguage)
+      azureUrl.searchParams.set('rate', settings.value.speechInfo.rate.toString())
+      azureUrl.searchParams.set('pitch', settings.value.speechInfo.pitch.toString())
+      azureUrl.searchParams.set('streaming', 'true')
+      url = azureUrl.toString()
+    }
+
     speechState.isSpeaking = true
     speechState.isApiAudioLoading = true
-    speechState.apiAudioSrc = url
+    
+    // Clear apiAudioSrc first so the audio element reloads properly;
+    // this avoids a src update failing to trigger a load during back-to-back playback
+    speechState.apiAudioSrc = ''
+    
+    // nextTick would normally be used to set the new src after the DOM update,
+    // but since this code lives in a store, setTimeout is used to approximate it
+    setTimeout(() => {
+      speechState.apiAudioSrc = url
+    }, 0)
+
+    // Arm the 10-second loading timeout (replacing any timer that is still pending)
+    if (loadingTimeoutTimer) {
+      clearInterval(loadingTimeoutTimer)
+    }
+    loadingTimeoutTimer = setInterval(() => {
+      if (speechState.isApiAudioLoading) {
+        console.error('[TTS] 音频加载超时 (10秒)')
+        message.error('音频加载超时，请检查网络连接或API状态')
+        cancelSpeech()
+      }
+    }, 10000) // 10 s; this is setInterval, so it re-fires until the timer is cleared
   }
 
   /**
@@ -470,7 +516,10 @@ function createSpeechService() {
       if (settings.value.voiceType == 'local') {
         speakDirect(text)
       } else {
-        text = settings.value.splitText ? insertSpaces(text) : text
+        // 只有自定义 API 且启用了 splitText 才进行文本拆分
+        if (settings.value.voiceType === 'api' && settings.value.splitText) {
+          text = insertSpaces(text)
+        }
         speakFromAPI(text)
       }
 
@@ -489,16 +538,34 @@ function createSpeechService() {
       checkTimer = undefined
     }
 
+    if (loadingTimeoutTimer) {
+      clearInterval(loadingTimeoutTimer)
+      loadingTimeoutTimer = undefined
+    }
+
     speechState.isApiAudioLoading = false
 
     if (apiAudio.value && !apiAudio.value.paused) {
       apiAudio.value.pause()
     }
 
+    // 清空音频源，确保下次播放时能正确加载新的音频
+    speechState.apiAudioSrc = ''
+
     EasySpeech.cancel()
     speechState.speakingText = ''
   }
 
+  /**
+   * Disarm the audio-loading timeout timer.
+   * Does nothing when no timer is currently set.
+   */
+  function clearLoadingTimeout() {
+    if (!loadingTimeoutTimer) return
+    clearInterval(loadingTimeoutTimer)
+    loadingTimeoutTimer = undefined
+  }
+
   /**
    * 接收事件并添加到队列
    */
@@ -680,6 +747,7 @@ function createSpeechService() {
     startSpeech,
     stopSpeech,
     cancelSpeech,
+    clearLoadingTimeout,
     uploadConfig,
     downloadConfig,
     getTextFromDanmaku,
diff --git a/src/views/open_live/ReadDanmaku.vue b/src/views/open_live/ReadDanmaku.vue
index 54aa365..30c9aec 100644
--- a/src/views/open_live/ReadDanmaku.vue
+++ b/src/views/open_live/ReadDanmaku.vue
@@ -47,6 +47,7 @@ import { EventDataTypes } from '@/api/api-models'
 import { useDanmakuClient } from '@/store/useDanmakuClient'
 import { templateConstants, useSpeechService } from '@/store/useSpeechService'
 import { copyToClipboard } from '@/Utils'
+import { TTS_API_URL } from '@/data/constants';
 
 const props = defineProps<{
   roomInfo?: any
@@ -68,6 +69,10 @@ const {
   apiAudio,
 } = speechService
 
+// Azure voice options (label / value / locale) and the loading flag for fetching them
+const azureVoices = ref<Array<{ label: string; value: string; locale: string }>>([])
+const azureVoicesLoading = ref(false)
+
 // 计算属性
 const isVtsuruVoiceAPI = computed(() => {
   return (
@@ -197,6 +202,61 @@ function testAPI() {
   }
 }
 
+/**
+ * Load the Azure voice list from `${TTS_API_URL}voices` into `azureVoices`.
+ * No-op when voices are already loaded or a request is in flight; keeps zh-/ja-/en- locales only.
+ */
+async function fetchAzureVoices() {
+  if (azureVoices.value.length > 0 || azureVoicesLoading.value) return
+
+  azureVoicesLoading.value = true
+  try {
+    const response = await fetch(`${TTS_API_URL}voices`)
+    if (!response.ok) {
+      throw new Error('获取语音列表失败')
+    }
+
+    const voices = await response.json()
+    azureVoices.value = voices
+      .filter((v: any) => {
+        const locale = v.Locale || v.locale || ''
+        return locale.startsWith('zh-') || locale.startsWith('ja-') || locale.startsWith('en-')
+      })
+      .map((v: any) => {
+        const shortName = v.ShortName || v.shortName || ''
+        const localeName = v.LocaleName || v.localeName || ''
+        const localName = v.LocalName || v.localName || v.DisplayName || v.displayName || ''
+        const gender = v.Gender || v.gender || ''
+        // Tag only known genders; anything else gets no tag rather than defaulting to female
+        const genderTag = gender === 'Male' ? ' (男)' : gender === 'Female' ? ' (女)' : ''
+        const isMultilingual = shortName.toLowerCase().includes('multilingual')
+
+        return {
+          label: `[${localeName}] ${localName}${genderTag}${isMultilingual ? ' 🌍' : ''}`,
+          value: shortName,
+          locale: v.Locale || v.locale || '',
+        }
+      })
+      .sort((a: any, b: any) => {
+        // Multilingual models first
+        const aMulti = a.value.toLowerCase().includes('multilingual')
+        const bMulti = b.value.toLowerCase().includes('multilingual')
+        if (aMulti && !bMulti) return -1
+        if (!aMulti && bMulti) return 1
+
+        // Then by language: Chinese first, Japanese next, English last
+        const aScore = a.locale.startsWith('zh-') ? 0 : a.locale.startsWith('ja-') ? 1 : 2
+        const bScore = b.locale.startsWith('zh-') ? 0 : b.locale.startsWith('ja-') ? 1 : 2
+        return aScore - bScore
+      })
+  } catch (error) {
+    console.error('[Azure TTS] 获取语音列表失败:', error)
+    message.error('获取 Azure 语音列表失败')
+  } finally {
+    azureVoicesLoading.value = false
+  }
+}
+
 function getEventTypeTag(type: EventDataTypes) {
   switch (type) {
     case EventDataTypes.Message:
@@ -220,6 +280,16 @@ function onAPIError(_e: Event) {
   cancelSpeech()
 }
 
+// <audio> canplay / error handlers: both clear the speech service's audio-loading timeout.
+function onAudioCanPlay() {
+  speechState.isApiAudioLoading = false
+  speechService.clearLoadingTimeout()
+}
+function onAudioError(e: Event) {
+  speechService.clearLoadingTimeout()
+  onAPIError(e)
+}
+
 // 生命周期
 onMounted(async () => {
   await speechService.initialize()
@@ -229,6 +299,11 @@ onMounted(async () => {
   client.onEvent('guard', onGetEvent)
   client.onEvent('gift', onGetEvent)
   client.onEvent('enter', onGetEvent)
+
+  // 如果默认使用 Azure TTS，则预加载语音列表
+  if (settings.value.voiceType === 'azure') {
+    fetchAzureVoices()
+  }
 })
 
 onUnmounted(() => {
@@ -646,6 +721,21 @@ onUnmounted(() => {
               </NSpace>
             </NRadioButton>
 
+            <NRadioButton value="azure">
+              <NSpace :size="4">
+                <span>Azure TTS</span>
+                <NTooltip>
+                  <template #trigger>
+                    <NIcon
+                      :component="Info24Filled"
+                      :size="16"
+                    />
+                  </template>
+                  使用 Microsoft Azure 语音合成服务, 混合语言输出效果和音质好, 略有延迟
+                </NTooltip>
+              </NSpace>
+            </NRadioButton>
+
             <NRadioButton value="api">
               <NSpace :size="4">
                 <span>API 语音</span>
@@ -744,6 +834,127 @@ onUnmounted(() => {
               </div>
             </NSpace>
 
+            <!-- Azure TTS 设置 -->
+            <NSpace
+              v-else-if="settings.voiceType === 'azure'"
+              vertical
+              :size="16"
+            >
+              <NAlert
+                type="success"
+                :bordered="false"
+              >
+                <template #icon>
+                  <NIcon :component="Info24Filled" />
+                </template>
+                使用本站提供的 Microsoft Azure 语音合成服务，效果最好
+              </NAlert>
+
+              <div>
+                <NSpace justify="space-between" align="center">
+                  <NText strong>语音选择</NText>
+                  <NButton
+                    v-if="azureVoices.length === 0"
+                    text
+                    type="primary"
+                    size="small"
+                    :loading="azureVoicesLoading"
+                    @click="fetchAzureVoices"
+                  >
+                    加载语音列表
+                  </NButton>
+                  <NText v-else depth="3" style="font-size: 12px">
+                    共 {{ azureVoices.length }} 个语音
+                  </NText>
+                </NSpace>
+                <NSelect
+                  v-model:value="settings.azureVoice"
+                  :options="azureVoices.length > 0 ? azureVoices : [
+                    { label: '中文(普通话)女 - 晓晓', value: 'zh-CN-XiaoxiaoNeural' },
+                    { label: '中文(普通话)女 - 晓伊', value: 'zh-CN-XiaoyiNeural' },
+                    { label: '中文(普通话)女 - 晓梦', value: 'zh-CN-XiaomengNeural' },
+                    { label: '中文(普通话)女 - 晓莫', value: 'zh-CN-XiaomoNeural' },
+                    { label: '中文(普通话)女 - 晓秋', value: 'zh-CN-XiaoqiuNeural' },
+                    { label: '中文(普通话)女 - 晓双', value: 'zh-CN-XiaoshuangNeural' },
+                    { label: '中文(普通话)女 - 晓纯', value: 'zh-CN-XiaochenNeural' },
+                    { label: '中文(普通话)女 - 晓翔', value: 'zh-CN-XiaoxiangNeural' },
+                    { label: '中文(普通话)女 - 晓蕾', value: 'zh-CN-XiaorouNeural' },
+                    { label: '中文(普通话)女 - 晓瑶', value: 'zh-CN-XiaoyouNeural' },
+                    { label: '中文(普通话)男 - 云希', value: 'zh-CN-YunxiNeural' },
+                    { label: '中文(普通话)男 - 云扬', value: 'zh-CN-YunyangNeural' },
+                    { label: '中文(普通话)男 - 云健', value: 'zh-CN-YunjianNeural' },
+                    { label: '中文(普通话)儿童 - 晓晋', value: 'zh-CN-XiaozhenNeural' },
+                    { label: '中文(普通话)儿童 - 云夏', value: 'zh-CN-YunxiaNeural' },
+                  ]"
+                  :loading="azureVoicesLoading"
+                  :fallback-option="() => ({
+                    label: settings.azureVoice ? `已选择: ${settings.azureVoice}` : '未选择',
+                    value: settings.azureVoice || '',
+                  })"
+                  style="margin-top: 8px"
+                  filterable
+                  @focus="fetchAzureVoices"
+                />
+              </div>
+
+              <div>
+                <NSpace
+                  justify="space-between"
+                  align="center"
+                >
+                  <NText>音量</NText>
+                  <NText depth="3">
+                    {{ (settings.speechInfo.volume * 100).toFixed(0) }}%
+                  </NText>
+                </NSpace>
+                <NSlider
+                  v-model:value="settings.speechInfo.volume"
+                  :min="0"
+                  :max="1"
+                  :step="0.01"
+                  style="margin-top: 8px"
+                />
+              </div>
+
+              <div>
+                <NSpace
+                  justify="space-between"
+                  align="center"
+                >
+                  <NText>音调</NText>
+                  <NText depth="3">
+                    {{ settings.speechInfo.pitch.toFixed(2) }}
+                  </NText>
+                </NSpace>
+                <NSlider
+                  v-model:value="settings.speechInfo.pitch"
+                  :min="0.5"
+                  :max="2"
+                  :step="0.01"
+                  style="margin-top: 8px"
+                />
+              </div>
+
+              <div>
+                <NSpace
+                  justify="space-between"
+                  align="center"
+                >
+                  <NText>语速</NText>
+                  <NText depth="3">
+                    {{ settings.speechInfo.rate.toFixed(2) }}
+                  </NText>
+                </NSpace>
+                <NSlider
+                  v-model:value="settings.speechInfo.rate"
+                  :min="0.5"
+                  :max="2"
+                  :step="0.01"
+                  style="margin-top: 8px"
+                />
+              </div>
+            </NSpace>
+
             <!-- API 语音设置 -->
             <NSpace
               v-else
@@ -865,19 +1076,21 @@ onUnmounted(() => {
                   style="margin-top: 8px"
                 />
               </div>
-
-              <!-- 隐藏的音频元素 -->
-              <audio
-                ref="apiAudio"
-                :src="speechState.apiAudioSrc"
-                :volume="settings.speechInfo.volume"
-                style="display: none"
-                @ended="cancelSpeech"
-                @canplay="speechState.isApiAudioLoading = false"
-                @error="onAPIError"
-              />
             </NSpace>
           </Transition>
+
+          <!-- 隐藏的音频元素 - 用于 API 和 Azure TTS -->
+          <audio
+            v-if="settings.voiceType !== 'local'"
+            ref="apiAudio"
+            :src="speechState.apiAudioSrc"
+            :volume="settings.speechInfo.volume"
+            style="display: none"
+            autoplay
+            @ended="cancelSpeech"
+            @canplay="onAudioCanPlay"
+            @error="onAudioError"
+          />
         </NSpace>
       </NCard>
 
@@ -1063,7 +1276,10 @@ onUnmounted(() => {
             </NInputGroup>
           </NSpace>
 
-          <NCheckbox v-model:checked="settings.splitText">
+          <NCheckbox
+            v-if="settings.voiceType === 'api'"
+            v-model:checked="settings.splitText"
+          >
             <NSpace
               :size="4"
               align="center"