fix: 初步适配铃音语音

2025-12-16 13:27:08 +00:00 · 2023-11-04 11:49:36 +08:00 · 2023-11-04 11:49:36 +08:00 · 61d3b48781
commit 61d3b48781
parent 7cc22e487a
2 changed files with 22 additions and 16 deletions
--- a/utils/common.js
+++ b/utils/common.js
@ -847,14 +847,13 @@ export function getMaxModelTokens (model = 'gpt-3.5-turbo') {
 export function getUin (e) {
  if (e?.bot?.uin) return e.bot.uin
  if (Array.isArray(Bot.uin)) {
-    if (Config.trssBotUin && Bot.uin.indexOf(Config.trssBotUin) > -1) {return Config.trssBotUin}
-    else {
-        Bot.uin.forEach((u) => {
-          if (Bot[u].self_id) {
-            return Bot[u].self_id
-          }
-        })
-        return Bot.uin[Bot.uin.length - 1]
+    if (Config.trssBotUin && Bot.uin.indexOf(Config.trssBotUin) > -1) { return Config.trssBotUin } else {
+      Bot.uin.forEach((u) => {
+        if (Bot[u].self_id) {
+          return Bot[u].self_id
+        }
+      })
+      return Bot.uin[Bot.uin.length - 1]
    }
  } else return Bot.uin
 }
@ -871,6 +870,7 @@ export async function generateAudio (e, pendingText, speakingEmotion, emotionDeg
  if (!Config.ttsSpace && !Config.azureTTSKey && !Config.voicevoxSpace) return false
  let wav
  const speaker = getUserSpeaker(await getUserReplySetting(e))
+  let ignoreEncode = getUin(e) === 88888
  try {
    if (Config.ttsMode === 'vits-uma-genshin-honkai' && Config.ttsSpace) {
      if (Config.autoJapanese) {
@ -883,7 +883,7 @@ export async function generateAudio (e, pendingText, speakingEmotion, emotionDeg
      }
      wav = await generateVitsAudio(pendingText, speaker, '中日混合（中文用[ZH][ZH]包裹起来，日文用[JA][JA]包裹起来）')
    } else if (Config.ttsMode === 'azure' && Config.azureTTSKey) {
-      return await generateAzureAudio(pendingText, speaker, speakingEmotion, emotionDegree)
+      return await generateAzureAudio(pendingText, speaker, speakingEmotion, emotionDegree, ignoreEncode)
    } else if (Config.ttsMode === 'voicevox' && Config.voicevoxSpace) {
      pendingText = (await translate(pendingText, '日')).replace('\n', '')
      wav = await VoiceVoxTTS.generateAudio(pendingText, {
@ -897,7 +897,7 @@ export async function generateAudio (e, pendingText, speakingEmotion, emotionDeg
  let sendable
  try {
    try {
-      sendable = await uploadRecord(wav, Config.ttsMode)
+      sendable = await uploadRecord(wav, Config.ttsMode, ignoreEncode)
      if (!sendable) {
        // 如果合成失败，尝试使用ffmpeg合成
        sendable = segment.record(wav)
@ -927,9 +927,10 @@ export async function generateAudio (e, pendingText, speakingEmotion, emotionDeg
 * @param role - 发言人
 * @param speakingEmotion - 发言人情绪
 * @param emotionDegree - 发言人情绪强度
+ * @param ignoreEncode - 不在客户端处理编码
 * @returns {Promise<{file: string, type: string}|boolean>}
 */
-export async function generateAzureAudio (pendingText, role = '随机', speakingEmotion, emotionDegree = 1) {
+export async function generateAzureAudio (pendingText, role = '随机', speakingEmotion, emotionDegree = 1, ignoreEncode = false) {
  if (!Config.azureTTSKey) return false
  let speaker
  try {
@ -970,11 +971,13 @@ export async function generateAzureAudio (pendingText, role = '随机', speaking
      pendingText,
      emotionDegree
    })
+    let record = await AzureTTS.generateAudio(pendingText, {
+      speaker
+    }, await ssml)
    return await uploadRecord(
-      await AzureTTS.generateAudio(pendingText, {
-        speaker
-      }, await ssml)
-      , Config.ttsMode
+      record
+      , Config.ttsMode,
+      ignoreEncode
    )
  } catch (err) {
    logger.error(err)
--- a/utils/uploadRecord.js
+++ b/utils/uploadRecord.js
@ -39,7 +39,7 @@ if (module) {
 // import { pcm2slk } from 'node-silk'
 let errors = {}

-async function uploadRecord (recordUrl, ttsMode = 'vits-uma-genshin-honkai') {
+async function uploadRecord (recordUrl, ttsMode = 'vits-uma-genshin-honkai', ignoreEncode = false) {
  let recordType = 'url'
  let tmpFile = ''
  if (ttsMode === 'azure') {
@ -48,6 +48,9 @@ async function uploadRecord (recordUrl, ttsMode = 'vits-uma-genshin-honkai') {
    recordType = 'buffer'
    tmpFile = `data/chatgpt/tts/tmp/${crypto.randomUUID()}.wav`
  }
+  if (ignoreEncode) {
+    return segment.record(recordUrl)
+  }
  let result
  if (pcm2slk) {
    result = await getPttBuffer(recordUrl, Bot.config.ffmpeg_path)