为azure语音模式添加说话风格配置,支持vits语音模式中文回答转日语语音输出,添加翻译功能,支持指令切换语音模式,支持查看当前语音模式下的支持角色列表 (#404)

* feat: add support for ‘greeting’ and ‘global reply mode’ commands, improve variable naming and remove unnecessary backend output.

* feat: Add support for black and white lists, global reply mode and voice role settings, private chat switch, and active greeting configuration. Refactor some variable names and comment out redundant code for better readability and reduced backend output.

* feat: 为新功能完善了帮助面板

* docs: 完善了‘打招呼’的帮助说明

* Commit Type: feat, bugfix

Add functionality to view plugin command table, fix bug in blacklist/whitelist, and fix bug where chat mode can still be used in private messaging when disabled.

* Commit Type: feat, bugfix

Add functionality to view plugin command table, fix bug in blacklist/whitelist, and fix bug where chat mode can still be used in private messaging when disabled.

* refactor: Remove redundant log output.

* Refactor: optimize code logic

* Fix: 修复绘图指令表被抢指令的bug。

* Refactor:1. Add support for automatically translating replies to Japanese and generating voice messages in VITS voice mode (please monitor remaining quota after enabling). 2. Add translation function. 3. Add emotion configuration for Azure voice mode, allowing the robot to select appropriate emotional styles for replies.

* Refactor:Handle the issue of exceeding character setting limit caused by adding emotion configuration.

* Fix: fix bugs

* Refactor: Added error feedback to translation service

* Refactor: Added support for viewing the list of supported roles for each language mode, and fixed some bugs in the emotion switching feature of the auzre mode.

* Refactor: Optimized some command feedback and added owner restriction to chat record export function.

* Refactor: Optimized feedback when viewing role list to avoid excessive messages.

* Refactor: Optimized feedback when configuring multi-emotion mode.

* Feature: Added help instructions for translation feature.

* chore: Adjust help instructions for mood settings

* Fix: Fixed issue where only first line of multi-line replies were being read and Azure voice was pronouncing punctuation marks.

* Fix: Fixed bug where switching to Azure voice mode prompted for missing key and restricted ability to view voice role list to only when in voice mode.

---------

Co-authored-by: Sean <1519059137@qq.com>
Co-authored-by: ikechan8370 <geyinchibuaa@gmail.com>
This commit is contained in:
Sean Murphy 2023-05-04 22:55:49 +08:00 committed by GitHub
parent bb90c3c3e7
commit b687d45897
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
13 changed files with 1165 additions and 75 deletions

141
utils/baiduTranslate.js Normal file
View file

@ -0,0 +1,141 @@
import md5 from 'md5-node'
import axios from 'axios'
// noinspection NonAsciiCharacters
export const transMap = { : 'zh', : 'jp', : 'wyw', : 'en', : 'ru', : 'kr' }
const errOr = {
52001: '请求超时,请重试。',
52002: '系统错误,请重试。',
52003: '未授权用户请检查appid是否正确或者服务是否开通。',
54000: '必填参数为空,请检查是否少传参数。',
54001: '签名错误,请检查您的签名生成方法。',
54003: '访问频率受限,请降低您的调用频率,或进行身份认证后切换为高级版/尊享版。',
54004: '账户余额不足,请前往管理控制台为账户充值。',
54005: '长query请求频繁请降低长query的发送频率3s后再试。',
58000: '客户端IP非法检查个人资料里填写的IP地址是否正确可前往开发者信息-基本信息修改。',
58001: '译文语言方向不支持,检查译文语言是否在语言列表里。',
58002: '服务当前已关闭,请前往管理控制台开启服务。',
90107: '认证未通过或未生效,请前往我的认证查看认证进度。'
}
function Translate (config) {
this.requestNumber = 0 // 请求次数
this.config = {
showProgress: 1, // 是否显示进度
requestNumber: 1, // 最大请求次数
agreement: 'http', // 协议
...config
}
this.baiduApi = `${this.config.agreement}://api.fanyi.baidu.com/api/trans/vip/translate`
// 拼接url
this.createUrl = (domain, form) => {
let result = domain + '?'
for (let key in form) {
result += `${key}=${form[key]}&`
}
return result.slice(0, result.length - 1)
}
this.translate = async (value, ...params) => {
let result = ''
let from = 'auto'
let to = 'en'
if (params.length === 1) {
to = transMap[params[0]] || to
} else if (params.length === 2) {
from = transMap[params[0]] || from
to = transMap[params[1]] || to
}
if (typeof value === 'string') {
const res = await this.requestApi(value, { from, to })
result = res[0].dst
}
if (Array.isArray(value) || Object.prototype.toString.call(value) === '[object Object]') {
result = await this._createObjValue(value, { from, to })
}
return result
}
this.requestApi = (value, params) => {
if (this.requestNumber >= this.config.requestNumber) {
return new Promise((resolve) => {
setTimeout(() => {
this.requestApi(value, params).then((res) => {
resolve(res)
})
}, 1000)
})
}
this.requestNumber++
const { appid, secret } = this.config
const q = value
const salt = Math.random()
const sign = md5(`${appid}${q}${salt}${secret}`)
const fromData = {
q: encodeURIComponent(q),
sign,
appid,
salt,
from: params.from || 'auto',
to: params.to || 'en'
}
const fanyiApi = this.createUrl(this.baiduApi, fromData)
return new Promise((resolve, reject) => {
axios
.get(fanyiApi)
.then(({ data: res }) => {
if (!res.error_code) {
const resList = res.trans_result
resolve(resList)
} else {
const errCode = res.error_code
if (errOr[errCode]) {
reject(new Error('翻译出错了~' + errOr[errCode]))
} else {
reject(new Error('翻译出错了~' + errCode))
}
}
})
.finally(() => {
setTimeout(() => {
this.requestNumber--
}, 1000)
})
})
}
// 递归翻译数组或对象
this._createObjValue = async (value, parames) => {
let index = 0
const obj = Array.isArray(value) ? [] : {}
const strDatas = Array.isArray(value) ? value : Object.values(value)
const reqData = strDatas
.filter((item) => typeof item === 'string') // 过滤字符串
.join('\n')
const res = reqData ? await this.requestApi(reqData, parames) : []
for (let key in value) {
if (typeof value[key] === 'string') {
obj[key] = res[index].dst
index++
}
if (
Array.isArray(value[key]) ||
Object.prototype.toString.call(value[key]) === '[object Object]'
) {
obj[key] = await this.translate(value[key], parames) // 递归翻译
}
}
return obj
}
return this.translate
}
export default Translate

View file

@ -111,8 +111,12 @@ const defaultConfig = {
azureTTSSpeaker: 'zh-CN-XiaochenNeural',
voicevoxSpace: '',
voicevoxTTSSpeaker: '护士机器子T',
baiduTranslateAppId: '',
baiduTranslateSecret: '',
azureTTSEmotion: false,
enhanceAzureTTSEmotion: false,
autoJapanese: false,
version: 'v2.5.8'
}
const _path = process.cwd()
let config = {}

View file

@ -1,50 +1,110 @@
import crypto from 'crypto'
import { mkdirs } from '../common.js'
import { getDefaultReplySetting, mkdirs } from '../common.js'
import { Config } from '../config.js'
let sdk
try {
sdk = (await import('microsoft-cognitiveservices-speech-sdk')).default
} catch (err) {
logger.warn('未安装microsoft-cognitiveservices-speech-sdk无法使用微软Azure语音源')
}
async function generateAudio (text, option = {}) {
async function generateAudio (text, option = {}, ssml = '') {
if (!sdk) {
throw new Error('未安装microsoft-cognitiveservices-speech-sdk无法使用微软Azure语音源')
}
let subscriptionKey = Config.azureTTSKey
let serviceRegion = Config.azureTTSRegion
let speechConfig = sdk.SpeechConfig.fromSubscription(subscriptionKey, serviceRegion)
const _path = process.cwd()
mkdirs(`${_path}/data/chatgpt/tts/azure`)
let filename = `${_path}/data/chatgpt/tts/azure/${crypto.randomUUID()}.wav`
let audioConfig = sdk.AudioConfig.fromAudioFileOutput(filename)
let speechConfig = sdk.SpeechConfig.fromSubscription(subscriptionKey, serviceRegion)
// speechConfig.speechSynthesisLanguage = option?.language || 'zh-CN'
logger.info('using speaker: ' + option?.speaker || 'zh-CN-YunyeNeural')
speechConfig.speechSynthesisVoiceName = option?.speaker || 'zh-CN-YunyeNeural'
let synthesizer = new sdk.SpeechSynthesizer(speechConfig, audioConfig)
let synthesizer
if (ssml) {
synthesizer = new sdk.SpeechSynthesizer(speechConfig, audioConfig)
await speakSsmlAsync(synthesizer, ssml)
} else {
speechConfig.speechSynthesisLanguage = option?.language || 'zh-CN'
logger.info('using speaker: ' + option?.speaker || 'zh-CN-YunyeNeural')
speechConfig.speechSynthesisVoiceName = option?.speaker || 'zh-CN-YunyeNeural'
synthesizer = new sdk.SpeechSynthesizer(speechConfig, audioConfig)
await speakTextAsync(synthesizer, text)
}
console.log('synthesis finished.')
synthesizer.close()
synthesizer = undefined
return filename
}
async function speakTextAsync (synthesizer, text) {
return new Promise((resolve, reject) => {
synthesizer.speakTextAsync(text, result => {
if (result.reason === sdk.ResultReason.SynthesizingAudioCompleted) {
console.log('synthesis finished.')
logger.info('speakTextAsync: true')
resolve()
} else {
console.error('Speech synthesis canceled, ' + result.errorDetails +
'\nDid you update the subscription info?')
reject(result.errorDetails)
}
synthesizer.close()
synthesizer = undefined
resolve(filename)
}, err => {
console.error('err - ' + err)
synthesizer.close()
synthesizer = undefined
reject(err)
})
})
}
const supportConfigurations = [
async function speakSsmlAsync (synthesizer, ssml) {
return new Promise((resolve, reject) => {
synthesizer.speakSsmlAsync(ssml, result => {
if (result.reason === sdk.ResultReason.SynthesizingAudioCompleted) {
logger.info('speakSsmlAsync: true')
resolve()
} else {
console.error('Speech synthesis canceled, ' + result.errorDetails +
'\nDid you update the subscription info?')
reject(result.errorDetails)
}
}, err => {
console.error('err - ' + err)
reject(err)
})
})
}
async function generateSsml (text, option = {}) {
const voiceName = option.speaker || 'zh-CN-YunyeNeural'
const expressAs = option.emotion ? `<mstts:express-as style="${option.emotion}" styledegree="${option.emotionDegree || 1}">` : ''
return `<speak version="1.0" xmlns="http://www.w3.org/2001/10/synthesis"
xmlns:mstts="https://www.w3.org/2001/mstts" xml:lang="zh-CN">
<voice name="${voiceName}">
${expressAs}${text}${expressAs ? '</mstts:express-as>' : ''}
</voice>
</speak>`
}
async function getEmotionPrompt (e) {
if (!Config.azureTTSEmotion) return ''
let userReplySetting = await redis.get(`CHATGPT:USER:${e.sender.user_id}`)
userReplySetting = !userReplySetting
? getDefaultReplySetting()
: JSON.parse(userReplySetting)
let emotionPrompt = ''
let ttsRoleAzure = userReplySetting.ttsRoleAzure
const configuration = Config.ttsMode === 'azure' ? supportConfigurations.find(config => config.code === ttsRoleAzure) : ''
if (configuration !== '' && configuration.emotion) {
// 0-1 感觉没啥区别说实话只有1和2听得出差别。。
emotionPrompt = `\n在回复的最开始使用[]在其中表示你这次回复的情绪风格和程度(1-2)最小单位0.1
\n例如['angry',2]表示你极度愤怒
\n这是情绪参考值禁止使用给出范围以外的词且单次回复只需要给出一个情绪表示
\n${JSON.stringify(configuration.emotion)}
\n另外不要在情绪[]前后使用回车换行如果你明白上面的设定请回复好的我明白了并在后续的对话中严格执行此设定`
// logger.warn('emotionPrompt:', `${JSON.stringify(configuration.emotion)}`)
} else {
return ''
}
return emotionPrompt
}
export const supportConfigurations = [
{
code: 'zh-CN-liaoning-XiaobeiNeural',
name: '晓北',
@ -78,35 +138,86 @@ const supportConfigurations = [
name: '晓晓',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '女'
gender: '女',
emotion: {
affectionate: '温暖、亲切的语气',
angry: '生气和厌恶的语气',
assistant: '数字助理用的是热情而轻松的语气',
calm: '沉着冷静的态度说话。语气、音调和韵律统一',
chat: '表达轻松随意的语气',
cheerful: '表达积极愉快的语气',
customerservice: '以友好热情的语气为客户提供支持',
disgruntled: '轻蔑、抱怨的语气,表现不悦和蔑视',
excited: '乐观、充满希望的语气,发生了美好的事情',
fearful: '恐惧、紧张的语气,说话人处于紧张和不安的状态',
friendly: '愉快、怡人、温暖、真诚、关切的语气',
gentle: '温和、礼貌、愉快的语气,音调和音量较低',
lyrical: '以优美又带感伤的方式表达情感',
newscast: '以正式专业的语气叙述新闻',
'poetry-reading': '读诗时带情感和节奏的语气',
sad: '表达悲伤语气',
serious: '严肃、命令的语气'
}
},
{
code: 'zh-CN-YunxiNeural',
name: '云希',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '男'
languageDetail: '中文 (普通话,简体)',
gender: '男',
emotion: {
angry: '表达生气和愤怒的语气',
assistant: '数字助理使用热情而轻松的语气',
chat: '表达轻松随意的语气',
cheerful: '表达积极愉快的语气',
depressed: '表达沮丧、消沉的语气',
disgruntled: '表达不满、不悦的语气',
embarrassed: '表达尴尬、难为情的语气',
fearful: '表达害怕、恐惧的语气',
'narration-relaxed': '以轻松、自然的语气叙述',
newscast: '用于新闻播报,表现出庄重、严谨的语气',
sad: '表达悲伤、失落的语气',
serious: '表现出认真、严肃的语气'
}
},
{
code: 'zh-CN-YunyangNeural',
name: '云扬',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '男'
languageDetail: '中文 (普通话,简体)',
gender: '男',
emotion: {
customerservice: '以亲切友好的语气为客户提供支持',
'narration-professional': '以专业、稳重的语气讲述',
'newscast-casual': '以轻松自然的语气播报新闻'
}
},
{
code: 'zh-CN-YunyeNeural',
name: '云野',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '男'
gender: '男',
emotion: {
angry: '表达愤怒和不满的语气',
calm: '以冷静的态度说话,不带过多情绪',
cheerful: '表达快乐和积极的语气',
disgruntled: '表达不满和不满足的语气',
embarrassed: '表达不自在或难堪的语气',
fearful: '表达害怕和不安的语气',
sad: '表达悲伤和失落的语气',
serious: '以认真和严肃的态度说话'
}
},
{
code: 'zh-CN-XiaoshuangNeural',
name: '晓双',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '女'
gender: '女',
emotion: {
chat: '表达轻松随意的语气'
}
},
{
code: 'zh-CN-XiaoyouNeural',
@ -141,56 +252,126 @@ const supportConfigurations = [
name: '晓墨',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '女'
gender: '女',
emotion: {
affectionate: '温暖、亲切的语气',
angry: '生气和厌恶的语气',
calm: '沉着冷静的态度说话。语气、音调和韵律统一',
cheerful: '表达积极愉快的语气',
depressed: '调低音调和音量来表达忧郁、沮丧的语气',
disgruntled: '轻蔑、抱怨的语气,表现不悦和蔑视',
embarrassed: '在说话者感到不舒适时表达不确定、犹豫的语气',
envious: '当你渴望别人拥有的东西时,表达一种钦佩的语气',
fearful: '恐惧、紧张的语气,说话人处于紧张和不安的状态',
gentle: '温和、礼貌、愉快的语气,音调和音量较低',
sad: '表达悲伤语气',
serious: '严肃、命令的语气'
}
},
{
code: 'zh-CN-XiaoxuanNeural',
name: '晓萱',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '女'
gender: '女',
emotion: {
angry: '生气和厌恶的语气',
calm: '沉着冷静的态度说话。语气、音调和韵律统一',
cheerful: '表达积极愉快的语气',
depressed: '调低音调和音量来表达忧郁、沮丧的语气',
disgruntled: '轻蔑、抱怨的语气,表现不悦和蔑视',
fearful: '恐惧、紧张的语气,说话人处于紧张和不安的状态',
gentle: '温和、礼貌、愉快的语气,音调和音量较低',
serious: '严肃、命令的语气'
}
},
{
code: 'zh-CN-XiaohanNeural',
name: '晓涵',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '女'
gender: '女',
emotion: {
affectionate: '温暖、亲切的语气',
angry: '生气和厌恶的语气',
calm: '沉着冷静的态度说话。语气、音调和韵律统一',
cheerful: '表达积极愉快的语气',
disgruntled: '轻蔑、抱怨的语气,表现不悦和蔑视',
embarrassed: '在说话者感到不舒适时表达不确定、犹豫的语气',
fearful: '恐惧、紧张的语气,说话人处于紧张和不安的状态',
gentle: '温和、礼貌、愉快的语气,音调和音量较低',
sad: '表达悲伤语气',
serious: '严肃、命令的语气'
}
},
{
code: 'zh-CN-XiaoruiNeural',
name: '晓睿',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '女'
gender: '女',
emotion: {
angry: '生气和厌恶的语气',
calm: '沉着冷静的态度说话。语气、音调和韵律统一',
fearful: '恐惧、紧张的语气,说话人处于紧张和不安的状态',
sad: '表达悲伤语气'
}
},
{
code: 'zh-CN-XiaomengNeural',
name: '晓梦',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '女'
gender: '女',
emotion: {
chat: '表达轻松随意的语气'
}
},
{
code: 'zh-CN-XiaoyiNeural',
name: '晓伊',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '女'
gender: '女',
emotion: {
angry: '生气和厌恶的语气',
affectionate: '温暖、亲切的语气',
cheerful: '表达积极愉快的语气',
gentle: '温和、礼貌、愉快的语气,音调和音量较低',
sad: '表达悲伤语气',
serious: '严肃、命令的语气'
}
},
{
code: 'zh-CN-XiaozhenNeural',
name: '晓甄',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '女'
gender: '女',
emotion: {
angry: '生气和厌恶的语气',
cheerful: '表达积极愉快的语气',
disgruntled: '轻蔑、抱怨的语气,表现不悦和蔑视',
fearful: '恐惧、紧张的语气,说话人处于紧张和不安的状态',
sad: '表达悲伤语气',
serious: '严肃、命令的语气'
}
},
{
code: 'zh-CN-YunfengNeural',
name: '云枫',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '男'
gender: '男',
emotion: {
angry: '生气和厌恶的语气',
cheerful: '表达积极愉快的语气',
depressed: '调低音调和音量来表达忧郁、沮丧的语气',
disgruntled: '轻蔑、抱怨的语气,表现不悦和蔑视',
fearful: '恐惧、紧张的语气,说话人处于紧张和不安的状态',
sad: '表达悲伤语气',
serious: '严肃、命令的语气'
}
},
{
code: 'zh-CN-YunhaoNeural',
@ -204,21 +385,44 @@ const supportConfigurations = [
name: '云健',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '男'
gender: '男',
emotion: {
'narration-relaxed': '以轻松、自然的语气进行叙述',
'sports-commentary': '在解说体育比赛时,使用专业而自信的语气',
'sports-commentary-excited': '在解说激动人心的体育比赛时,使用兴奋和激动的语气'
}
},
{
code: 'zh-CN-YunxiaNeural',
name: '云夏',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '男'
languageDetail: '中文 (普通话,简体)',
gender: '男',
emotion: {
angry: '生气和厌恶的语气',
calm: '沉着冷静的态度说话。语气、音调和韵律统一',
cheerful: '表达积极愉快的语气',
fearful: '表达害怕、紧张的语气',
sad: '表达悲伤和失落的语气'
}
},
{
code: 'zh-CN-YunzeNeural',
name: '云泽',
language: 'zh-CN',
languageDetail: '中文(普通话,简体)',
gender: '男'
languageDetail: '中文 (普通话,简体)',
gender: '男',
emotion: {
angry: '用愤怒的语气表达强烈的不满和愤怒',
calm: '以冷静、沉着的语气说话,表现出稳重、深思熟虑的态度',
cheerful: '表达愉快和轻松的情绪',
depressed: '用沉闷、低落的语气表达消极、悲伤的情绪',
disgruntled: '表达不满和不高兴的情绪',
'documentary-narration': '用一种客观、中立的语气讲述事实和事件',
fearful: '表达害怕、不安的情绪',
sad: '用悲伤的语气表达悲伤和失落',
serious: '以严肃的语气和态度表现出对事情的重视和认真对待'
}
},
{
code: 'zh-HK-HiuGaaiNeural',
@ -240,7 +444,480 @@ const supportConfigurations = [
language: 'zh-CN',
languageDetail: '中文(粤语,繁体)',
gender: '男'
},
{
code: 'en-GB-AbbiNeural',
name: 'Abbi',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'female'
},
{
code: 'en-GB-AlfieNeural',
name: 'Alfie',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'male'
},
{
code: 'en-GB-BellaNeural',
name: 'Bella',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'female'
},
{
code: 'en-GB-ElliotNeural',
name: 'Elliot',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'male'
},
{
code: 'en-GB-EthanNeural',
name: 'Ethan',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'male'
},
{
code: 'en-GB-HollieNeural',
name: 'Hollie',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'female'
},
{
code: 'en-GB-LibbyNeural',
name: 'Libby',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'female'
},
{
code: 'en-GB-MaisieNeural',
name: 'Maisie',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'female'
},
{
code: 'en-GB-NoahNeural',
name: 'Noah',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'male'
},
{
code: 'en-GB-OliverNeural',
name: 'Oliver',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'male'
},
{
code: 'en-GB-OliviaNeural',
name: 'Olivia',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'female'
},
{
code: 'en-GB-RyanNeural',
name: 'Ryan',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'male',
emotion: {
chat: '表达轻松随意的语气',
cheerful: '表达积极愉快的语气'
}
},
{
code: 'en-GB-SoniaNeural',
name: 'Sonia',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'female',
emotion: {
cheerful: '表达积极愉快的语气',
sad: '表达悲伤语气'
}
},
{
code: 'en-GB-ThomasNeural',
name: 'Thomas',
language: 'en-GB',
languageDetail: '英语(英国)',
gender: 'male'
},
{
code: 'ja-JP-AoiNeural',
name: '葵',
language: 'ja-JP',
languageDetail: '日语(日本)',
gender: '女'
},
{
code: 'ja-JP-DaichiNeural',
name: '大地',
language: 'ja-JP',
languageDetail: '日语(日本)',
gender: '男'
},
{
code: 'ja-JP-KeitaNeural',
name: '慶太',
language: 'ja-JP',
languageDetail: '日语(日本)',
gender: '男'
},
{
code: 'ja-JP-MayuNeural',
name: '真由',
language: 'ja-JP',
languageDetail: '日语(日本)',
gender: '女'
},
{
code: 'ja-JP-NanamiNeural',
name: '七海',
language: 'ja-JP',
languageDetail: '日语(日本)',
gender: '女',
emotion: {
chat: '表达轻松随意的语气',
cheerful: '表达积极愉快的语气',
customerservice: '以友好热情的语气为客户提供支持'
}
},
{
code: 'ja-JP-NaokiNeural',
name: '直樹',
language: 'ja-JP',
languageDetail: '日语(日本)',
gender: '男'
},
{
code: 'ja-JP-ShioriNeural',
name: '栞',
language: 'ja-JP',
languageDetail: '日语(日本)',
gender: '女'
},
{
code: 'en-US-AIGenerate1Neural1',
name: 'AI Generate 1',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '男'
},
{
code: 'en-US-AIGenerate2Neural1',
name: 'AI Generate 2',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '女'
},
{
code: 'en-US-AmberNeural',
name: 'Amber',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '女'
},
{
code: 'en-US-AnaNeural',
name: 'Ana',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '女性、儿童'
},
{
code: 'en-US-AriaNeural',
name: 'Aria',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '女',
emotion: {
angry: '生气和厌恶的语气',
cheerful: '表达积极愉快的语气',
excited: '乐观、充满希望的语气,发生了美好的事情',
friendly: '愉快、怡人、温暖、真诚、关切的语气',
hopeful: '温暖且渴望的语气。像是会有好事发生',
sad: '表达悲伤语气',
shouting: '就像从遥远的地方说话或在外面说话',
terrified: '非常害怕的语气,语速快且声音颤抖。不稳定的疯狂状态',
unfriendly: '表达一种冷淡无情的语气',
whispering: '说话非常柔和,发出的声音小且温柔',
chat: '表达轻松随意的语气',
customerservice: '以友好热情的语气为客户提供支持',
empathetic: '表达关心和理解',
'narration-professional': '以专业、客观的语气朗读内容',
'newscast-casual': '以通用、随意的语气发布一般新闻',
'newscast-formal': '以正式、自信和权威的语气发布新闻'
}
},
{
code: 'en-US-AshleyNeural',
name: 'Ashley',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '女'
},
{
code: 'en-US-BrandonNeural',
name: 'Brandon',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '男'
},
{
code: 'en-US-ChristopherNeural',
name: 'Christopher',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '男'
},
{
code: 'en-US-CoraNeural',
name: 'Cora',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '女'
},
{
code: 'en-US-DavisNeural',
name: 'Davis',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '男',
emotion: {
angry: '生气和厌恶的语气',
cheerful: '表达积极愉快的语气',
excited: '乐观、充满希望的语气,发生了美好的事情',
friendly: '愉快、怡人、温暖、真诚、关切的语气',
hopeful: '温暖且渴望的语气。像是会有好事发生',
sad: '表达悲伤语气',
shouting: '就像从遥远的地方说话或在外面说话',
terrified: '非常害怕的语气,语速快且声音颤抖。不稳定的疯狂状态',
unfriendly: '表达一种冷淡无情的语气',
whispering: '说话非常柔和,发出的声音小且温柔'
}
},
{
code: 'en-US-ElizabethNeural',
name: 'Elizabeth',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '女'
},
{
code: 'en-US-EricNeural',
name: 'Eric',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '男'
},
{
code: 'en-US-GuyNeural',
name: 'Guy',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '男',
emotion: {
angry: '生气和厌恶的语气',
cheerful: '表达积极愉快的语气',
excited: '乐观、充满希望的语气,发生了美好的事情',
friendly: '愉快、怡人、温暖、真诚、关切的语气',
hopeful: '温暖且渴望的语气。像是会有好事发生',
sad: '表达悲伤语气',
shouting: '就像从遥远的地方说话或在外面说话',
terrified: '非常害怕的语气,语速快且声音颤抖。不稳定的疯狂状态',
unfriendly: '表达一种冷淡无情的语气',
whispering: '说话非常柔和,发出的声音小且温柔',
newscast: '以正式专业的语气叙述新闻'
}
},
{
code: 'en-US-JacobNeural',
name: 'Jacob',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '男'
},
{
code: 'en-US-JaneNeural',
name: 'Jane',
language: 'en-US',
languageDetail: 'English (United States)',
gender: '女',
emotion: {
angry: '生气和厌恶的语气',
cheerful: '表达积极愉快的语气',
excited: '乐观、充满希望的语气,发生了美好的事情',
friendly: '愉快、怡人、温暖、真诚、关切的语气',
hopeful: '温暖且渴望的语气。像是会有好事发生',
sad: '表达悲伤语气',
shouting: '就像从遥远的地方说话或在外面说话',
terrified: '非常害怕的语气,语速快且声音颤抖。不稳定的疯狂状态',
unfriendly: '表达一种冷淡无情的语气',
whispering: '说话非常柔和,发出的声音小且温柔'
}
},
{
code: 'en-US-JasonNeural',
name: 'Jason',
language: 'en-US',
languageDetail: '英语(美国)',
gender: 'male',
emotion: {
angry: '生气和厌恶的语气',
cheerful: '表达积极愉快的语气',
excited: '乐观、充满希望的语气,发生了美好的事情',
friendly: '愉快、怡人、温暖、真诚、关切的语气',
hopeful: '温暖且渴望的语气。像是会有好事发生',
sad: '表达悲伤语气',
shouting: '就像从遥远的地方说话或在外面说话',
terrified: '非常害怕的语气,语速快且声音颤抖。不稳定的疯狂状态',
unfriendly: '表达一种冷淡无情的语气',
whispering: '说话非常柔和,发出的声音小且温柔'
}
},
{
code: 'en-US-JennyMultilingualNeural3',
name: 'Jenny',
language: 'en-US',
languageDetail: '英语(美国)',
gender: 'female'
},
{
code: 'en-US-JennyNeural',
name: 'Jenny',
language: 'en-US',
languageDetail: '英语(美国)',
gender: 'female',
emotion: {
angry: '生气和厌恶的语气',
cheerful: '表达积极愉快的语气',
excited: '乐观、充满希望的语气,发生了美好的事情',
friendly: '愉快、怡人、温暖、真诚、关切的语气',
hopeful: '温暖且渴望的语气。像是会有好事发生',
sad: '表达悲伤语气',
shouting: '就像从遥远的地方说话或在外面说话',
terrified: '非常害怕的语气,语速快且声音颤抖。不稳定的疯狂状态',
unfriendly: '表达一种冷淡无情的语气',
whispering: '说话非常柔和,发出的声音小且温柔',
assistant: '数字助理用的是热情而轻松的语气',
chat: '表达轻松随意的语气',
customerservice: '以友好热情的语气为客户提供支持',
newscast: '以正式专业的语气叙述新闻'
}
},
{
code: 'en-US-MichelleNeural',
name: 'Michelle',
language: 'en-US',
languageDetail: '英语(美国)',
gender: 'female'
},
{
code: 'en-US-MonicaNeural',
name: 'Monica',
language: 'en-US',
languageDetail: '英语(美国)',
gender: 'female'
},
{
code: 'en-US-NancyNeural',
name: 'Nancy',
language: 'en-US',
languageDetail: '英语(美国)',
gender: 'female',
emotion: {
angry: '生气和厌恶的语气',
cheerful: '表达积极愉快的语气',
excited: '乐观、充满希望的语气,发生了美好的事情',
friendly: '愉快、怡人、温暖、真诚、关切的语气',
hopeful: '温暖且渴望的语气。像是会有好事发生',
sad: '表达悲伤语气',
shouting: '就像从遥远的地方说话或在外面说话',
terrified: '非常害怕的语气,语速快且声音颤抖。不稳定的疯狂状态',
unfriendly: '表达一种冷淡无情的语气',
whispering: '说话非常柔和,发出的声音小且温柔'
}
},
{
code: 'en-US-RogerNeural',
name: 'Roger',
language: 'en-US',
languageDetail: '英语(美国)',
gender: 'male'
},
{
code: 'en-US-SaraNeural',
name: 'Sara',
language: 'en-US',
languageDetail: '英语(美国)',
gender: 'female',
emotion: {
angry: '生气和厌恶的语气',
cheerful: '表达积极愉快的语气',
excited: '乐观、充满希望的语气,发生了美好的事情',
friendly: '愉快、怡人、温暖、真诚、关切的语气',
hopeful: '温暖且渴望的语气。像是会有好事发生',
sad: '表达悲伤语气',
shouting: '就像从遥远的地方说话或在外面说话',
terrified: '非常害怕的语气,语速快且声音颤抖。不稳定的疯狂状态',
unfriendly: '表达一种冷淡无情的语气',
whispering: '说话非常柔和,发出的声音小且温柔'
}
},
{
code: 'en-US-SteffanNeural',
name: 'Steffan',
language: 'en-US',
languageDetail: '英语(美国)',
gender: 'male'
},
{
code: 'en-US-TonyNeural',
name: 'Tony',
language: 'en-US',
languageDetail: '英语(美国)',
gender: 'male',
emotion: {
angry: '生气和厌恶的语气',
cheerful: '表达积极愉快的语气',
excited: '乐观、充满希望的语气,发生了美好的事情',
friendly: '愉快、怡人、温暖、真诚、关切的语气',
hopeful: '温暖且渴望的语气。像是会有好事发生',
sad: '表达悲伤语气',
shouting: '就像从遥远的地方说话或在外面说话',
terrified: '非常害怕的语气,语速快且声音颤抖。不稳定的疯狂状态',
unfriendly: '表达一种冷淡无情的语气',
whispering: '说话非常柔和,发出的声音小且温柔'
}
},
{
code: 'en-IN-NeerjaNeural',
name: 'Neerja',
language: 'en',
languageDetail: '英语(印度)',
gender: 'female'
},
{
code: 'en-IN-PrabhatNeural',
name: 'Prabhat',
language: 'en',
languageDetail: '英语(印度)',
gender: 'male'
}
]
export default { generateAudio, supportConfigurations }
export default { generateAudio, generateSsml, getEmotionPrompt, supportConfigurations }

View file

@ -73,7 +73,7 @@ async function generateAudio (text, options = {}) {
return Buffer.from(synthesisResponseData)
}
const supportConfigurations = [
export const supportConfigurations = [
{
supported_features: { permitted_synthesis_morphing: 'SELF_ONLY' },
name: '四国めたん',

View file

@ -8,7 +8,8 @@ import stream from 'stream'
import crypto from 'crypto'
import child_process from 'child_process'
import { Config } from './config.js'
import {mkdirs} from "./common.js";
import path from 'path'
import { mkdirs } from './common.js'
let module
try {
module = await import('oicq')
@ -248,9 +249,14 @@ async function getPttBuffer (file, ffmpeg = 'ffmpeg') {
}
async function audioTrans (file, ffmpeg = 'ffmpeg') {
const tmpfile = path.join(TMP_DIR, uuid())
const cmd = IS_WIN
? `${ffmpeg} -i "${file}" -f s16le -ac 1 -ar 24000 "${tmpfile}"`
: `exec ${ffmpeg} -i "${file}" -f s16le -ac 1 -ar 24000 "${tmpfile}"`
return new Promise((resolve, reject) => {
const tmpfile = TMP_DIR + '/' + (0, uuid)();
(0, child_process.exec)(`${ffmpeg} -i "${file}" -f s16le -ac 1 -ar 24000 "${tmpfile}"`, async (error, stdout, stderr) => {
// 隐藏windows下调用ffmpeg的cmd弹窗
const options = IS_WIN ? { windowsHide: true, stdio: 'ignore' } : {}
child_process.exec(cmd, options, async (error, stdout, stderr) => {
try {
resolve(pcm2slk(fs.readFileSync(tmpfile)))
} catch {