57 lines
1.4 KiB
YAML
57 lines
1.4 KiB
YAML
server:
|
|
port: 8080
|
|
read_timeout: 60
|
|
write_timeout: 60
|
|
base_path: ""
|
|
|
|
tts:
|
|
region: "eastasia"
|
|
default_voice: "zh-CN-XiaoxiaoNeural"
|
|
default_rate: "0"
|
|
default_pitch: "0"
|
|
default_format: "audio-24khz-48kbitrate-mono-mp3"
|
|
max_text_length: 65535
|
|
request_timeout: 30
|
|
max_concurrent: 20
|
|
segment_threshold: 300
|
|
min_sentence_length: 200
|
|
max_sentence_length: 300
|
|
api_key: ''
|
|
|
|
# OpenAI 到微软 TTS 中文语音的映射
|
|
voice_mapping:
|
|
alloy: "zh-CN-XiaoyiNeural" # 中性女声
|
|
echo: "zh-CN-YunxiNeural" # 年轻男声
|
|
fable: "zh-CN-XiaochenNeural" # 儿童声
|
|
onyx: "zh-CN-YunjianNeural" # 成熟男声
|
|
nova: "zh-CN-XiaohanNeural" # 活力女声
|
|
shimmer: "zh-CN-XiaomoNeural" # 温柔女声
|
|
openai:
|
|
api_key: ''
|
|
|
|
ssml:
|
|
preserve_tags:
|
|
- name: break
|
|
pattern: <break\s+[^>]*/>
|
|
- name: speak
|
|
pattern: <speak>|</speak>
|
|
- name: prosody
|
|
pattern: <prosody\s+[^>]*>|</prosody>
|
|
- name: emphasis
|
|
pattern: <emphasis\s+[^>]*>|</emphasis>
|
|
- name: voice
|
|
pattern: <voice\s+[^>]*>|</voice>
|
|
- name: say-as
|
|
pattern: <say-as\s+[^>]*>|</say-as>
|
|
- name: phoneme
|
|
pattern: <phoneme\s+[^>]*>|</phoneme>
|
|
- name: audio
|
|
pattern: <audio\s+[^>]*>|</audio>
|
|
- name: p
|
|
pattern: <p>|</p>
|
|
- name: s
|
|
pattern: <s>|</s>
|
|
- name: sub
|
|
pattern: <sub\s+[^>]*>|</sub>
|
|
- name: mstts
|
|
pattern: <mstts:[^>]*>|</mstts:[^>]*> |