liumaolin
committed on
Commit
·
b5b48f0
1
Parent(s):
8228973
Add new voice model "Ellen" to MoYoYo configuration
Browse files
- Include model details, inference parameters, and related files.
- Add reference audio and pretrained weights for TTS.
assets/models/tts/moyoyo/GPT_weights/ellen_best_gpt.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2de5d2cf0b2b888ee47978f3b2811e4678ca90cd08fd9e491768fd22d772e787
|
| 3 |
+
size 155312957
|
assets/models/tts/moyoyo/SoVITS_weights/ellen_best_sovits.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a5ceab180bb7f663ee9bfdb892323c8194a3dc01c02bd6742ffafb2f8279f01
|
| 3 |
+
size 85007202
|
assets/models/tts/moyoyo/ref_audios/ellen_ref.wav
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:692552ea483214b0b08e66f6ff684696ecd9fc96da40ee6925415359bdff83d0
|
| 3 |
+
size 599084
|
src/voice_dialogue/services/audio/generators/configs/moyoyo.py
CHANGED
|
@@ -276,6 +276,35 @@ MOYOYO_TTS_CONFIGS = [
|
|
| 276 |
'seed': 233333,
|
| 277 |
},
|
| 278 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 279 |
]
|
| 280 |
|
| 281 |
|
|
|
|
| 276 |
'seed': 233333,
|
| 277 |
},
|
| 278 |
},
|
| 279 |
+
{
|
| 280 |
+
'repository': 'MoYoYoTech/tone-models',
|
| 281 |
+
'character_name': 'Ellen',
|
| 282 |
+
'cover_image': '',
|
| 283 |
+
'description': '美国脱口秀主持人Ellen DeGeneres的AI语音模型,具有其标志性的幽默风格和独特的表达方式,适合制作娱乐和创意内容。',
|
| 284 |
+
'file_size': '241M',
|
| 285 |
+
'is_chinese_voice': False,
|
| 286 |
+
'model_files': {
|
| 287 |
+
**BASE_PRETRAINED_FILES,
|
| 288 |
+
'gpt-weights': 'GPT_weights/ellen_best_gpt.ckpt',
|
| 289 |
+
'sovits-weights': 'SoVITS_weights/ellen_best_sovits.pth',
|
| 290 |
+
'reference_audio': 'ref_audios/ellen_ref.wav',
|
| 291 |
+
},
|
| 292 |
+
'inference_parameters': {
|
| 293 |
+
'text_lang': "en",
|
| 294 |
+
'prompt_text': "It might serve you better to be a little less comfortable. But wherever you're listening to this book, please remember to turn off your cell phone and that the taking of flash photographs is strictly forbidden.",
|
| 295 |
+
'prompt_lang': "en",
|
| 296 |
+
'top_k': 5,
|
| 297 |
+
'top_p': 1,
|
| 298 |
+
'temperature': 1,
|
| 299 |
+
'text_split_method': "cut4",
|
| 300 |
+
'batch_size': 100,
|
| 301 |
+
'speed_factor': 1.0,
|
| 302 |
+
'split_bucket': True,
|
| 303 |
+
'return_fragment': False,
|
| 304 |
+
'fragment_interval': 0.07,
|
| 305 |
+
'seed': 233333,
|
| 306 |
+
},
|
| 307 |
+
},
|
| 308 |
]
|
| 309 |
|
| 310 |
|