liumaolin committed on
Commit
b5b48f0
·
1 Parent(s): 8228973

Add new voice model "Ellen" to MoYoYo configuration

Browse files

- Include model details, inference parameters, and related files.
- Add reference audio and pretrained weights for TTS.

assets/models/tts/moyoyo/GPT_weights/ellen_best_gpt.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2de5d2cf0b2b888ee47978f3b2811e4678ca90cd08fd9e491768fd22d772e787
3
+ size 155312957
assets/models/tts/moyoyo/SoVITS_weights/ellen_best_sovits.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a5ceab180bb7f663ee9bfdb892323c8194a3dc01c02bd6742ffafb2f8279f01
3
+ size 85007202
assets/models/tts/moyoyo/ref_audios/ellen_ref.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:692552ea483214b0b08e66f6ff684696ecd9fc96da40ee6925415359bdff83d0
3
+ size 599084
src/voice_dialogue/services/audio/generators/configs/moyoyo.py CHANGED
@@ -276,6 +276,35 @@ MOYOYO_TTS_CONFIGS = [
276
  'seed': 233333,
277
  },
278
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
279
  ]
280
 
281
 
 
276
  'seed': 233333,
277
  },
278
  },
279
+ {
280
+ 'repository': 'MoYoYoTech/tone-models',
281
+ 'character_name': 'Ellen',
282
+ 'cover_image': '',
283
+ 'description': '美国脱口秀主持人Ellen DeGeneres的AI语音模型,具有其标志性的幽默风格和独特的表达方式,适合制作娱乐和创意内容。',
284
+ 'file_size': '241M',
285
+ 'is_chinese_voice': False,
286
+ 'model_files': {
287
+ **BASE_PRETRAINED_FILES,
288
+ 'gpt-weights': 'GPT_weights/ellen_best_gpt.ckpt',
289
+ 'sovits-weights': 'SoVITS_weights/ellen_best_sovits.pth',
290
+ 'reference_audio': 'ref_audios/ellen_ref.wav',
291
+ },
292
+ 'inference_parameters': {
293
+ 'text_lang': "en",
294
+ 'prompt_text': "It might serve you better to be a little less comfortable. But wherever you're listening to this book, please remember to turn off your cell phone and that the taking of flash photographs is strictly forbidden.",
295
+ 'prompt_lang': "en",
296
+ 'top_k': 5,
297
+ 'top_p': 1,
298
+ 'temperature': 1,
299
+ 'text_split_method': "cut4",
300
+ 'batch_size': 100,
301
+ 'speed_factor': 1.0,
302
+ 'split_bucket': True,
303
+ 'return_fragment': False,
304
+ 'fragment_interval': 0.07,
305
+ 'seed': 233333,
306
+ },
307
+ },
308
  ]
309
 
310