liumaolin committed on
Commit
7b003c4
·
1 Parent(s): d0c1c61

Add new voice model "Doubao" to MoYoYo configuration

Browse files

- Include model details, inference parameters, and related files.
- Add reference audio and pretrained weights for TTS.

assets/models/tts/moyoyo/GPT_weights/doubao_best_gpt.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2514e7b3e1eca3ad58ed18291f5b1d95c18d086320e23baead7a6ea4f6862fb
3
+ size 155312658
assets/models/tts/moyoyo/SoVITS_weights/doubao_best_sovits.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6206099d9d30e32065903775916dedaab89213e210930440288722259915b929
3
+ size 85007879
assets/models/tts/moyoyo/ref_audios/doubao_ref.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5c8581b8b7a857f5ecbdce36a558b12f7eefc36dbbc96e7cf7a99615627f6e6
3
+ size 844878
src/voice_dialogue/services/audio/generators/configs/moyoyo.py CHANGED
@@ -12,6 +12,35 @@ BASE_PRETRAINED_FILES = {
12
 
13
  # MoYoYo TTS配置列表
14
  MOYOYO_TTS_CONFIGS = [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
15
  {
16
  'repository': 'MoYoYoTech/tone-models',
17
  'character_name': 'Luo Xiang',
 
12
 
13
  # MoYoYo TTS配置列表
14
  MOYOYO_TTS_CONFIGS = [
15
+ {
16
+ 'repository': 'MoYoYoTech/tone-models',
17
+ 'character_name': 'Doubao',
18
+ 'cover_image': 'https://huggingface.co/MoYoYoTech/tone-models/resolve/main/cover/doubao.png',
19
+ 'description': '豆包是MoYoYo的虚拟助手,能陪你聊天解闷,不管是聊生活趣事,知识科普还是帮你出主意,我都在行哦。',
20
+ 'file_size': '240M',
21
+ 'is_chinese_voice': True,
22
+ 'model_files': {
23
+ **BASE_PRETRAINED_FILES,
24
+ 'gpt-weights': 'GPT_weights/doubao_best_gpt.ckpt',
25
+ 'sovits-weights': 'SoVITS_weights/doubao_best_sovits.pth',
26
+ 'reference_audio': 'ref_audios/doubao_ref.wav',
27
+ },
28
+ 'inference_parameters': {
29
+ 'text_lang': "zh",
30
+ 'prompt_text': "我叫豆包呀,能陪你聊天解闷,不管是聊生活趣事,知识科普还是帮你出主意,我都在行哦。",
31
+ 'prompt_lang': "zh",
32
+ 'top_k': 5,
33
+ 'top_p': 1,
34
+ 'temperature': 1,
35
+ 'text_split_method': "cut3",
36
+ 'batch_size': 100,
37
+ 'speed_factor': 1.1,
38
+ 'split_bucket': True,
39
+ 'return_fragment': False,
40
+ 'fragment_interval': 0.07,
41
+ 'seed': 233333,
42
+ },
43
+ },
44
  {
45
  'repository': 'MoYoYoTech/tone-models',
46
  'character_name': 'Luo Xiang',