primepake committed on
Commit
035ed05
·
1 Parent(s): 4a1f5f8

update structure

Browse files
Files changed (2) hide show
  1. README.md +4 -9
  2. speech/config.yaml +1 -1
README.md CHANGED
@@ -135,16 +135,11 @@ pip install -r requirements.txt
135
  ```
136
  minimax-speech/
137
  ├── assets/
138
- │ └── image.png
139
- ├── configs/
140
- │ └── dac_vae.yaml
141
- ├── models/
142
- │ ├── fsq/
143
- │ └── dac_vae/
144
- ├── cosyvoice/ # Components from CosyVoice2
145
  │ ├── flow/
146
- │ ├── transformer/
147
- │ └── utils/
148
  └── README.md
149
  ```
150
 
 
135
  ```
136
  minimax-speech/
137
  ├── assets/
138
+ ├── dac-vae/
139
+ ├── flowae/
140
+ ├── speech/
141
+ ├── llm/
 
 
 
142
  │ ├── flow/
 
 
143
  └── README.md
144
  ```
145
 
speech/config.yaml CHANGED
@@ -198,7 +198,7 @@ sort: !name:cosyvoice.dataset.processor.sort
198
  sort_size: 500 # sort_size should be less than shuffle_size
199
  batch: !name:cosyvoice.dataset.processor.batch
200
  batch_type: 'dynamic'
201
- max_frames_in_batch: 50000
202
  padding: !name:cosyvoice.dataset.processor.padding
203
  use_spk_embedding: False # change to True during sft
204
  use_speaker_encoder: !ref <use_speaker_encoder>
 
198
  sort_size: 500 # sort_size should be less than shuffle_size
199
  batch: !name:cosyvoice.dataset.processor.batch
200
  batch_type: 'dynamic'
201
+ max_frames_in_batch: 40000
202
  padding: !name:cosyvoice.dataset.processor.padding
203
  use_spk_embedding: False # change to True during sft
204
  use_speaker_encoder: !ref <use_speaker_encoder>