Update README.md
Browse files
README.md
CHANGED
|
@@ -67,7 +67,7 @@ pip install git+https://github.com/huggingface/parler-tts.git
|
|
| 67 |
## Utilisation
|
| 68 |
## Exemple de base
|
| 69 |
|
| 70 |
-
|
| 71 |
import torch
|
| 72 |
from parler_tts import ParlerTTSForConditionalGeneration
|
| 73 |
from transformers import AutoTokenizer
|
|
@@ -96,7 +96,7 @@ audio = model.generate(
|
|
| 96 |
|
| 97 |
# Sauvegarde
|
| 98 |
sf.write("output.wav", audio.cpu().numpy().squeeze(), model.config.sampling_rate)
|
| 99 |
-
|
| 100 |
<audio controls>
|
| 101 |
<source src="https://huggingface.co/spaces/CONCREE/Adia_TTS/resolve/main/snt.wav" type="audio/wav">
|
| 102 |
</audio>
|
|
@@ -104,7 +104,7 @@ sf.write("output.wav", audio.cpu().numpy().squeeze(), model.config.sampling_rate
|
|
| 104 |
## Configuration avancée
|
| 105 |
## Paramètres de génération
|
| 106 |
|
| 107 |
-
|
| 108 |
generation_config = {
|
| 109 |
"temperature": 0.8, # Contrôle la variabilité de la sortie
|
| 110 |
"max_new_tokens": 1000, # Longueur maximale de la séquence générée
|
|
@@ -118,7 +118,7 @@ audio = model.generate(
|
|
| 118 |
prompt_input_ids=prompt_ids,
|
| 119 |
**generation_config
|
| 120 |
)
|
| 121 |
-
|
| 122 |
|
| 123 |
<audio controls>
|
| 124 |
<source src="https://huggingface.co/spaces/CONCREE/Adia_TTS/resolve/main/avct.wav" type="audio/wav">
|
|
@@ -138,17 +138,17 @@ description = "A warm and natural voice, with a conversational flow"
|
|
| 138 |
|
| 139 |
2. ### Voix professionnelle
|
| 140 |
|
| 141 |
-
|
| 142 |
description = "A professional, clear and composed voice, perfect for formal presentations"
|
| 143 |
-
|
| 144 |
<audio controls>
|
| 145 |
<source src="https://huggingface.co/spaces/CONCREE/Adia_TTS/resolve/main/styl2.wav" type="audio/wav">
|
| 146 |
</audio>
|
| 147 |
|
| 148 |
3. ### Voix pour l'éducation
|
| 149 |
-
|
| 150 |
description = "A clear and educational voice, with a flow adapted to learning"
|
| 151 |
-
|
| 152 |
<audio controls>
|
| 153 |
<source src="https://huggingface.co/spaces/CONCREE/Adia_TTS/resolve/main/styl3.wav" type="audio/wav">
|
| 154 |
</audio>
|
|
@@ -161,7 +161,7 @@ description = "A clear and educational voice, with a flow adapted to learning"
|
|
| 161 |
* Temps de chargement initial du modèle relativement long
|
| 162 |
## Références
|
| 163 |
|
| 164 |
-
|
| 165 |
@misc{CONCREE-2024-Adia_TTS,
|
| 166 |
author = {CONCREE},
|
| 167 |
title = {Adia_TTS},
|
|
@@ -170,9 +170,9 @@ description = "A clear and educational voice, with a flow adapted to learning"
|
|
| 170 |
journal = {Hugging Face repository},
|
| 171 |
howpublished = {\url{https://huggingface.co/CONCREE/Adia_TTS}}
|
| 172 |
}
|
| 173 |
-
|
| 174 |
|
| 175 |
-
|
| 176 |
@misc{lyth2024natural,
|
| 177 |
title={Natural language guidance of high-fidelity text-to-speech with synthetic annotations},
|
| 178 |
author={Dan Lyth and Simon King},
|
|
|
|
| 67 |
## Utilisation
|
| 68 |
## Exemple de base
|
| 69 |
|
| 70 |
+
```py
|
| 71 |
import torch
|
| 72 |
from parler_tts import ParlerTTSForConditionalGeneration
|
| 73 |
from transformers import AutoTokenizer
|
|
|
|
| 96 |
|
| 97 |
# Sauvegarde
|
| 98 |
sf.write("output.wav", audio.cpu().numpy().squeeze(), model.config.sampling_rate)
|
| 99 |
+
```
|
| 100 |
<audio controls>
|
| 101 |
<source src="https://huggingface.co/spaces/CONCREE/Adia_TTS/resolve/main/snt.wav" type="audio/wav">
|
| 102 |
</audio>
|
|
|
|
| 104 |
## Configuration avancée
|
| 105 |
## Paramètres de génération
|
| 106 |
|
| 107 |
+
```py
|
| 108 |
generation_config = {
|
| 109 |
"temperature": 0.8, # Contrôle la variabilité de la sortie
|
| 110 |
"max_new_tokens": 1000, # Longueur maximale de la séquence générée
|
|
|
|
| 118 |
prompt_input_ids=prompt_ids,
|
| 119 |
**generation_config
|
| 120 |
)
|
| 121 |
+
```
|
| 122 |
|
| 123 |
<audio controls>
|
| 124 |
<source src="https://huggingface.co/spaces/CONCREE/Adia_TTS/resolve/main/avct.wav" type="audio/wav">
|
|
|
|
| 138 |
|
| 139 |
2. ### Voix professionnelle
|
| 140 |
|
| 141 |
+
```py
|
| 142 |
description = "A professional, clear and composed voice, perfect for formal presentations"
|
| 143 |
+
```
|
| 144 |
<audio controls>
|
| 145 |
<source src="https://huggingface.co/spaces/CONCREE/Adia_TTS/resolve/main/styl2.wav" type="audio/wav">
|
| 146 |
</audio>
|
| 147 |
|
| 148 |
3. ### Voix pour l'éducation
|
| 149 |
+
```py
|
| 150 |
description = "A clear and educational voice, with a flow adapted to learning"
|
| 151 |
+
```
|
| 152 |
<audio controls>
|
| 153 |
<source src="https://huggingface.co/spaces/CONCREE/Adia_TTS/resolve/main/styl3.wav" type="audio/wav">
|
| 154 |
</audio>
|
|
|
|
| 161 |
* Temps de chargement initial du modèle relativement long
|
| 162 |
## Références
|
| 163 |
|
| 164 |
+
```bibtex
|
| 165 |
@misc{CONCREE-2024-Adia_TTS,
|
| 166 |
author = {CONCREE},
|
| 167 |
title = {Adia_TTS},
|
|
|
|
| 170 |
journal = {Hugging Face repository},
|
| 171 |
howpublished = {\url{https://huggingface.co/CONCREE/Adia_TTS}}
|
| 172 |
}
|
| 173 |
+
```
|
| 174 |
|
| 175 |
+
```bibtex
|
| 176 |
@misc{lyth2024natural,
|
| 177 |
title={Natural language guidance of high-fidelity text-to-speech with synthetic annotations},
|
| 178 |
author={Dan Lyth and Simon King},
|