Update README.md
Browse files
README.md
CHANGED
|
@@ -79,18 +79,24 @@ installs
|
|
| 79 |
|
| 80 |
inference
|
| 81 |
```python
|
| 82 |
-
|
| 83 |
from transformers import pipeline
|
| 84 |
from datasets import load_dataset
|
| 85 |
import soundfile as sf
|
|
|
|
|
|
|
| 86 |
|
| 87 |
synthesiser = pipeline("text-to-speech", "umarigan/speecht5_tts_tr_v1.0")
|
| 88 |
|
| 89 |
-
embeddings_dataset = load_dataset("umarigan/turkish_voice_dataset_embedded", split="train
|
| 90 |
speaker_embedding = torch.tensor(embeddings_dataset[736]["speaker_embeddings"]).unsqueeze(0)
|
| 91 |
-
|
|
|
|
| 92 |
speech = synthesiser("Bir berber bir berbere gel beraber bir berber kuralım demiş", forward_params={"speaker_embeddings": speaker_embedding})
|
| 93 |
|
|
|
|
| 94 |
sf.write("speech.wav", speech["audio"], samplerate=speech["sampling_rate"])
|
| 95 |
|
|
|
|
|
|
|
|
|
|
| 96 |
```
|
|
|
|
| 79 |
|
| 80 |
inference
|
| 81 |
```python
|
|
|
|
| 82 |
from transformers import pipeline
|
| 83 |
from datasets import load_dataset
|
| 84 |
import soundfile as sf
|
| 85 |
+
import torch
|
| 86 |
+
from IPython.display import Audio
|
| 87 |
|
| 88 |
synthesiser = pipeline("text-to-speech", "umarigan/speecht5_tts_tr_v1.0")
|
| 89 |
|
| 90 |
+
embeddings_dataset = load_dataset("umarigan/turkish_voice_dataset_embedded", split="train")
|
| 91 |
speaker_embedding = torch.tensor(embeddings_dataset[736]["speaker_embeddings"]).unsqueeze(0)
|
| 92 |
+
|
| 93 |
+
# Synthesize speech using the embedding
|
| 94 |
speech = synthesiser("Bir berber bir berbere gel beraber bir berber kuralım demiş", forward_params={"speaker_embeddings": speaker_embedding})
|
| 95 |
|
| 96 |
+
# Save the generated audio to a file
|
| 97 |
sf.write("speech.wav", speech["audio"], samplerate=speech["sampling_rate"])
|
| 98 |
|
| 99 |
+
# Play the audio in the notebook
|
| 100 |
+
Audio("speech.wav")
|
| 101 |
+
|
| 102 |
```
|