datasetsANDmodels committed on
Commit
2f9d6f5
·
verified ·
1 Parent(s): 4633c83

Upload usage.py

Browse files
Files changed (1) hide show
  1. usage.py +21 -0
usage.py ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
"""Synthesize one Indonesian sentence with a VITS model and save it as a WAV file.

Loads the model and tokenizer named "indonesian-tts", runs a single forward
pass on a fixed sentence, peak-normalizes the waveform, and writes it to
"indonesian.wav" in the current working directory.
"""

from transformers import VitsModel, AutoTokenizer
import torch
import scipy
# Import the submodule explicitly: a bare `import scipy` only exposes
# `scipy.io.wavfile` when SciPy's lazy submodule loading is available.
import scipy.io.wavfile
import numpy as np

# NOTE(review): "indonesian-tts" is passed verbatim to from_pretrained;
# presumably a local checkpoint directory or a hub id -- confirm.
model = VitsModel.from_pretrained("indonesian-tts")
tokenizer = AutoTokenizer.from_pretrained("indonesian-tts")

text = "Saya menelepon dari kantor pajak."
inputs = tokenizer(text, return_tensors="pt")

# Inference only, so gradient tracking is disabled.
with torch.no_grad():
    output = model(**inputs).waveform

output_np = output.squeeze().numpy()  # Remove extra dimensions

# Peak-normalize so the loudest sample has magnitude 1.0 (prevents clipping).
# A silent or empty waveform is left untouched: dividing by a zero peak would
# fill the array with NaNs, and np.max raises on an empty array.
peak = np.max(np.abs(output_np)) if output_np.size else 0.0
if peak > 0:
    output_np = output_np / peak

scipy.io.wavfile.write(
    "indonesian.wav",
    rate=model.config.sampling_rate,
    data=output_np,
)