Spaces:
Build error
Build error
Commit
·
ebe9cbe
1
Parent(s):
7d0bff2
Add some more sample voices
Browse files
- .vscode/settings.json +3 -0
- app.py +17 -7
- input/sample/Dwayne-Johnson-sample.wav +3 -0
- input/sample/Elon-Sample.wav +3 -0
- input/sample/Obama-sample.wav +3 -0
- output/output.wav +2 -2
.vscode/settings.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cSpell.words": ["Elon"]
|
| 3 |
+
}
|
app.py
CHANGED
|
@@ -9,7 +9,7 @@ all_models = TTS.list_models()
|
|
| 9 |
# print(model)
|
| 10 |
|
| 11 |
# print("Using model: ", all_models[0])
|
| 12 |
-
|
| 13 |
# Init TTS
|
| 14 |
|
| 15 |
|
|
@@ -17,6 +17,8 @@ print("Downloading model...", '')
|
|
| 17 |
|
| 18 |
voiceCloneModel = TTS('tts_models/multilingual/multi-dataset/your_tts')
|
| 19 |
|
|
|
|
|
|
|
| 20 |
|
| 21 |
def run_cmd(command):
|
| 22 |
try:
|
|
@@ -36,27 +38,35 @@ def inference(text, speaker):
|
|
| 36 |
speaker = 'input/obama.mp3'
|
| 37 |
elif (speaker == 'Speaker-4'):
|
| 38 |
speaker = 'input/trump.wav'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 39 |
else:
|
| 40 |
speaker = 'input/z-default.wav'
|
| 41 |
# print("speaker: ", speaker)
|
| 42 |
# cmd = ['tts', '--text', text, '--out_path', 'output/tts_output.wav']
|
| 43 |
# run_cmd(cmd)
|
| 44 |
# Text to speech to a file
|
| 45 |
-
# tts = TTS(
|
| 46 |
# progress_bar=False, gpu=True)
|
| 47 |
voiceCloneModel.tts_to_file(text, speaker_wav=speaker,
|
| 48 |
language="en", file_path="output/output.wav")
|
| 49 |
|
| 50 |
-
# for i in range(len(
|
| 51 |
-
#
|
| 52 |
-
#
|
| 53 |
|
| 54 |
return 'output/output.wav'
|
| 55 |
|
| 56 |
|
|
|
|
|
|
|
| 57 |
inputs = [gr.inputs.Textbox(lines=5, label="Input Text"),
|
| 58 |
-
gr.inputs.Dropdown(
|
| 59 |
-
|
| 60 |
]
|
| 61 |
outputs = gr.outputs.Audio(type="filepath", label="Output Audio")
|
| 62 |
title = "Text To Speech"
|
|
|
|
| 9 |
# print(model)
|
| 10 |
|
| 11 |
# print("Using model: ", all_models[0])
|
| 12 |
+
model = all_models[0]
|
| 13 |
# Init TTS
|
| 14 |
|
| 15 |
|
|
|
|
| 17 |
|
| 18 |
voiceCloneModel = TTS('tts_models/multilingual/multi-dataset/your_tts')
|
| 19 |
|
| 20 |
+
# tts = TTS("tts_models/de/thorsten/tacotron2-DDC")
|
| 21 |
+
|
| 22 |
|
| 23 |
def run_cmd(command):
|
| 24 |
try:
|
|
|
|
| 38 |
speaker = 'input/obama.mp3'
|
| 39 |
elif (speaker == 'Speaker-4'):
|
| 40 |
speaker = 'input/trump.wav'
|
| 41 |
+
elif (speaker == 'Rock'):
|
| 42 |
+
speaker = 'input/sample/Dwayne-Johnson-sample.wav'
|
| 43 |
+
elif (speaker == 'Elon'):
|
| 44 |
+
speaker = 'input/sample/Elon-Sample.wav'
|
| 45 |
+
elif (speaker == 'Obama'):
|
| 46 |
+
speaker = 'input/sample/Obama-sample.wav'
|
| 47 |
else:
|
| 48 |
speaker = 'input/z-default.wav'
|
| 49 |
# print("speaker: ", speaker)
|
| 50 |
# cmd = ['tts', '--text', text, '--out_path', 'output/tts_output.wav']
|
| 51 |
# run_cmd(cmd)
|
| 52 |
# Text to speech to a file
|
| 53 |
+
# tts = TTS(model="tts_models/multilingual/multi-dataset/your_tts",
|
| 54 |
# progress_bar=False, gpu=True)
|
| 55 |
voiceCloneModel.tts_to_file(text, speaker_wav=speaker,
|
| 56 |
language="en", file_path="output/output.wav")
|
| 57 |
|
| 58 |
+
# for i in range(len(model.languages)):
|
| 59 |
+
# model.tts_to_file(text=text,
|
| 60 |
+
# speaker=model.speakers[i], language=model.languages[0], file_path='output/output-'+str(i)+'.wav')
|
| 61 |
|
| 62 |
return 'output/output.wav'
|
| 63 |
|
| 64 |
|
| 65 |
+
sampleInput = ['Speaker-1', 'Speaker-2', 'Speaker-3',
|
| 66 |
+
'Speaker-4', 'Rock', 'Elon', 'Obama']
|
| 67 |
inputs = [gr.inputs.Textbox(lines=5, label="Input Text"),
|
| 68 |
+
gr.inputs.Dropdown(
|
| 69 |
+
sampleInput, label="Sample Input", default="Speaker-1",)
|
| 70 |
]
|
| 71 |
outputs = gr.outputs.Audio(type="filepath", label="Output Audio")
|
| 72 |
title = "Text To Speech"
|
input/sample/Dwayne-Johnson-sample.wav
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3c3d9d61a817cc459f890867c584a0496245c81b747205b48c18b49b6723d8b
|
| 3 |
+
size 1578042
|
input/sample/Elon-Sample.wav
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6609e4b4c5a8ce77eff174fd2eca989ded8a28fd2ca5b1866035fd54247649b
|
| 3 |
+
size 1233978
|
input/sample/Obama-sample.wav
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6dec4bb97019439e01a8909d68f5704e0e2c6de12c57865f3d4a01132519c045
|
| 3 |
+
size 930874
|
output/output.wav
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:07abadaef514caf57a002e76da940e5900a6851ccba39076c3e7eb4359fdf82d
|
| 3 |
+
size 1364620
|