Voice-Cloning

Configuration error

App Files Files Community

peteralexandercharles committed on Jan 9, 2023

Commit

4236718

1 Parent(s): c3d118a

Update app.py

Browse files

Files changed (1) hide show

app.py +6 -6

app.py CHANGED Viewed

@@ -116,15 +116,15 @@ def greet(Text,Voicetoclone,VoiceMicrophone):
       print(VoiceMicrophone)
       sample= str(VoiceMicrophone)
     size= len(reference_files)*sys.getsizeof(reference_files)
-    size2= size / 1000000
-    if (size2 > 0.012) or len(text)>2000:
-      message="File is greater than 30mb or Text inserted is longer than 2000 characters. Please re-try with smaller sizes."
       print(message)
       raise SystemExit("File is greater than 30mb. Please re-try or Text inserted is longer than 2000 characters. Please re-try with smaller sizes.")
     else:
-      os.system('ffmpeg-normalize $sample -nt rms -t=-27 -o $sample -ar 16000 -f')
       reference_emb = SE_speaker_manager.compute_d_vector_from_clip(reference_files)
-      model.length_scale = 1  # scaler for the duration predictor. The larger it is, the slower the speech.
       model.inference_noise_scale = 0.3 # defines the noise variance applied to the random z vector at inference.
       model.inference_noise_scale_dp = 0.3 # defines the noise variance applied to the duration predictor z vector at inference.
       text = text
@@ -158,7 +158,7 @@ def greet(Text,Voicetoclone,VoiceMicrophone):
 demo = gr.Interface(
     fn=greet,
-    inputs=[gr.inputs.Textbox(label='What would you like the voice to say? (max. 2000 characters per request)'),gr.Audio(type="filepath",         source="upload",label='Please upload a voice to clone (max. 30mb)'),gr.Audio(source="microphone", type="filepath", streaming=True)],
     outputs="audio",
     title="Bilal's Voice Cloning Tool"
     )

       print(VoiceMicrophone)
       sample= str(VoiceMicrophone)
     size= len(reference_files)*sys.getsizeof(reference_files)
+    size2= size / 10000000
+    if (size2 > 0.012) or len(text)>20000:
+      message="File is greater than 300mb or Text inserted is longer than 20000 characters. Please re-try with smaller sizes."
       print(message)
       raise SystemExit("File is greater than 30mb. Please re-try or Text inserted is longer than 2000 characters. Please re-try with smaller sizes.")
     else:
+      os.system('ffmpeg-normalize $sample -nt rms -t=-270 -o $sample -ar 160000 -f')
       reference_emb = SE_speaker_manager.compute_d_vector_from_clip(reference_files)
+      model.length_scale = 2  # scaler for the duration predictor. The larger it is, the slower the speech.
       model.inference_noise_scale = 0.3 # defines the noise variance applied to the random z vector at inference.
       model.inference_noise_scale_dp = 0.3 # defines the noise variance applied to the duration predictor z vector at inference.
       text = text
 demo = gr.Interface(
     fn=greet,
+    inputs=[gr.inputs.Textbox(label='What would you like the voice to say? (max. 20000 characters per request)'),gr.Audio(type="filepath",         source="upload",label='Please upload a voice to clone (max. 30mb)'),gr.Audio(source="microphone", type="filepath", streaming=True)],
     outputs="audio",
     title="Bilal's Voice Cloning Tool"
     )