Spaces:

E-motionAssistant
/

Space2

Sleeping

App Files Files Community

amasha03 committed 24 days ago

Commit

0861d22

verified ·

1 Parent(s): 8636826

Update app.py

Browse files

Files changed (1) hide show

app.py +23 -48

app.py CHANGED Viewed

@@ -12,80 +12,55 @@ def load_eng_model():
     model_path = hf_hub_download(repo_id=repo_id, filename="best_model.pth")
     config_path = hf_hub_download(repo_id=repo_id, filename="config.json")
-    # --- THE FIX: MANUALLY OVERWRITE THE FILE ON DISK ---
     with open(config_path, 'r') as f:
-        config_data = json.load(f)
-    # Force the character count in the dictionary
-    print("Modifying config file on disk to 137 characters...")
-    config_data["model_args"]["num_chars"] = 137
-    # Save it back to the same file
-    with open(config_path, 'w') as f:
-        json.dump(config_data, f)
-    # ---------------------------------------------------
-    # Now load using the paths normally. Since the file is
-    # changed on disk, the model will read 137 correctly.
-    tts = TTS(model_path=model_path, config_path=config_path, gpu=False)
     gc.collect()
     return tts
 # --- Global Initialization ---
-print("Starting English TTS...")
 try:
     eng_tts = load_eng_model()
-    print("--- ENGLISH MODEL LOADED SUCCESSFULLY ---")
 except Exception as e:
     print(f"CRITICAL ERROR: {e}")
     eng_tts = None
 def generate_voice(text):
-    print(f"\n>>> SYNTHESIS START: '{text}'")
     if eng_tts is None:
-        print(">>> ERROR: eng_tts is None. Model did not load!")
         return None
     try:
-        # Use an absolute path to ensure Gradio finds it
         output_path = os.path.join(os.getcwd(), "en_output.wav")
-        # Clean up old file if it exists
-        if os.path.exists(output_path):
-            os.remove(output_path)
-            print(">>> Cleaned old audio file.")
-        # Synthesis
-        print(">>> Running tts_to_file...")
         eng_tts.tts_to_file(text=str(text), file_path=output_path)
-        # Check if the file actually exists and has data
-        if os.path.exists(output_path):
-            size = os.path.getsize(output_path)
-            if size > 1000: # Files smaller than 1KB are usually silent/empty
-                print(f">>> SUCCESS: Audio generated ({size} bytes)")
-                return output_path
-            else:
-                print(f">>> ERROR: File created but it is TOO SMALL ({size} bytes).")
-        else:
-            print(">>> ERROR: tts_to_file finished but NO FILE was found on disk.")
     except Exception as e:
-        print(f">>> GENERATION CRASHED: {e}")
-        # If espeak is missing, the error will appear here!
-    return None
-# Gradio Interface - Added interactive features to help debugging
 demo = gr.Interface(
     fn=generate_voice,
-    inputs=gr.Textbox(label="Input English Text", value="Hello, the system is now testing audio output."),
-    outputs=gr.Audio(label="Synthesized Speech", type="filepath", autoplay=True),
-    title="English VITS TTS",
-    allow_flagging="never"
 )
 if __name__ == "__main__":
     demo.launch()

     model_path = hf_hub_download(repo_id=repo_id, filename="best_model.pth")
     config_path = hf_hub_download(repo_id=repo_id, filename="config.json")
+    # 1. Read the config file
     with open(config_path, 'r') as f:
+        config_dict = json.load(f)
+    # 2. Force the character count to 137 in the dictionary
+    print("Forcing 137 characters in config...")
+    config_dict["model_args"]["num_chars"] = 137
+    # 3. Save it back to a NEW local file to ensure it's fresh
+    local_config_path = os.path.join(os.getcwd(), "fixed_config.json")
+    with open(local_config_path, 'w') as f:
+        json.dump(config_dict, f)
+    # 4. Initialize TTS and load model
+    # Use the local_config_path we just created
+    print("Initializing TTS engine with fixed config...")
+    tts = TTS(model_path=model_path, config_path=local_config_path, gpu=False)
     gc.collect()
     return tts
 # --- Global Initialization ---
+print("Starting English TTS Startup...")
 try:
     eng_tts = load_eng_model()
+    print("--- SUCCESS: ENGLISH MODEL LOADED ---")
 except Exception as e:
     print(f"CRITICAL ERROR: {e}")
     eng_tts = None
 def generate_voice(text):
     if eng_tts is None:
         return None
     try:
         output_path = os.path.join(os.getcwd(), "en_output.wav")
+        # Synthesize
         eng_tts.tts_to_file(text=str(text), file_path=output_path)
+        return output_path
     except Exception as e:
+        print(f"Generation Error: {e}")
+        return None
+# Gradio Interface (Fixed: removed 'allow_flagging' which caused the crash)
 demo = gr.Interface(
     fn=generate_voice,
+    inputs=gr.Textbox(label="Input English Text"),
+    outputs=gr.Audio(label="Synthesized Speech", type="filepath"),
+    title="English VITS TTS"
 )
 if __name__ == "__main__":
     demo.launch()