Spaces:

Rajhuggingface4253
/

neu

Paused

App Files Files Community

Rajhuggingface4253 committed on Oct 16

Commit

26c5cf5

verified ·

1 Parent(s): 97f4e01

Update app.py

Browse files

Files changed (1) hide show

app.py +47 -55

app.py CHANGED Viewed

@@ -3,45 +3,39 @@ import sys
 import uuid
 import logging
 from typing import Optional
-import numpy as np
-from fastapi import FastAPI, HTTPException, UploadFile, File, Form
-from fastapi.responses import FileResponse, JSONResponse
-from fastapi.middleware.cors import CORSMiddleware
-import soundfile as sf
-import io
 # Set up logging
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger("neutts-api")
-# Add neutts-air to Python path BEFORE any imports
 neutts_path = os.path.join(os.getcwd(), "neutts-air")
 sys.path.insert(0, neutts_path)
 logger.info(f"Current directory: {os.getcwd()}")
-logger.info(f"Python path: {sys.path}")
-# Check if neutts-air exists and what's in it
-if os.path.exists(neutts_path):
-    logger.info("neutts-air directory exists")
-    logger.info(f"Contents: {os.listdir(neutts_path)}")
-    # Check for the specific module structure
-    neuttsair_path = os.path.join(neutts_path, "neuttsair")
-    if os.path.exists(neuttsair_path):
-        logger.info(f"neuttsair subdirectory exists: {os.listdir(neuttsair_path)}")
-    else:
-        logger.error("neuttsair subdirectory not found!")
-else:
-    logger.error("neutts-air directory not found!")
 try:
-    # Now import - this should work with the path added
     from neuttsair.neutts import NeuTTSAir
-    logger.info("✅ Successfully imported NeuTTSAir")
 except ImportError as e:
     logger.error(f"❌ Import failed: {e}")
-    # Try to provide more detailed debug info
     import traceback
     traceback.print_exc()
     raise
@@ -79,6 +73,8 @@ def initialize_model():
             logger.info("✅ NeuTTS Air model initialized successfully")
         except Exception as e:
             logger.error(f"❌ Model initialization failed: {e}")
             raise
     return tts
@@ -87,8 +83,9 @@ async def startup_event():
     """Initialize model on startup"""
     try:
         initialize_model()
     except Exception as e:
-        logger.error(f"Startup initialization failed: {e}")
 @app.get("/")
 async def root():
@@ -101,14 +98,25 @@ async def root():
 @app.get("/health")
 async def health_check():
     return {
-        "status": "healthy",
         "model_loaded": tts is not None,
         "endpoints": {
             "synthesize": "/api/v1/synthesize",
-            "synthesize_b64": "/api/v1/synthesize/b64"
         }
     }
 @app.post("/api/v1/synthesize")
 async def synthesize_speech(
     ref_text: str = Form(..., description="Reference audio transcript"),
@@ -119,8 +127,8 @@ async def synthesize_speech(
     Synthesize speech using voice cloning - returns WAV file
     """
     try:
-        if tts is None:
-            initialize_model()
         # Validate input
         if not ref_text.strip() or not gen_text.strip():
@@ -143,10 +151,10 @@ async def synthesize_speech(
         # Perform inference
         logger.info("Encoding reference audio...")
-        ref_codes = tts.encode_reference(upload_path)
         logger.info("Generating speech...")
-        wav = tts.infer(gen_text, ref_codes, ref_text)
         # Save output
         os.makedirs("outputs", exist_ok=True)
@@ -169,6 +177,8 @@ async def synthesize_speech(
     except Exception as e:
         logger.error(f"Synthesis error: {str(e)}")
         raise HTTPException(500, f"Synthesis failed: {str(e)}")
 @app.post("/api/v1/synthesize/b64")
@@ -181,8 +191,7 @@ async def synthesize_speech_base64(
     Synthesize speech and return as base64 encoded audio
     """
     try:
-        if tts is None:
-            initialize_model()
         # Save uploaded file
         os.makedirs("uploads", exist_ok=True)
@@ -192,8 +201,8 @@ async def synthesize_speech_base64(
             f.write(content)
         # Perform inference
-        ref_codes = tts.encode_reference(upload_path)
-        wav = tts.infer(gen_text, ref_codes, ref_text)
         # Convert to base64
         buffer = io.BytesIO()
@@ -218,27 +227,10 @@ async def synthesize_speech_base64(
     except Exception as e:
         logger.error(f"Base64 synthesis error: {str(e)}")
         raise HTTPException(500, f"Synthesis failed: {str(e)}")
-# Simple test endpoint
-@app.get("/api/v1/test")
-async def test_endpoint():
-    """Test endpoint to verify basic functionality"""
-    try:
-        if tts is None:
-            initialize_model()
-        return {
-            "status": "success",
-            "message": "API is working",
-            "model_loaded": tts is not None
-        }
-    except Exception as e:
-        return {
-            "status": "error",
-            "message": str(e)
-        }
 if __name__ == "__main__":
     import uvicorn
     uvicorn.run(app, host="0.0.0.0", port=7860)

 import uuid
 import logging
 from typing import Optional
+# CRITICAL: Set numba environment variables BEFORE the third-party imports below (only stdlib modules are imported above)
+os.environ['NUMBA_CACHE_DIR'] = '/tmp/numba_cache'
+os.environ['NUMBA_DISABLE_JIT'] = '0'  # Keep JIT enabled but control cache
+# Create cache directory
+os.makedirs('/tmp/numba_cache', exist_ok=True)
 # Set up logging
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger("neutts-api")
+# Add neutts-air to Python path
 neutts_path = os.path.join(os.getcwd(), "neutts-air")
 sys.path.insert(0, neutts_path)
 logger.info(f"Current directory: {os.getcwd()}")
 try:
+    # Import after environment setup
+    import numpy as np
+    from fastapi import FastAPI, HTTPException, UploadFile, File, Form
+    from fastapi.responses import FileResponse, JSONResponse
+    from fastapi.middleware.cors import CORSMiddleware
+    import soundfile as sf
+    import io
+    # Now import NeuTTS - this should work with the numba cache fix
     from neuttsair.neutts import NeuTTSAir
+    logger.info("✅ All imports successful")
 except ImportError as e:
     logger.error(f"❌ Import failed: {e}")
     import traceback
     traceback.print_exc()
     raise
             logger.info("✅ NeuTTS Air model initialized successfully")
         except Exception as e:
             logger.error(f"❌ Model initialization failed: {e}")
+            import traceback
+            traceback.print_exc()
             raise
     return tts
     """Initialize model on startup"""
     try:
         initialize_model()
+        logger.info("✅ Startup initialization successful")
     except Exception as e:
+        logger.warning(f"⚠️ Startup initialization failed: {e}")
 @app.get("/")
 async def root():
 @app.get("/health")
 async def health_check():
     return {
+        "status": "healthy" if tts is not None else "degraded",
         "model_loaded": tts is not None,
         "endpoints": {
             "synthesize": "/api/v1/synthesize",
+            "synthesize_b64": "/api/v1/synthesize/b64",
+            "test": "/api/v1/test"
         }
     }
+@app.get("/api/v1/test")
+async def test_endpoint():
+    """Test endpoint that doesn't require model initialization"""
+    return {
+        "status": "success",
+        "message": "API is working",
+        "model_loaded": tts is not None,
+        "numba_cache": os.environ.get('NUMBA_CACHE_DIR', 'not set')
+    }
 @app.post("/api/v1/synthesize")
 async def synthesize_speech(
     ref_text: str = Form(..., description="Reference audio transcript"),
     Synthesize speech using voice cloning - returns WAV file
     """
     try:
+        # Initialize model if needed
+        tts_model = initialize_model()
         # Validate input
         if not ref_text.strip() or not gen_text.strip():
         # Perform inference
         logger.info("Encoding reference audio...")
+        ref_codes = tts_model.encode_reference(upload_path)
         logger.info("Generating speech...")
+        wav = tts_model.infer(gen_text, ref_codes, ref_text)
         # Save output
         os.makedirs("outputs", exist_ok=True)
     except Exception as e:
         logger.error(f"Synthesis error: {str(e)}")
+        import traceback
+        traceback.print_exc()
         raise HTTPException(500, f"Synthesis failed: {str(e)}")
 @app.post("/api/v1/synthesize/b64")
     Synthesize speech and return as base64 encoded audio
     """
     try:
+        tts_model = initialize_model()
         # Save uploaded file
         os.makedirs("uploads", exist_ok=True)
             f.write(content)
         # Perform inference
+        ref_codes = tts_model.encode_reference(upload_path)
+        wav = tts_model.infer(gen_text, ref_codes, ref_text)
         # Convert to base64
         buffer = io.BytesIO()
     except Exception as e:
         logger.error(f"Base64 synthesis error: {str(e)}")
+        import traceback
+        traceback.print_exc()
         raise HTTPException(500, f"Synthesis failed: {str(e)}")
 if __name__ == "__main__":
     import uvicorn
     uvicorn.run(app, host="0.0.0.0", port=7860)