Spaces:
Sleeping
Sleeping
Peter Michael Gits Claude committed on
Commit ·
489f3e7
1
Parent(s): f3f17e8
CRITICAL FIX: Return single value from gradio_transcribe_memory endpoint
Browse files
- Fixed gradio_transcribe_memory to return only transcription text instead of 3-tuple
- This resolves JSON parsing errors in voiceCal-ai client
- voiceCal-ai expects single string but was receiving (transcription, timing, status)
- All error cases now also return single values
- Should resolve "Starting..." UI issue in voiceCal-ai
🤖 Generated with [Claude Code](https://claude.ai/code)
Co-Authored-By: Claude <noreply@anthropic.com>
app.py
CHANGED
|
@@ -223,7 +223,7 @@ def gradio_transcribe_memory(audio_base64: str, language: str = "en", model_size
|
|
| 223 |
|
| 224 |
if not audio_base64 or audio_base64 == "":
|
| 225 |
logger.warning("π MEMORY: No audio data provided")
|
| 226 |
-
return "β No audio data provided"
|
| 227 |
|
| 228 |
# Decode base64 to binary audio data
|
| 229 |
try:
|
|
@@ -231,7 +231,7 @@ def gradio_transcribe_memory(audio_base64: str, language: str = "en", model_size
|
|
| 231 |
logger.info(f"π MEMORY: Decoded audio size: {len(audio_binary)} bytes")
|
| 232 |
except Exception as decode_error:
|
| 233 |
logger.error(f"π MEMORY: Base64 decode error: {decode_error}")
|
| 234 |
-
return f"β Invalid base64 audio data: {decode_error}"
|
| 235 |
|
| 236 |
# Save to temporary file for Whisper processing (still needed for torchaudio.load)
|
| 237 |
with tempfile.NamedTemporaryFile(suffix='.webm', delete=False) as tmp_file:
|
|
@@ -249,9 +249,9 @@ def gradio_transcribe_memory(audio_base64: str, language: str = "en", model_size
|
|
| 249 |
logger.info(f"π MEMORY: Status: {status}")
|
| 250 |
|
| 251 |
if status == "success":
|
| 252 |
-
return
|
| 253 |
else:
|
| 254 |
-
return
|
| 255 |
|
| 256 |
finally:
|
| 257 |
# Clean up temp file
|
|
@@ -262,7 +262,7 @@ def gradio_transcribe_memory(audio_base64: str, language: str = "en", model_size
|
|
| 262 |
except Exception as e:
|
| 263 |
error_msg = f"Error in gradio_transcribe_memory: {str(e)}"
|
| 264 |
logger.error(f"π MEMORY: {error_msg}")
|
| 265 |
-
return f"β Error: {str(e)}"
|
| 266 |
|
| 267 |
# Create Gradio interface with transcription functionality
|
| 268 |
with gr.Blocks(title="π€ STT WebSocket Service v1.0.0") as demo:
|
|
|
|
| 223 |
|
| 224 |
if not audio_base64 or audio_base64 == "":
|
| 225 |
logger.warning("π MEMORY: No audio data provided")
|
| 226 |
+
return "β No audio data provided"
|
| 227 |
|
| 228 |
# Decode base64 to binary audio data
|
| 229 |
try:
|
|
|
|
| 231 |
logger.info(f"π MEMORY: Decoded audio size: {len(audio_binary)} bytes")
|
| 232 |
except Exception as decode_error:
|
| 233 |
logger.error(f"π MEMORY: Base64 decode error: {decode_error}")
|
| 234 |
+
return f"β Invalid base64 audio data: {decode_error}"
|
| 235 |
|
| 236 |
# Save to temporary file for Whisper processing (still needed for torchaudio.load)
|
| 237 |
with tempfile.NamedTemporaryFile(suffix='.webm', delete=False) as tmp_file:
|
|
|
|
| 249 |
logger.info(f"π MEMORY: Status: {status}")
|
| 250 |
|
| 251 |
if status == "success":
|
| 252 |
+
return transcription # Return only transcription for voiceCal-ai compatibility
|
| 253 |
else:
|
| 254 |
+
return "β Transcription failed"
|
| 255 |
|
| 256 |
finally:
|
| 257 |
# Clean up temp file
|
|
|
|
| 262 |
except Exception as e:
|
| 263 |
error_msg = f"Error in gradio_transcribe_memory: {str(e)}"
|
| 264 |
logger.error(f"π MEMORY: {error_msg}")
|
| 265 |
+
return f"β Error: {str(e)}"
|
| 266 |
|
| 267 |
# Create Gradio interface with transcription functionality
|
| 268 |
with gr.Blocks(title="π€ STT WebSocket Service v1.0.0") as demo:
|