Spaces:

AutoArk-AI
/

GPA_DEMO

Running on L4

wanglamao committed 1 day ago

Commit

71d4610

1 Parent(s): f1fdc79

add trim logic

Files changed (1) hide show

app.py CHANGED Viewed

@@ -53,12 +53,16 @@ def preprocess_audio(audio_path):
         # Validate audio duration
         is_valid, duration = validate_audio_duration(audio_path)
         if not is_valid:
-            logger.error(f"Audio duration {duration:.2f}s exceeds max limit {MAX_AUDIO_DURATION}s")
-            raise ValueError(f"Audio duration cannot exceed {MAX_AUDIO_DURATION}s, current is {duration:.2f}s")
         # Load audio with librosa: automatically resamples to sr=16000 and converts to mono
         y, _ = librosa.load(audio_path, sr=16000, mono=True)
         # Save processed audio to a new file to avoid conflicts
         dir_name = os.path.dirname(audio_path)
         base_name = os.path.basename(audio_path)
@@ -110,8 +114,8 @@ def process_tts_a(text, ref_audio):
         # Validate text length
         is_valid, text_len = validate_text_length(text)
         if not is_valid:
-            logger.error(f"Text length {text_len} exceeds max limit {MAX_TEXT_LENGTH}")
-            raise ValueError(f"Text length cannot exceed {MAX_TEXT_LENGTH} chars, current is {text_len} chars")
         # Preprocess audio
         ref_audio = preprocess_audio(ref_audio)

         # Validate audio duration
         is_valid, duration = validate_audio_duration(audio_path)
         if not is_valid:
+            logger.warning(f"Audio duration {duration:.2f}s exceeds max limit {MAX_AUDIO_DURATION}s. Truncating.")
         # Load audio with librosa: automatically resamples to sr=16000 and converts to mono
         y, _ = librosa.load(audio_path, sr=16000, mono=True)
+        # Truncate if exceeds max duration
+        max_samples = int(MAX_AUDIO_DURATION * 16000)
+        if len(y) > max_samples:
+            y = y[:max_samples]
         # Save processed audio to a new file to avoid conflicts
         dir_name = os.path.dirname(audio_path)
         base_name = os.path.basename(audio_path)
         # Validate text length
         is_valid, text_len = validate_text_length(text)
         if not is_valid:
+            logger.warning(f"Text length {text_len} exceeds max limit {MAX_TEXT_LENGTH}. Truncating.")
+            text = text[:MAX_TEXT_LENGTH]
         # Preprocess audio
         ref_audio = preprocess_audio(ref_audio)