Spaces:

ArtSpace
/

TransCree

Sleeping

App Files Community

ArtSpace committed on Jan 19

Commit

49e6533

verified ·

1 Parent(s): 1a1c969

Update app.py

Browse files

Files changed (1) hide show

app.py +18 -9

app.py CHANGED Viewed

@@ -79,6 +79,7 @@ class MediaDownloader:
             if progress_callback:
                 progress_callback(0.1, "Starting download...")
             output_template = str(self.output_dir / "%(title)s.%(ext)s")
             cmd = [
                 "yt-dlp",
@@ -94,13 +95,14 @@ class MediaDownloader:
             if result.returncode != 0:
                 return DownloadResult(success=False, error=result.stderr)
-            # Find downloaded file
             files = list(self.output_dir.glob("*"))
             media_files = [f for f in files if f.suffix.lower() in SUPPORTED_MEDIA]
             if not media_files:
                 return DownloadResult(success=False, error="No media file found after download")
             downloaded_file = max(media_files, key=lambda x: x.stat().st_mtime)
             if progress_callback:
@@ -177,7 +179,7 @@ class SpeechTranscriber:
             if progress_callback:
                 progress_callback(0.1, "Transcribing...")
-            # Convert language code (ar-EG → ar)
             lang_code = language.split('-')[0] if '-' in language else language
             if hasattr(self, 'use_openai'):
@@ -210,13 +212,17 @@ def generate_srt(segments, output_path: Path):
     """Generate SRT subtitle file"""
     with open(output_path, 'w', encoding='utf-8') as f:
         for i, seg in enumerate(segments, 1):
-            start = format_timestamp(seg.start if hasattr(seg, 'start') else seg['start'])
-            end = format_timestamp(seg.end if hasattr(seg, 'end') else seg['end'])
-            text = seg.text if hasattr(seg, 'text') else seg['text']
             f.write(f"{i}\n")
             f.write(f"{start} --> {end}\n")
-            f.write(f"{text.strip()}\n\n")
 def format_timestamp(seconds: float) -> str:
     """Format seconds to SRT timestamp"""
@@ -255,7 +261,7 @@ class TranscriptionPipeline:
                 progress(0.1, desc="Downloading...")
                 download_result = self.downloader.download_url(
                     source_url.strip(),
-                    lambda p, msg: progress(p * 0.3, desc=msg)
                 )
                 if not download_result.success:
                     return f"❌ Download failed: {download_result.error}", None, None, None
@@ -267,18 +273,21 @@ class TranscriptionPipeline:
             progress(0.4, desc="Converting to WAV...")
             conversion_result = self.converter.convert(
                 source_path,
-                lambda p, msg: progress(0.4 + p * 0.2, desc=msg)
             )
             if not conversion_result.success:
                 return f"❌ Conversion failed: {conversion_result.error}", None, None, None
             # Step 3: Transcribe
             progress(0.6, desc="Transcribing audio...")
             transcription_result = self.transcriber.transcribe(
                 conversion_result.wav_path,
                 language=language,
-                lambda p, msg: progress(0.6 + p * 0.4, desc=msg)
             )
             if not transcription_result.success:
                 return f"❌ Transcription failed: {transcription_result.error}", None, None, None

             if progress_callback:
                 progress_callback(0.1, "Starting download...")
+            # Using %(title)s.%(ext)s template
             output_template = str(self.output_dir / "%(title)s.%(ext)s")
             cmd = [
                 "yt-dlp",
             if result.returncode != 0:
                 return DownloadResult(success=False, error=result.stderr)
+            # Find downloaded file (most recently modified in the dir)
             files = list(self.output_dir.glob("*"))
             media_files = [f for f in files if f.suffix.lower() in SUPPORTED_MEDIA]
             if not media_files:
                 return DownloadResult(success=False, error="No media file found after download")
+            # Get the newest file
             downloaded_file = max(media_files, key=lambda x: x.stat().st_mtime)
             if progress_callback:
             if progress_callback:
                 progress_callback(0.1, "Transcribing...")
+            # Convert language code (ar-EG -> ar)
             lang_code = language.split('-')[0] if '-' in language else language
             if hasattr(self, 'use_openai'):
     """Generate SRT subtitle file"""
     with open(output_path, 'w', encoding='utf-8') as f:
         for i, seg in enumerate(segments, 1):
+            # Handle differences between whisper lib versions
+            start_time = seg.start if hasattr(seg, 'start') else seg.get('start', 0)
+            end_time = seg.end if hasattr(seg, 'end') else seg.get('end', 0)
+            text_content = seg.text if hasattr(seg, 'text') else seg.get('text', "")
+            start = format_timestamp(start_time)
+            end = format_timestamp(end_time)
             f.write(f"{i}\n")
             f.write(f"{start} --> {end}\n")
+            f.write(f"{text_content.strip()}\n\n")
 def format_timestamp(seconds: float) -> str:
     """Format seconds to SRT timestamp"""
                 progress(0.1, desc="Downloading...")
                 download_result = self.downloader.download_url(
                     source_url.strip(),
+                    progress_callback=lambda p, msg: progress(p * 0.3, desc=msg)
                 )
                 if not download_result.success:
                     return f"❌ Download failed: {download_result.error}", None, None, None
             progress(0.4, desc="Converting to WAV...")
             conversion_result = self.converter.convert(
                 source_path,
+                progress_callback=lambda p, msg: progress(0.4 + p * 0.2, desc=msg)
             )
             if not conversion_result.success:
                 return f"❌ Conversion failed: {conversion_result.error}", None, None, None
             # Step 3: Transcribe
             progress(0.6, desc="Transcribing audio...")
+            # ===== FIXED CALL HERE =====
             transcription_result = self.transcriber.transcribe(
                 conversion_result.wav_path,
                 language=language,
+                progress_callback=lambda p, msg: progress(0.6 + p * 0.4, desc=msg)
             )
             if not transcription_result.success:
                 return f"❌ Transcription failed: {transcription_result.error}", None, None, None