Nav3005 committed on
Commit
23b54a0
·
verified ·
1 Parent(s): 3a97dde

Upload 3 files

Browse files
Files changed (3) hide show
  1. Dockerfile +28 -0
  2. app.py +873 -0
  3. requirements.txt +8 -0
Dockerfile ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
FROM python:3.11-slim

# System libraries needed by Pillow (libgl/glib), OpenMP consumers, and
# fontconfig for libass font resolution.
RUN apt-get update && apt-get install -y --no-install-recommends \
    libgl1-mesa-glx \
    libglib2.0-0 \
    libgomp1 \
    fontconfig \
    && rm -rf /var/lib/apt/lists/*

WORKDIR /app

# Install Python dependencies first (layer caching across code-only edits)
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt

# BUG FIX: COPY is a builder instruction, not a shell command — the previous
# "COPY app.py . 2>/dev/null || true" passed the redirection to the builder
# verbatim and failed the build. Copy the whole build context instead; the
# optional files (reddit_template.png, fonts/) are included when present.
COPY . .

# Hugging Face Spaces requires port 7860
EXPOSE 7860

# Run with uvicorn on the required HF port
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860", "--workers", "1"]
app.py ADDED
@@ -0,0 +1,873 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import subprocess
2
+ import static_ffmpeg
3
+ import os
4
+ import tempfile
5
+ import requests
6
+ import re
7
+ import textwrap
8
+ import shutil
9
+ import time
10
+ import uuid
11
+ import asyncio
12
+ from datetime import datetime
13
+ from PIL import Image, ImageDraw, ImageFont
14
+ from functools import lru_cache
15
+ from typing import Optional
16
+ from concurrent.futures import ThreadPoolExecutor
17
+
18
+ from fastapi import FastAPI, UploadFile, File, Form, HTTPException, BackgroundTasks, Request
19
+ from fastapi.responses import FileResponse, JSONResponse
20
+ from fastapi.middleware.cors import CORSMiddleware
21
+ from pydantic import BaseModel, Field
22
+ import aiofiles
23
+
24
+
25
# ========================================
# CONFIGURATION SECTION - CUSTOMIZE HERE
# ========================================

# Reddit Template Text Settings
REDDIT_CONFIG = {
    'template_file': 'reddit_template.png',  # Template filename in script directory
    'font_file': 'RFDewi-Bold.ttf',          # Font file for Reddit text
    'font_size_max': 180,                    # Maximum font size to try
    'font_size_min': 16,                     # Minimum font size (if text too long)
    'text_wrap_width': 35,                   # Characters per line for wrapping
    'text_color': 'black',                   # Text color
    'line_spacing': 10,                      # Spacing between lines
    'text_box_width_percent': 0.85,          # 85% of template width
    'text_box_height_percent': 0.65,         # 65% of template height
    'y_offset': 20,                          # Vertical offset from center
}

# Word-by-Word Subtitle Settings
SUBTITLE_CONFIG = {
    'font_file': 'TitanOne-Regular.ttf',     # Font file for subtitles (TTF or OTF)
    'font_name': 'Titan One',                # Font name as it appears in system
    'font_size_default': 12,                 # Default subtitle font size
    'position_alignment': 5,                 # 5 = center (1-9 numpad layout)
    'margin_left': 50,
    'margin_right': 70,
    'margin_vertical': 0,
}

# Video Processing Settings
VIDEO_CONFIG = {
    'reddit_scale_percent': 0.75,            # Reddit template size (0.75 = 75% of video width)
    'fade_start_percent': 0.70,              # When fade to color starts (70% of audio duration)
    'fade_end_percent': 0.83,                # When fully faded to color (83%)
    'promo_percent': 0.1,                    # Last 10% for book cover
    'fade_color_rgb': (218, 207, 195),       # Fade color RGB
    'book_fade_in_duration': 2,              # Book cover fade-in duration (seconds)
}

# ========================================
# END CONFIGURATION SECTION
# ========================================
67
+
68
# Add the static_ffmpeg-bundled ffmpeg/ffprobe binaries to PATH so the
# subprocess calls below resolve without a system-wide ffmpeg install.
static_ffmpeg.add_paths()

# Thread pool for background jobs (max 2 concurrent encoding jobs)
executor = ThreadPoolExecutor(max_workers=2)
73
+
74
def setup_custom_fonts_hf(temp_dir):
    """
    Setup custom fonts for FFmpeg/libass - Hugging Face Spaces compatible.

    Collects .ttf/.otf files from the repo's fonts/ directory plus the two
    configured font files, stages them under <temp_dir>/fonts, and writes a
    minimal fonts.conf pointing fontconfig at that directory.  Returns a
    copy of os.environ with FONTCONFIG_FILE/FONTCONFIG_PATH set; when no
    fonts are found — or on any failure — falls back to a plain env copy.
    """
    try:
        staging_dir = os.path.join(temp_dir, 'fonts')
        os.makedirs(staging_dir, exist_ok=True)

        base_dir = os.path.dirname(os.path.abspath(__file__))
        repo_fonts = os.path.join(base_dir, 'fonts')

        candidates = []
        if os.path.exists(repo_fonts):
            candidates = [
                os.path.join(repo_fonts, name)
                for name in os.listdir(repo_fonts)
                if name.endswith(('.ttf', '.otf', '.TTF', '.OTF'))
            ]

        for configured in (REDDIT_CONFIG['font_file'], SUBTITLE_CONFIG['font_file']):
            candidate = os.path.join(base_dir, configured)
            if os.path.exists(candidate) and candidate not in candidates:
                candidates.append(candidate)

        for source in candidates:
            shutil.copy(source, os.path.join(staging_dir, os.path.basename(source)))

        if not candidates:
            return os.environ.copy()

        staged = staging_dir
        conf_text = f"""<?xml version="1.0"?>
<fontconfig>
<dir>{staged}</dir>
<cachedir>{temp_dir}/cache</cachedir>
</fontconfig>
"""
        conf_path = os.path.join(temp_dir, 'fonts.conf')
        with open(conf_path, 'w') as handle:
            handle.write(conf_text)

        env = os.environ.copy()
        env['FONTCONFIG_FILE'] = conf_path
        env['FONTCONFIG_PATH'] = temp_dir
        return env

    except Exception:
        # Best-effort: font setup must never break the encode; fall back.
        return os.environ.copy()
121
+
122
def download_file_from_url(url, output_dir, filename):
    """Download a file from URL and save it to output directory.

    Streams the response body to disk in 8 KiB chunks so large media files
    are never held fully in memory.  Returns the saved path; any failure is
    re-raised as a generic Exception with context.
    """
    try:
        destination = os.path.join(output_dir, filename)
        response = requests.get(url, stream=True, timeout=30)
        response.raise_for_status()
        with open(destination, 'wb') as sink:
            for chunk in response.iter_content(chunk_size=8192):
                sink.write(chunk)
        return destination
    except Exception as e:
        raise Exception(f"Failed to download file from URL: {str(e)}")
136
+
137
def download_book_cover(book_id, output_dir):
    """Download book cover from Google Books API using Book ID.

    Fetches the front-cover image for ``book_id``, saves it as
    book_cover.png in ``output_dir``, and verifies the payload is a
    readable image before returning the saved path.

    Raises:
        Exception: if the download fails or the bytes are not a valid image.
    """
    try:
        image_url = f"https://books.google.com/books/publisher/content/images/frontcover/{book_id}"

        response = requests.get(image_url, timeout=30)
        response.raise_for_status()

        image_path = os.path.join(output_dir, 'book_cover.png')
        with open(image_path, 'wb') as f:
            f.write(response.content)

        # BUG FIX: the original called Image.open(...).verify() without
        # closing the handle, leaking the open file; the context manager
        # releases it after verification.
        with Image.open(image_path) as img:
            img.verify()

        return image_path
    except Exception as e:
        raise Exception(f"Failed to download book cover: {str(e)}")
155
+
156
def get_video_info(video_path):
    """Get video resolution and frame rate using ffprobe.

    Returns:
        (width, height, fps) as (int, int, float).

    Raises:
        Exception: on any ffprobe failure or unparseable output.
    """
    def _probe(entries, output_format):
        # One ffprobe query against the first video stream; returns stdout.
        command = [
            "ffprobe", "-v", "error", "-select_streams", "v:0",
            "-show_entries", entries, "-of", output_format, video_path,
        ]
        completed = subprocess.run(command, capture_output=True, text=True, check=True)
        return completed.stdout.strip()

    try:
        width, height = _probe("stream=width,height", "csv=s=x:p=0").split('x')

        rate = _probe("stream=r_frame_rate", "default=noprint_wrappers=1:nokey=1")
        # r_frame_rate is usually a rational like "30000/1001".
        if '/' in rate:
            numerator, denominator = rate.split('/')
            fps = float(numerator) / float(denominator)
        else:
            fps = float(rate)

        return int(width), int(height), fps
    except Exception as e:
        raise Exception(f"Failed to get video info: {str(e)}")
182
+
183
def get_audio_duration(audio_path):
    """Get audio duration in seconds using ffprobe.

    Raises:
        Exception: on ffprobe failure or non-numeric output.
    """
    try:
        completed = subprocess.run(
            [
                "ffprobe", "-v", "error", "-show_entries", "format=duration",
                "-of", "default=noprint_wrappers=1:nokey=1", audio_path,
            ],
            capture_output=True, text=True, check=True,
        )
        return float(completed.stdout.strip())
    except Exception as e:
        raise Exception(f"Failed to get audio duration: {str(e)}")
194
+
195
def extract_first_subtitle(srt_path):
    """Extract first subtitle entry. Returns: (text, start_sec, end_sec)

    Falls back to ("No subtitle found", 0.0, 3.0) when the file contains no
    parseable cue.  Raises Exception on I/O or parse errors.
    """
    def _timestamp_to_seconds(stamp):
        # "HH:MM:SS,mmm" -> float seconds.
        hours, minutes, rest = stamp.split(':')
        whole, millis = rest.split(',')
        return int(hours) * 3600 + int(minutes) * 60 + int(whole) + int(millis) / 1000.0

    try:
        with open(srt_path, 'r', encoding='utf-8') as handle:
            raw = handle.read()

        # Cues are separated by blank lines.
        cues = re.split(r'\n\s*\n', raw.strip())
        if cues:
            lines = cues[0].strip().split('\n')
            if len(lines) >= 3:
                parts = lines[1].split(' --> ')
                return (
                    ' '.join(lines[2:]).strip(),
                    _timestamp_to_seconds(parts[0].strip()),
                    _timestamp_to_seconds(parts[1].strip()),
                )

        return "No subtitle found", 0.0, 3.0
    except Exception as e:
        raise Exception(f"Failed to extract first subtitle: {str(e)}")
223
+
224
def create_reddit_card_with_text(template_path, hook_text, output_dir, config=REDDIT_CONFIG):
    """Create Reddit card with text using PIL.

    Renders ``hook_text`` centered on the template image, shrinking the font
    (from config['font_size_max'] down to config['font_size_min'], step 2)
    until the wrapped text fits inside the configured text box.  Saves the
    result as reddit_card_composite.png in ``output_dir``.

    Returns:
        Path to the saved composite PNG.

    Raises:
        Exception: wrapping any PIL/font/file error with context.
    """
    def _load_font(size):
        # Try the bundled fonts first, then a system Verdana, then PIL's
        # built-in default (which ignores `size` but never fails).
        script_dir = os.path.dirname(os.path.abspath(__file__))
        search_paths = [
            os.path.join(script_dir, 'fonts', config['font_file']),
            os.path.join(script_dir, config['font_file']),
        ]
        for path in search_paths:
            if os.path.exists(path):
                try:
                    return ImageFont.truetype(path, size)
                except Exception:
                    pass
        try:
            return ImageFont.truetype('Verdana', size)
        except Exception:
            return ImageFont.load_default()

    try:
        template = Image.open(template_path).convert('RGBA')
        template_width, template_height = template.size
        draw = ImageDraw.Draw(template)

        text_box_width = int(template_width * config['text_box_width_percent'])
        text_box_height = int(template_height * config['text_box_height_percent'])

        # Wrapping does not depend on font size, so compute it once.
        wrapped_text = textwrap.fill(hook_text, width=config['text_wrap_width'])

        # Find the largest font size whose wrapped text fits the text box.
        # BUG FIX: the original fell back to the UNWRAPPED hook text at the
        # MAXIMUM size when no size fit; now the wrapped text is rendered at
        # font_size_min instead.
        chosen_size = config['font_size_min']
        for font_size in range(config['font_size_max'], config['font_size_min'] - 1, -2):
            font = _load_font(font_size)
            bbox = draw.multiline_textbbox((0, 0), wrapped_text, font=font,
                                           spacing=config['line_spacing'])
            if (bbox[2] - bbox[0]) <= text_box_width and (bbox[3] - bbox[1]) <= text_box_height:
                chosen_size = font_size
                break

        font = _load_font(chosen_size)
        bbox = draw.multiline_textbbox((0, 0), wrapped_text, font=font,
                                       spacing=config['line_spacing'])
        text_width = bbox[2] - bbox[0]
        text_height = bbox[3] - bbox[1]

        # Center horizontally and vertically, then nudge by the configured offset.
        x = (template_width - text_width) / 2
        y = (template_height - text_height) / 2 + config['y_offset']

        draw.multiline_text(
            (x, y),
            wrapped_text,
            fill=config['text_color'],
            font=font,
            spacing=config['line_spacing'],
            align='left'
        )

        output_path = os.path.join(output_dir, 'reddit_card_composite.png')
        template.save(output_path, 'PNG')

        return output_path
    except Exception as e:
        raise Exception(f"Failed to create Reddit card: {str(e)}")
307
+
308
def validate_and_get_file(uploaded_file, url_string, file_type, temp_dir):
    """Validate that only one input method is used and return the file path.

    Returns:
        (path, error) — exactly one of the two is None.
    """
    upload_given = uploaded_file is not None
    url_given = bool(url_string and url_string.strip())

    if not upload_given and not url_given:
        return None, f"❌ Please provide {file_type} either by upload or URL"

    if upload_given and url_given:
        return None, f"❌ Please use only ONE method for {file_type}: either upload OR URL (not both)"

    if upload_given:
        # File-like objects expose .name; plain path strings pass through.
        return getattr(uploaded_file, 'name', uploaded_file), None

    try:
        clean_url = url_string.strip()
        leaf = clean_url.split('/')[-1]

        if '.' not in leaf:
            # No extension in the URL tail: pick one from the file type.
            leaf += {'video': '.mp4', 'audio': '.wav', 'subtitle': '.srt'}.get(file_type, '.tmp')

        stamp = datetime.now().strftime("%Y%m%d_%H%M%S")
        saved = download_file_from_url(clean_url, temp_dir, f"{file_type}_{stamp}_{leaf}")
        return saved, None
    except Exception as e:
        return None, f"❌ Error downloading {file_type} from URL: {str(e)}"
341
+
342
def srt_time_to_ms(time_str):
    """Convert an SRT timestamp ("HH:MM:SS,mmm") to integer milliseconds."""
    clock, _, millis = time_str.strip().partition(',')
    h, m, s = (int(part) for part in clock.split(':'))
    return ((h * 60 + m) * 60 + s) * 1000 + int(millis)
349
+
350
def ms_to_ass_time(ms):
    """Convert milliseconds to ASS timestamp format (H:MM:SS.cc)."""
    total_seconds, remainder_ms = divmod(ms, 1000)
    total_minutes, seconds = divmod(total_seconds, 60)
    hours, minutes = divmod(total_minutes, 60)
    centiseconds = remainder_ms // 10
    return f"{hours}:{minutes:02d}:{seconds:02d}.{centiseconds:02d}"
359
+
360
def create_word_by_word_highlight_ass(srt_path, output_dir, highlight_color='yellow',
                                      font_size=None, skip_first=False, config=SUBTITLE_CONFIG):
    """Convert SRT to ASS with word-by-word highlighting.

    Each SRT cue becomes one ASS Dialogue event per word: the cue duration is
    divided evenly across its words and the active word is restyled inline
    (colour + thick outline).  Returns the path to the generated .ass file.

    Args:
        srt_path: input .srt file (UTF-8).
        output_dir: directory receiving word_highlight_subtitles.ass.
        highlight_color: key into the colour map; unknown names fall back
            to the yellow scheme.
        font_size: subtitle size; defaults to config['font_size_default'].
        skip_first: drop the first cue (it is shown as the Reddit card).
        config: style settings (font name, alignment, margins).
    """
    if font_size is None:
        font_size = config['font_size_default']

    # Pairs in ASS &HAABBGGRR (blue-green-red) notation, applied below as
    # (\3c outline, \c fill).  NOTE(review): the pair ordering is not uniform
    # across entries (e.g. 'yellow' = black outline / yellow text, 'orange' =
    # orange outline / black text) — presumably intentional styling; confirm.
    color_map = {
        'yellow': ('&H00000000', '&H0000FFFF'),
        'orange': ('&H0000A5FF', '&H00000000'),
        'green': ('&H0000FF00', '&H00000000'),
        'cyan': ('&H00FFFF00', '&H00000000'),
        'pink': ('&H00FF69B4', '&H00000000'),
        'red': ('&H000000FF', '&H00FFFFFF'),
        'blue': ('&H00FF0000', '&H00FFFFFF'),
    }

    highlight_bg, highlight_text = color_map.get(highlight_color.lower(), ('&H00000000', '&H0000FFFF'))

    with open(srt_path, 'r', encoding='utf-8') as f:
        srt_content = f.read()

    ass_path = os.path.join(output_dir, 'word_highlight_subtitles.ass')

    ass_header = f"""[Script Info]
Title: Word-by-Word Highlight Subtitles
ScriptType: v4.00+
Collisions: Normal
PlayDepth: 0
[V4+ Styles]
Format: Name, Fontname, Fontsize, PrimaryColour, SecondaryColour, OutlineColour, BackColour, Bold, Italic, Underline, StrikeOut, ScaleX, ScaleY, Spacing, Angle, BorderStyle, Outline, Shadow, Alignment, MarginL, MarginR, MarginV, Encoding
Style: Default,{config['font_name']},{font_size},&H00FFFFFF,&H00FFFFFF,&H00000000,&H80000000,0,0,0,0,100,100,0,0,1,3,1,{config['position_alignment']},{config['margin_left']},{config['margin_right']},{config['margin_vertical']},1
[Events]
Format: Layer, Start, End, Style, Name, MarginL, MarginR, MarginV, Effect, Text
"""

    # SRT cues are separated by blank lines.
    srt_blocks = re.split(r'\n\s*\n', srt_content.strip())
    ass_events = []
    start_index = 1 if skip_first else 0

    for block in srt_blocks[start_index:]:
        lines = block.strip().split('\n')
        if len(lines) >= 3:
            timestamp_line = lines[1]
            times = timestamp_line.split(' --> ')
            if len(times) == 2:
                start_ms = srt_time_to_ms(times[0])
                end_ms = srt_time_to_ms(times[1])

                text = ' '.join(lines[2:])
                words = text.split()

                if not words:
                    continue

                # Spread the cue's duration evenly across its words.
                total_duration = end_ms - start_ms
                time_per_word = total_duration / len(words)

                for i, word in enumerate(words):
                    word_start_ms = start_ms + int(i * time_per_word)
                    word_end_ms = start_ms + int((i + 1) * time_per_word)

                    # Snap the last word to the cue end to avoid rounding gaps.
                    if i == len(words) - 1:
                        word_end_ms = end_ms

                    # Restyle only the active word; {\r} resets to Default style.
                    text_parts = []
                    for j, w in enumerate(words):
                        if j == i:
                            text_parts.append(f"{{\\c{highlight_text}\\3c{highlight_bg}\\bord5}}{w}{{\\r}}")
                        else:
                            text_parts.append(w)

                    styled_text = ' '.join(text_parts)
                    start_time = ms_to_ass_time(word_start_ms)
                    end_time = ms_to_ass_time(word_end_ms)

                    ass_line = f"Dialogue: 0,{start_time},{end_time},Default,,0,0,0,,{styled_text}"
                    ass_events.append(ass_line)

    with open(ass_path, 'w', encoding='utf-8') as f:
        f.write(ass_header)
        f.write('\n'.join(ass_events))

    return ass_path
443
+
444
def stitch_media(
    video_file, video_url,
    audio_file, audio_url,
    subtitle_file, subtitle_url,
    book_id,
    enable_highlight,
    highlight_color,
    font_size,
    crf_quality=23
):
    """Main video stitching function with Reddit overlay and book cover.

    Pipeline:
      1. Resolve each input (upload path or URL download) into a fresh temp dir.
      2. Optionally render the first subtitle onto the Reddit template and
         overlay it during the first cue's time window.
      3. Optionally convert the SRT to word-by-word highlighted ASS.
      4. With a Google Books ID: encode a main segment that fades to a solid
         colour, a solid-colour hold, and a book-cover fade-in segment, then
         concat + burn subtitles + mux audio.  Without one: single-pass encode.

    Returns:
        (output_path, status_message) on success, (None, error_message) on
        failure.  The output file lives inside the temp dir (not cleaned up
        here — the caller serves/downloads it).
    """
    temp_dir = tempfile.mkdtemp()

    try:
        # Point fontconfig at bundled fonts so libass can resolve them.
        ffmpeg_env = setup_custom_fonts_hf(temp_dir)

        video_path, video_error = validate_and_get_file(video_file, video_url, 'video', temp_dir)
        if video_error: return None, video_error

        audio_path, audio_error = validate_and_get_file(audio_file, audio_url, 'audio', temp_dir)
        if audio_error: return None, audio_error

        subtitle_path, subtitle_error = validate_and_get_file(subtitle_file, subtitle_url, 'subtitle', temp_dir)
        if subtitle_error: return None, subtitle_error

        video_width, video_height, video_fps = get_video_info(video_path)
        # Audio drives the final length (encodes use -shortest).
        audio_duration = get_audio_duration(audio_path)

        status_msg = "📥 Processing files:\n"
        status_msg += f" • Video: {'URL' if video_url else 'Upload'} ({video_width}x{video_height} @ {video_fps:.2f}fps)\n"
        status_msg += f" • Audio: {'URL' if audio_url else 'Upload'} ({audio_duration:.2f}s)\n"
        status_msg += f" • Subtitle: {'URL' if subtitle_url else 'Upload'}\n"

        script_dir = os.path.dirname(os.path.abspath(__file__))
        reddit_template_path = os.path.join(script_dir, REDDIT_CONFIG['template_file'])
        has_reddit_template = os.path.exists(reddit_template_path)

        if has_reddit_template:
            status_msg += " • Reddit template: ✅ Found\n"
            try:
                first_sub_text, first_sub_start, first_sub_end = extract_first_subtitle(subtitle_path)
                status_msg += "\n📱 Reddit Overlay:\n"
                status_msg += f" • Text: '{first_sub_text[:40]}...'\n"
                status_msg += f" • Timing: {first_sub_start:.1f}s - {first_sub_end:.1f}s\n"

                reddit_card_path = create_reddit_card_with_text(
                    reddit_template_path, first_sub_text, temp_dir, REDDIT_CONFIG
                )
                status_msg += " • ✅ Reddit card ready\n"
            except Exception as e:
                # Card rendering is best-effort; fall back to plain subtitles.
                status_msg += f" • ⚠️ Reddit card failed: {str(e)}\n"
                has_reddit_template = False
        else:
            status_msg += " • Reddit template: ⚠️ Not found (skipping)\n"

        if enable_highlight:
            status_msg += f"\n✨ Word highlighting: {highlight_color} ({font_size}px)\n"
            # Skip the first cue when it is shown as the Reddit card instead.
            subtitle_to_use = create_word_by_word_highlight_ass(
                subtitle_path, temp_dir, highlight_color, font_size,
                skip_first=has_reddit_template, config=SUBTITLE_CONFIG
            )
        else:
            subtitle_to_use = subtitle_path

        # Escape for use inside an ffmpeg filter argument.
        subtitle_escaped = subtitle_to_use.replace('\\', '/').replace(':', '\\:')

        has_book_cover = book_id and book_id.strip()
        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
        output_path = os.path.join(temp_dir, f"final_{timestamp}.mp4")

        r, g, b = VIDEO_CONFIG['fade_color_rgb']
        # BUG FIX: was the hard-coded literal "#dacfc3", silently ignoring
        # VIDEO_CONFIG['fade_color_rgb']; derive the hex from the config
        # (identical output for the default (218, 207, 195)).
        fade_color_hex = f"#{r:02x}{g:02x}{b:02x}"

        if has_book_cover:
            status_msg += f"\n📚 Downloading book cover (ID: {book_id})...\n"
            try:
                book_cover_path = download_book_cover(book_id.strip(), temp_dir)
                status_msg += "✅ Book cover downloaded\n"

                # Timeline (fractions of the audio duration):
                #   0 → fade_start : looping background video
                #   fade_start → fade_end : fade to the solid colour
                #   fade_end → (1 - promo) : solid colour hold
                #   (1 - promo) → end : book cover fades in and holds
                fade_starts_at = audio_duration * VIDEO_CONFIG['fade_start_percent']
                fade_ends_at = audio_duration * VIDEO_CONFIG['fade_end_percent']
                fade_out_duration = fade_ends_at - fade_starts_at

                promo_duration = audio_duration * VIDEO_CONFIG['promo_percent']
                book_appears_at = audio_duration - promo_duration
                solid_color_duration = book_appears_at - fade_ends_at

                main_video_duration = fade_ends_at
                cover_segment_duration = promo_duration

                status_msg += f"\n⏱️ Timing: Fade {fade_starts_at:.1f}→{fade_ends_at:.1f}s, Hold {solid_color_duration:.1f}s\n"

                status_msg += "🎬 Step 1/4: Main video with fade-out...\n"
                main_segment_path = os.path.join(temp_dir, f"main_{timestamp}.mp4")
                cmd_main = [
                    "ffmpeg", "-stream_loop", "-1", "-i", video_path, "-t", str(main_video_duration),
                    "-vf", f"fps={video_fps},scale={video_width}:{video_height},fade=t=out:st={fade_starts_at}:d={fade_out_duration}:c={fade_color_hex}",
                    "-c:v", "libx264", "-crf", str(crf_quality), "-pix_fmt", "yuv420p", "-an", "-y", main_segment_path
                ]
                subprocess.run(cmd_main, check=True, capture_output=True, text=True, env=ffmpeg_env)

                status_msg += "✅ Step 1 done\n🎬 Step 2/4: Solid color...\n"
                solid_color_path = os.path.join(temp_dir, f"solid_{timestamp}.mp4")
                cmd_solid = [
                    "ffmpeg", "-f", "lavfi",
                    "-i", f"color=c={fade_color_hex}:s={video_width}x{video_height}:d={solid_color_duration}:r={video_fps}",
                    "-c:v", "libx264", "-crf", str(crf_quality), "-pix_fmt", "yuv420p", "-y", solid_color_path
                ]
                subprocess.run(cmd_solid, check=True, capture_output=True, text=True, env=ffmpeg_env)

                status_msg += "✅ Step 2 done\n🎬 Step 3/4: Cover with fade-in...\n"
                cover_segment_path = os.path.join(temp_dir, f"cover_{timestamp}.mp4")
                cmd_cover = [
                    "ffmpeg", "-loop", "1", "-i", book_cover_path, "-t", str(cover_segment_duration),
                    "-vf", f"scale={video_width}:{video_height},setsar=1,fps={video_fps},fade=t=in:st=0:d={VIDEO_CONFIG['book_fade_in_duration']}:c={fade_color_hex}",
                    "-c:v", "libx264", "-crf", str(crf_quality), "-pix_fmt", "yuv420p", "-an", "-y", cover_segment_path
                ]
                subprocess.run(cmd_cover, check=True, capture_output=True, text=True, env=ffmpeg_env)

                status_msg += "✅ Step 3 done\n🎬 Step 4/4: Final assembly...\n"
                concat_list_path = os.path.join(temp_dir, f"concat_{timestamp}.txt")
                with open(concat_list_path, 'w') as f:
                    f.write(f"file '{main_segment_path}'\n")
                    f.write(f"file '{solid_color_path}'\n")
                    f.write(f"file '{cover_segment_path}'\n")

                if has_reddit_template:
                    # Burn subtitles first, then overlay the Reddit card
                    # (scaled to a fraction of the video width) only during
                    # the first cue's time window.
                    filter_complex = (
                        f"[0:v]ass={subtitle_escaped}[bg];"
                        f"[1:v]scale={video_width}*{VIDEO_CONFIG['reddit_scale_percent']}:-1[reddit];"
                        f"[bg][reddit]overlay=(W-w)/2:(H-h)/2:enable='between(t,{first_sub_start},{first_sub_end})'[v]"
                    )
                    cmd_final = [
                        "ffmpeg", "-f", "concat", "-safe", "0", "-i", concat_list_path,
                        "-loop", "1", "-i", reddit_card_path, "-i", audio_path,
                        "-filter_complex", filter_complex, "-map", "[v]", "-map", "2:a",
                        "-c:v", "libx264", "-crf", str(crf_quality), "-c:a", "aac",
                        "-pix_fmt", "yuv420p", "-shortest", "-y", output_path
                    ]
                else:
                    cmd_final = [
                        "ffmpeg", "-f", "concat", "-safe", "0", "-i", concat_list_path, "-i", audio_path,
                        "-vf", f"ass={subtitle_escaped}", "-map", "0:v", "-map", "1:a",
                        "-c:v", "libx264", "-crf", str(crf_quality), "-c:a", "aac",
                        "-pix_fmt", "yuv420p", "-shortest", "-y", output_path
                    ]

                subprocess.run(cmd_final, check=True, capture_output=True, text=True, env=ffmpeg_env)

            except subprocess.CalledProcessError as e:
                return None, f"❌ FFmpeg error:\n{e.stderr[-1000:] if e.stderr else str(e)}"
            except Exception as e:
                return None, f"❌ Error: {str(e)}"

        else:
            status_msg += "\n🎬 Creating video...\n"

            if has_reddit_template:
                filter_complex = (
                    f"[0:v]ass={subtitle_escaped}[bg];"
                    f"[1:v]scale={video_width}*{VIDEO_CONFIG['reddit_scale_percent']}:-1[reddit];"
                    f"[bg][reddit]overlay=(W-w)/2:(H-h)/2:enable='between(t,{first_sub_start},{first_sub_end})'[v]"
                )
                cmd = [
                    "ffmpeg", "-stream_loop", "-1", "-i", video_path,
                    "-loop", "1", "-i", reddit_card_path, "-i", audio_path,
                    "-filter_complex", filter_complex, "-map", "[v]", "-map", "2:a",
                    "-c:v", "libx264", "-crf", str(crf_quality), "-c:a", "aac",
                    "-shortest", "-y", output_path
                ]
            else:
                cmd = [
                    "ffmpeg", "-stream_loop", "-1", "-i", video_path, "-i", audio_path,
                    "-vf", f"ass={subtitle_escaped}", "-map", "0:v", "-map", "1:a",
                    "-c:v", "libx264", "-crf", str(crf_quality), "-c:a", "aac",
                    "-shortest", "-y", output_path
                ]

            try:
                subprocess.run(cmd, check=True, capture_output=True, text=True, env=ffmpeg_env)
            except subprocess.CalledProcessError as e:
                return None, f"❌ FFmpeg error:\n{e.stderr[-1000:] if e.stderr else str(e)}"

        if os.path.exists(output_path):
            file_size = os.path.getsize(output_path) / (1024 * 1024)
            success_msg = "✅ Video created successfully!\n\n"
            success_msg += f"📊 Size: {file_size:.2f} MB | Duration: {audio_duration:.2f}s\n"
            success_msg += f"🎨 Quality: CRF {crf_quality} | FPS: {video_fps:.2f}\n"
            if has_reddit_template:
                success_msg += f"📱 Reddit: ✅ ({first_sub_start:.1f}-{first_sub_end:.1f}s)\n"
            if has_book_cover:
                # BUG FIX: percentages were hard-coded as 60/75/90 and
                # disagreed with VIDEO_CONFIG (70/83/90); report the
                # configured values instead.
                fade_pct = round(VIDEO_CONFIG['fade_start_percent'] * 100)
                hold_pct = round(VIDEO_CONFIG['fade_end_percent'] * 100)
                book_pct = round((1 - VIDEO_CONFIG['promo_percent']) * 100)
                success_msg += f"📚 Book: ✅ (Fade: {fade_pct}→{hold_pct}%, Hold: {hold_pct}→{book_pct}%, Book: {book_pct}→100%)\n"
            success_msg += "\n" + status_msg
            return output_path, success_msg
        else:
            return None, "❌ Output file was not created"

    except Exception as e:
        return None, f"❌ Error: {str(e)}"
643
+
644
+
645
# ========================================
# FastAPI app
# ========================================
app = FastAPI(title="Video Stitcher API")

# NOTE(review): allow_origins=["*"] together with allow_credentials=True is an
# invalid combination per the CORS spec (a wildcard origin cannot be sent with
# credentials); Starlette works around it by echoing the request origin.
# Confirm whether credentialed cross-origin requests are actually required.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)
657
+
658
+ # ========================================
659
+ # RESPONSE MODELS
660
+ # ========================================
661
+
662
class StitchQueuedResponse(BaseModel):
    """Acknowledgement returned by POST /video_stitch when a job is queued.

    NOTE(review): `example=` on Field is the pydantic-v1 keyword; under
    pydantic v2 it is deprecated in favour of `json_schema_extra` — confirm
    the installed pydantic version.
    """
    job_id: str = Field(..., example="3cecd6e6-6920-474c-b924-aa9f174c0bd0")
    status: str = Field(..., example="queued")
    message: str = Field(..., example="Job queued. Poll /status/{job_id} for updates.")
    status_endpoint: str = Field(..., example="http://0.0.0.0:7860/status/3cecd6e6-6920-474c-b924-aa9f174c0bd0")
    result_endpoint: str = Field(..., example="http://0.0.0.0:7860/result/3cecd6e6-6920-474c-b924-aa9f174c0bd0")
668
+
669
class StitchErrorResponse(BaseModel):
    """Error payload documented for the 500 response of /video_stitch."""
    job_id: str = Field(..., example="3cecd6e6-6920-474c-b924-aa9f174c0bd0")
    status: str = Field(..., example="failed")
    message: str = Field(..., example="❌ Error downloading video from URL: Connection timeout")
    run_time: str = Field(..., example="2m 15s")
674
+
675
class StatusResponse(BaseModel):
    """Progress snapshot returned by GET /status/{job_id}."""
    job_id: str = Field(..., example="3cecd6e6-6920-474c-b924-aa9f174c0bd0")
    status: str = Field(..., example="processing")
    message: str = Field(..., example="Processing files...")
679
+
680
class ResultCompletedResponse(BaseModel):
    """Payload returned by GET /result/{job_id} once a job has completed."""
    job_id: str = Field(..., example="3cecd6e6-6920-474c-b924-aa9f174c0bd0")
    status: str = Field(..., example="completed")
    message: str = Field(..., example="✅ Video created successfully!")
    download_endpoint: str = Field(..., example="http://0.0.0.0:7860/download/3cecd6e6-6920-474c-b924-aa9f174c0bd0")
    result_file: str = Field(..., example="final_20260219_210606.mp4")
    file_ready: bool = Field(..., example=True)
    run_time: str = Field(..., example="5m 42s")

# In-memory job store: job_id -> {'status', 'message', 'result', timing fields}.
# NOTE(review): not shared across worker processes and never pruned — entries
# (and their temp dirs on disk) accumulate for the lifetime of the process.
JOBS: dict = {}
691
+
692
+
693
+ def _save_upload_to_temp(upload_file: UploadFile, temp_dir: str) -> str:
694
+ filename = os.path.basename(upload_file.filename)
695
+ dest_path = os.path.join(temp_dir, filename)
696
+ with open(dest_path, 'wb') as f:
697
+ f.write(upload_file.file.read())
698
+ return dest_path
699
+
700
+
701
def _run_stitch_job(job_id: str, payload: dict):
    """Background worker — runs in a thread pool, not the async event loop.

    Executes stitch_media with the queued payload and records progress,
    result path, and a formatted runtime in the shared JOBS store.
    """
    def _format_runtime(elapsed: float) -> str:
        whole = int(elapsed)
        return f"{whole // 60}m {whole % 60}s"

    try:
        started = time.time()
        JOBS[job_id]['status'] = 'processing'
        JOBS[job_id]['start_time'] = started

        result_path, message = stitch_media(
            payload.get('video_file'), payload.get('video_url'),
            payload.get('audio_file'), payload.get('audio_url'),
            payload.get('subtitle_file'), payload.get('subtitle_url'),
            payload.get('book_id'), payload.get('enable_highlight', True),
            payload.get('highlight_color', 'yellow'), payload.get('font_size', 18),
            payload.get('crf_quality', 23)
        )

        finished = time.time()
        outcome = {
            'end_time': finished,
            'run_time': _format_runtime(finished - started),
        }
        if result_path:
            outcome.update(status='completed', result=result_path, message=message)
        else:
            outcome.update(status='failed', message=message)
        JOBS[job_id].update(outcome)
    except Exception as e:
        finished = time.time()
        elapsed = finished - JOBS[job_id].get('start_time', finished)
        JOBS[job_id].update({
            'status': 'failed',
            'message': str(e),
            'end_time': finished,
            'run_time': _format_runtime(elapsed),
        })
745
+
746
+
747
@app.post(
    '/video_stitch',
    response_model=StitchQueuedResponse,
    responses={500: {"model": StitchErrorResponse}},
    summary="Submit a video stitching job",
    description=(
        "Accepts video, audio, and subtitle inputs (as file uploads or URLs). "
        "Returns a job_id immediately. Poll `/status/{job_id}` to track progress, "
        "then use `/result/{job_id}` or `/download/{job_id}` when complete."
    ),
)
async def stitch_upload(
    request: Request,
    video_file: Optional[UploadFile] = File(None),
    audio_file: Optional[UploadFile] = File(None),
    subtitle_file: Optional[UploadFile] = File(None),
    video_url: Optional[str] = Form(None),
    audio_url: Optional[str] = Form(None),
    subtitle_url: Optional[str] = Form(None),
    book_id: Optional[str] = Form(None),
    enable_highlight: bool = Form(True),
    highlight_color: str = Form('yellow'),
    # NOTE(review): default 12 here but the worker's fallback is 18; this value
    # is always sent so 12 wins — confirm which default is intended.
    font_size: int = Form(12),
    crf_quality: int = Form(23),
):
    """Queue a stitching job and return its id without waiting for the work.

    Uploaded files are spooled into a fresh temp directory so the background
    worker can read them after this request has returned. The heavy lifting
    happens in `_run_stitch_job` on the thread-pool executor; callers poll
    `/status/{job_id}` and fetch output via `/result/{job_id}`.

    Raises:
        HTTPException(500): if saving the uploads or queueing the job fails.
    """
    import shutil  # local import: only needed for failure cleanup

    temp_dir = tempfile.mkdtemp()
    payload = {
        'video_file': None,
        'audio_file': None,
        'subtitle_file': None,
        'video_url': video_url,
        'audio_url': audio_url,
        'subtitle_url': subtitle_url,
        'book_id': book_id,
        'enable_highlight': enable_highlight,
        'highlight_color': highlight_color,
        'font_size': font_size,
        'crf_quality': crf_quality,
    }

    try:
        if video_file is not None:
            payload['video_file'] = _save_upload_to_temp(video_file, temp_dir)
        if audio_file is not None:
            payload['audio_file'] = _save_upload_to_temp(audio_file, temp_dir)
        if subtitle_file is not None:
            payload['subtitle_file'] = _save_upload_to_temp(subtitle_file, temp_dir)

        job_id = str(uuid.uuid4())
        # Register the job before submitting so /status never 404s on a live id.
        JOBS[job_id] = {'status': 'queued', 'message': 'Job queued, waiting to start.', 'result': None}

        # Submit to a background thread — the request returns immediately,
        # avoiding reverse-proxy timeouts on long encodes.
        executor.submit(_run_stitch_job, job_id, payload)

        base_url = str(request.base_url).rstrip('/')
        return JSONResponse({
            'job_id': job_id,
            'status': 'queued',
            'message': 'Job queued. Poll /status/{job_id} for updates.',
            'status_endpoint': f"{base_url}/status/{job_id}",
            'result_endpoint': f"{base_url}/result/{job_id}",
        })

    except Exception as e:
        # The job never made it onto the queue — reclaim the temp directory
        # instead of leaking it (previously left behind on every failure).
        shutil.rmtree(temp_dir, ignore_errors=True)
        raise HTTPException(status_code=500, detail=str(e))
812
+
813
+
814
@app.get('/status/{job_id}', response_model=StatusResponse, summary="Check job status")
async def job_status(job_id: str):
    """Report the lifecycle state of a previously submitted stitching job.

    Returns 404 for unknown job ids; otherwise echoes the job's current
    'status' and latest 'message' from the in-memory store.
    """
    if not (job := JOBS.get(job_id)):
        raise HTTPException(status_code=404, detail='Job not found')
    return {
        'job_id': job_id,
        'status': job['status'],
        'message': job.get('message', ''),
    }
820
+
821
+
822
@app.get(
    '/result/{job_id}',
    responses={
        200: {"model": ResultCompletedResponse, "description": "Job completed — includes download link"},
        202: {"description": "Job still processing"},
        404: {"description": "Job not found"},
    },
    summary="Get job result (includes download link when complete)",
)
async def job_result(job_id: str, request: Request):
    """Return the job outcome; completed jobs include download metadata.

    Status codes: 200 for terminal states (completed or failed), 202 while
    the job is still queued/processing, 404 for unknown ids.
    """
    job = JOBS.get(job_id)
    if not job:
        raise HTTPException(status_code=404, detail='Job not found')

    state = job['status']
    body: dict = {
        'job_id': job_id,
        'status': state,
        'message': job.get('message', ''),
    }

    in_flight = state in ('queued', 'processing')
    if state == 'completed' and job.get('result'):
        # Enrich terminal-success responses with download details.
        root = str(request.base_url).rstrip('/')
        body['download_endpoint'] = f"{root}/download/{job_id}"
        body['result_file'] = os.path.basename(job['result'])
        body['file_ready'] = True
        body['run_time'] = job.get('run_time', 'N/A')

    return JSONResponse(body, status_code=202 if in_flight else 200)
855
+
856
+
857
@app.get('/download/{job_id}', summary="Download the completed video")
async def download_result(job_id: str):
    """Stream the finished MP4 for a completed job.

    404 for unknown ids; 400 while the job has not produced a result yet.
    """
    job = JOBS.get(job_id)
    if not job:
        raise HTTPException(status_code=404, detail='Job not found')

    ready = job['status'] == 'completed' and job.get('result')
    if not ready:
        raise HTTPException(status_code=400, detail='Result not yet available')

    output_path = job['result']
    return FileResponse(
        output_path,
        media_type='video/mp4',
        filename=os.path.basename(output_path),
    )
869
+
870
+
871
@app.get('/health', summary="Health check")
async def health():
    """Liveness probe; also reports how many job records are held in memory."""
    return {"status": "ok", "jobs_in_memory": len(JOBS)}
requirements.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ fastapi==0.115.0
2
+ uvicorn[standard]==0.30.6
3
+ static-ffmpeg==2.5
4
+ Pillow==10.4.0
5
+ requests==2.32.3
6
+ aiofiles==23.2.1
7
+ python-multipart==0.0.9
8
+ pydantic==2.8.2