Spaces:

suprimedev
/

hfvd

Sleeping

App Files Files Community

suprimedev committed on Nov 5, 2025

Commit

39512db

verified ·

1 Parent(s): 901e3e9

Update app.py

Browse files

Files changed (1) hide show

app.py +77 -80

app.py CHANGED Viewed

@@ -7,23 +7,17 @@ import speech_recognition as sr
 from pydub import AudioSegment
 import time
 import warnings
-import json
 from datetime import datetime, timedelta
 import threading
 import hashlib
-from fastapi import FastAPI
-from fastapi.responses import JSONResponse
 warnings.filterwarnings("ignore")
-# ذخیره‌سازی نتایج (متن همیشه ذخیره می‌شود)
 results_cache = {}
 cache_lock = threading.Lock()
-# FastAPI instance برای API endpoints
-app = FastAPI()
-# تابع برای پاکسازی cache قدیمی (بهبود: فقط event_idهای کامل‌شده و قدیمی را پاک کن)
 def cleanup_old_cache():
     while True:
         time.sleep(3600)  # هر ساعت
@@ -40,7 +34,8 @@ def cleanup_old_cache():
                         except:
                             pass
             for event_id in keys_to_remove:
-                del results_cache[event_id]
             if keys_to_remove:
                 print(f"[CACHE] {len(keys_to_remove)} event_id قدیمی پاک شد.")
@@ -48,12 +43,12 @@ cleanup_thread = threading.Thread(target=cleanup_old_cache, daemon=True)
 cleanup_thread.start()
 def get_event_id(video_url, language):
-    """ایجاد event_id یکتا (قبلاً cache_key)"""
     return hashlib.md5(f"{video_url}_{language}".encode()).hexdigest()
 def save_result_to_cache(event_id, video_url, language, mp3_path, text, status_msg, processing=False):
     """ذخیره نتیجه در cache (متن همیشه ذخیره می‌شود)"""
-    # کپی فایل MP3 به مکان دائمی اگر موجود باشد
     cache_mp3_path = None
     if mp3_path and os.path.exists(mp3_path):
         cache_mp3_path = f"cache_{event_id}.mp3"
@@ -63,7 +58,7 @@ def save_result_to_cache(event_id, video_url, language, mp3_path, text, status_m
         results_cache[event_id] = {
             'timestamp': datetime.now(),
             'mp3_path': cache_mp3_path,
-            'text': text,  # متن همیشه ذخیره می‌شود (حتی اگر None باشد)
             'status_msg': status_msg,
             'video_url': video_url,
             'language': language,
@@ -82,8 +77,30 @@ def get_result_from_cache(event_id):
             return result
     return None
 def convert_to_mp3_and_transcribe_wrapper(video_url, language):
-    """Wrapper function که event_id را در ابتدا برمی‌گرداند"""
     if not video_url:
         return None, None, "لینک ویدیو را وارد کنید.", None
@@ -105,7 +122,7 @@ def convert_to_mp3_and_transcribe_wrapper(video_url, language):
     # ثبت شروع پردازش
     save_result_to_cache(event_id, video_url, language, None, None, "در حال پردازش...", processing=True)
-    # پردازش در background (برای سادگی، همینجا انجام می‌دهیم - در production async کنید)
     mp3_path, text, status_msg = convert_to_mp3_and_transcribe(video_url, language)
     save_result_to_cache(event_id, video_url, language, mp3_path, text, status_msg, processing=False)
@@ -120,7 +137,7 @@ def convert_to_mp3_and_transcribe(video_url, language):
         progress(0, desc="شروع دانلود...")
-        # دانلود و تبدیل به MP3
         ydl_opts = {
             'format': 'bestaudio[ext=m4a]/bestaudio/best',
             'postprocessors': [{
@@ -149,7 +166,7 @@ def convert_to_mp3_and_transcribe(video_url, language):
         progress(0.3, desc="دانلود کامل. کپی MP3...")
-        # کپی به موقت
         temp_mp3 = tempfile.NamedTemporaryFile(suffix='.mp3', delete=False)
         temp_mp3.close()
         shutil.copy2(mp3_file, temp_mp3.name)
@@ -177,7 +194,7 @@ def language_display(lang_code):
     return "پارسی" if lang_code == 'fa-IR' else "انگلیسی" if lang_code == 'en-US' else lang_code
 def transcribe_audio(mp3_path, progress, language, chunk_length_ms=60000, overlap_ms=5000):
-    """استخراج متن - کد قبلی شما"""
     recognizer = sr.Recognizer()
     recognizer.energy_threshold = 300
     recognizer.dynamic_energy_threshold = True
@@ -274,74 +291,54 @@ def transcribe_audio(mp3_path, progress, language, chunk_length_ms=60000, overla
     return final_text, ""
-# API endpoints (بهبود: event_id به جای cache_key، و endpoint جدید برای لیست)
-@app.get("/api/check_result/{event_id}")
-async def check_result_api(event_id: str):
-    """API endpoint برای بررسی وضعیت نتیجه با event_id (متن اگر کامل شده برگردانده می‌شود)"""
-    result = get_result_from_cache(event_id)
-    if not result:
-        return JSONResponse({"status": 0, "message": "Event ID not found"})
-    if result['processing']:
-        return JSONResponse({"status": 0, "message": "Processing..."})
-    if result['completed']:
-        return JSONResponse({
-            "status": 1,
-            "event_id": event_id,
-            "text": result['text'],  # متن استخراج‌شده همیشه برگردانده می‌شود
-            "mp3_available": result['mp3_path'] is not None and os.path.exists(result['mp3_path']),
-            "status_message": result['status_msg'],
-            "timestamp": result['timestamp'].isoformat()
-        })
-    return JSONResponse({"status": 0, "message": "Unknown status"})
-@app.get("/api/list_events")
-async def list_events_api(limit: int = 10):
-    """API endpoint جدید: لیست event_idهای اخیر (برای مدیریت)"""
-    with cache_lock:
-        recent_events = sorted(
-            [(eid, data['timestamp']) for eid, data in results_cache.items() if data['completed']],
-            key=lambda x: x[1],
-            reverse=True
-        )[:limit]
-        return JSONResponse({
-            "events": [{"event_id": eid, "timestamp": ts.isoformat()} for eid, ts in recent_events]
-        })
-# رابط Gradio (بهبود: event_id برجسته‌تر)
-iface = gr.Interface(
-    fn=convert_to_mp3_and_transcribe_wrapper,
-    inputs=[
-        gr.Textbox(
-            label="لینک ویدیو",
-            placeholder="https://www.youtube.com/watch?v=..."
-        ),
-        gr.Dropdown(
-            choices=[("پارسی", "fa-IR"), ("انگلیسی", "en-US")],
-            value="fa-IR",
-            label="زبان"
         )
-    ],
-    outputs=[
-        gr.File(label="دانلود MP3"),
-        gr.Textbox(label="متن استخراج‌شده", lines=10),
-        gr.Textbox(label="وضعیت"),
-        gr.Textbox(label="Event ID (برای استعلام API)", visible=True, info="این ID را برای چک کردن نتیجه از API استفاده کنید: /api/check_result/{event_id}")
-    ],
-    title="تبدیل ویدیو به MP3 و متن (با ذخیره event_id)",
     examples=[
         ["https://www.youtube.com/watch?v=5qap5aO4i9A", "fa-IR"],
         ["https://www.youtube.com/watch?v=dQw4w9WgXcQ", "en-US"]
-    ]
 )
-# Mount FastAPI to Gradio
-from gradio import mount_gradio_app
-mount_gradio_app(app, iface, path="/")
-if __name__ == "__main__":
-    import uvicorn
-    uvicorn.run(app, host="0.0.0.0", port=7860)

 from pydub import AudioSegment
 import time
 import warnings
 from datetime import datetime, timedelta
 import threading
 import hashlib
 warnings.filterwarnings("ignore")
+# ذخیره‌سازی نتایج (متن همیشه ذخیره می‌شود - در حافظه Spaces موقت)
 results_cache = {}
 cache_lock = threading.Lock()
+# تابع برای پاکسازی cache قدیمی (هر ساعت، فقط event_idهای کامل‌شده قدیمی رو پاک کن)
 def cleanup_old_cache():
     while True:
         time.sleep(3600)  # هر ساعت
                         except:
                             pass
             for event_id in keys_to_remove:
+                if event_id in results_cache:
+                    del results_cache[event_id]
             if keys_to_remove:
                 print(f"[CACHE] {len(keys_to_remove)} event_id قدیمی پاک شد.")
 cleanup_thread.start()
 def get_event_id(video_url, language):
+    """Return the event ID: the MD5 hex digest of "<video_url>_<language>".
+
+    The same URL/language pair always produces the same ID.
+    """
     return hashlib.md5(f"{video_url}_{language}".encode()).hexdigest()
 def save_result_to_cache(event_id, video_url, language, mp3_path, text, status_msg, processing=False):
     """ذخیره نتیجه در cache (متن همیشه ذخیره می‌شود)"""
+    # کپی فایل MP3 به مکان دائمی اگر موجود باشد (در Spaces، فایل‌ها موقت هستن)
     cache_mp3_path = None
     if mp3_path and os.path.exists(mp3_path):
         cache_mp3_path = f"cache_{event_id}.mp3"
         results_cache[event_id] = {
             'timestamp': datetime.now(),
             'mp3_path': cache_mp3_path,
+            'text': text,  # متن استخراج‌شده همیشه ذخیره می‌شه (حتی None)
             'status_msg': status_msg,
             'video_url': video_url,
             'language': language,
             return result
     return None
+def check_event_id(event_id):
+    """Look up a cached result by event ID and report its text and status.
+
+    Args:
+        event_id: Cache key passed to get_result_from_cache. Surrounding
+            whitespace on a string ID (e.g. from copy/paste) is ignored.
+
+    Returns:
+        A (text, mp3_path, status) tuple. text is a user-facing message when
+        there is no transcript to show; mp3_path is None unless the cached
+        MP3 path is set and the file still exists on disk.
+    """
+    # A pasted ID with a stray space or newline would otherwise miss the
+    # cache and be reported as "not found".
+    if isinstance(event_id, str):
+        event_id = event_id.strip()
+    if not event_id:
+        return "Event ID را وارد کنید.", None, "نامشخص"
+    cached_result = get_result_from_cache(event_id)
+    if not cached_result:
+        return "Event ID یافت نشد.", None, "Not found"
+    if cached_result['processing']:
+        return "در حال پردازش... (صبر کنید)", None, "Processing"
+    if cached_result['completed']:
+        text = cached_result['text']
+        status = cached_result['status_msg']
+        mp3_path = cached_result['mp3_path']
+        # Only offer the MP3 if the cached file is still present on disk.
+        if not (mp3_path and os.path.exists(mp3_path)):
+            mp3_path = None
+        finished_at = cached_result['timestamp'].strftime('%Y-%m-%d %H:%M')
+        return (text if text else "متن استخراج نشد.",
+                mp3_path,
+                f"کامل: {status} (زمان: {finished_at})")
+    # Entry exists but is neither processing nor completed.
+    return "وضعیت نامشخص.", None, "Unknown"
 def convert_to_mp3_and_transcribe_wrapper(video_url, language):
+    """Wrapper اصلی: پردازش ویدیو و برگرداندن event_id"""
     if not video_url:
         return None, None, "لینک ویدیو را وارد کنید.", None
     # ثبت شروع پردازش
     save_result_to_cache(event_id, video_url, language, None, None, "در حال پردازش...", processing=True)
+    # پردازش (در Spaces، sync باشه چون async سخت‌تره)
     mp3_path, text, status_msg = convert_to_mp3_and_transcribe(video_url, language)
     save_result_to_cache(event_id, video_url, language, mp3_path, text, status_msg, processing=False)
         progress(0, desc="شروع دانلود...")
+        # دانلود و تبدیل به MP3 (در Spaces، yt_dlp کار می‌کنه اما محدودیت حجم داره)
         ydl_opts = {
             'format': 'bestaudio[ext=m4a]/bestaudio/best',
             'postprocessors': [{
         progress(0.3, desc="دانلود کامل. کپی MP3...")
+        # کپی به موقت (در Spaces، tempfile خوبه)
         temp_mp3 = tempfile.NamedTemporaryFile(suffix='.mp3', delete=False)
         temp_mp3.close()
         shutil.copy2(mp3_file, temp_mp3.name)
     return "پارسی" if lang_code == 'fa-IR' else "انگلیسی" if lang_code == 'en-US' else lang_code
 def transcribe_audio(mp3_path, progress, language, chunk_length_ms=60000, overlap_ms=5000):
+    """استخراج متن - بدون تغییر"""
     recognizer = sr.Recognizer()
     recognizer.energy_threshold = 300
     recognizer.dynamic_energy_threshold = True
     return final_text, ""
+# Gradio UI with two tabs: one processes a video, the other looks up an
+# event ID that an earlier run produced.
+with gr.Blocks(title="تبدیل ویدیو به MP3 و متن (Hugging Face Spaces)") as demo:
+    gr.Markdown("# تبدیل ویدیو یوتیوب به MP3 و متن استخراج‌شده\n\n- **تب 1**: پردازش ویدیو جدید (event_id تولید می‌شه).\n- **تب 2**: استعلام event_id برای گرفتن متن ذخیره‌شده.")
+    with gr.Tab("پردازش ویدیو"):
+        with gr.Row():
+            video_input = gr.Textbox(label="لینک ویدیو", placeholder="https://www.youtube.com/watch?v=...")
+            lang_input = gr.Dropdown(choices=[("پارسی", "fa-IR"), ("انگلیسی", "en-US")], value="fa-IR", label="زبان")
+        process_btn = gr.Button("پردازش")
+        with gr.Row():
+            mp3_output = gr.File(label="دانلود MP3")
+            text_output = gr.Textbox(label="متن استخراج‌شده", lines=10)
+        status_output = gr.Textbox(label="وضعیت")
+        event_id_output = gr.Textbox(label="Event ID (کپی کنید برای استعلام)", info="این ID رو در تب دوم وارد کنید یا از API استفاده کنید.")
+        process_btn.click(
+            fn=convert_to_mp3_and_transcribe_wrapper,
+            inputs=[video_input, lang_input],
+            outputs=[mp3_output, text_output, status_output, event_id_output]
+        )
+        # Examples for the first tab. They are created inside the Blocks
+        # context, next to the components they fill; created after the
+        # `with` block has closed they are not attached to the UI.
+        examples = gr.Examples(
+            examples=[
+                ["https://www.youtube.com/watch?v=5qap5aO4i9A", "fa-IR"],
+                ["https://www.youtube.com/watch?v=dQw4w9WgXcQ", "en-US"]
+            ],
+            inputs=[video_input, lang_input],
+            outputs=[mp3_output, text_output, status_output, event_id_output],
+            fn=convert_to_mp3_and_transcribe_wrapper
+        )
+    with gr.Tab("استعلام Event ID"):
+        event_id_input = gr.Textbox(label="Event ID را وارد کنید", placeholder="مثال: a1b2c3d4e5f6...")
+        check_btn = gr.Button("چک کن")
+        check_text = gr.Textbox(label="متن استخراج‌شده", lines=10)
+        check_mp3 = gr.File(label="دانلود MP3 (اگر موجود)")
+        check_status = gr.Textbox(label="وضعیت")
+        check_btn.click(
+            fn=check_event_id,
+            inputs=[event_id_input],
+            outputs=[check_text, check_mp3, check_status]
+        )
+        # The curl example contains double quotes; they are escaped so they do
+        # not terminate this double-quoted literal (unescaped, the module
+        # does not parse).
+        # NOTE(review): the endpoint path and `fn_index` payload shown to
+        # users depend on the installed Gradio version - confirm.
+        gr.Markdown("### API Usage (از خارج Spaces):\n- **پردازش ویدیو**: `POST /api/predict` با payload: `{'data': ['https://youtube.com/...', 'fa-IR']}` → خروجی شامل event_id.\n- **چک event_id**: `POST /api/predict` با payload: `{'fn_index': 1, 'data': ['event_id_here']}` → خروجی متن/وضعیت.\nمثال با curl: `curl -X POST https://your-space.hf.space/api/predict -H 'Content-Type: application/json' -d '{\"data\": [\"url\", \"lang\"]}'`")
+# Author's note: `demo` is intentionally not launched here because Spaces is
+# expected to handle it.
+# NOTE(review): confirm the Space actually starts without a launch() call.
+# demo.launch(share=True)  # local runs only; keep commented out on Spaces