Spaces:

Opera8
/

Sadarubikabot

Paused

App Files Community

Opera8 committed 12 days ago

Commit

d4fef3d

verified ·

1 Parent(s): 2e46f6e

Update main.py

Browse files

Files changed (1) hide show

main.py +84 -77

main.py CHANGED Viewed

@@ -2274,7 +2274,6 @@ def local_merge_videos(base_video_bytes, new_clip_bytes):
 async def helper_generate_image_for_video(prompt, action_name, width, height):
     headers = {"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64)"}
-    # تلاش برای ساخت تصویر تا ۳ بار در صورت برخورد با محدودیت
     for attempt in range(3):
         try:
             payload = {"prompt": prompt, "width": width, "height": height, "action_name": action_name}
@@ -2285,7 +2284,7 @@ async def helper_generate_image_for_video(prompt, action_name, width, height):
                         run_id = data.get("run_id")
                         if run_id:
                             waited = 0
-                            while waited < 100: # انتظار حداکثر ۱۰۰ ثانیه برای تصویر
                                 await asyncio.sleep(5)
                                 waited += 5
                                 try:
@@ -2301,58 +2300,6 @@ async def helper_generate_image_for_video(prompt, action_name, width, height):
         await asyncio.sleep(5)
     return None
-async def helper_optimize_video_prompt(image_bytes, user_prompt):
-    if not GEMINI_KEYS:
-        return None
-    master_prompt = """You are an expert AI Animation Planner. Your absolute highest priority is to faithfully and creatively execute the user's specific request based on the provided image.
-    1. If the user prompt is empty or generic (like "animate this"), add subtle, high-quality, believable cinematic motion (e.g., slow zoom, water flowing, wind in hair).
-    2. If the user gives specific directions, focus ENTIRELY on executing that command perfectly. If the action is not visible in-frame, use cinematic camera movements to reveal it.
-    3. You must output ONLY a highly detailed, descriptive animation prompt in ENGLISH. Do not translate literally; ENHANCE the prompt for a text-to-video AI model.
-    4. MUST Include keywords at the end: cinematic, photorealistic, high detail, smooth motion, 8k.
-    CRITICAL RULE: DO NOT say "Here is the prompt" or give any conversational explanations. DO NOT output JSON. Output ONLY the raw English animation prompt text and NOTHING ELSE."""
-    prompt_for_ai = user_prompt if user_prompt else "لطفاً این تصویر را به یک ویدیوی سینمایی بسیار جذاب و واقع‌گرایانه متحرک کن."
-    combined_prompt = f"{master_prompt}\n\nUser request: {prompt_for_ai}"
-    base64_data = base64.b64encode(image_bytes).decode('utf-8')
-    mime_type = "image/jpeg"
-    for attempt in range(2):
-        keys_to_try = get_next_gemini_keys(50)
-        async with aiohttp.ClientSession() as session:
-            for key in keys_to_try:
-                url = f"https://generativelanguage.googleapis.com/v1beta/models/gemini-2.5-flash:generateContent?key={key}"
-                payload = {
-                    "contents": [{
-                        "parts": [
-                            {"text": combined_prompt},
-                            {"inlineData": {"mimeType": mime_type, "data": base64_data}}
-                        ]
-                    }],
-                    "generationConfig": {"temperature": 0.7, "maxOutputTokens": 1024}
-                }
-                try:
-                    async with session.post(url, json=payload, timeout=20) as response:
-                        if response.status == 200:
-                            data = await response.json()
-                            try:
-                                enhanced_prompt = data["candidates"][0]["content"]["parts"][0]["text"]
-                                enhanced_prompt = enhanced_prompt.replace("```text", "").replace("```", "").replace("```json", "").strip()
-                                if "پردازش متوقف شد" in enhanced_prompt or "سهمیه سرور موقتاً پر شده" in enhanced_prompt:
-                                    continue
-                                return enhanced_prompt
-                            except (KeyError, IndexError):
-                                continue
-                except Exception:
-                    continue
-        await asyncio.sleep(2)
-    return None
 async def process_video_generation(client, chat_id, video_type, prompt, duration_int, image_bytes, txt_model_action=None, width=1024, height=1024):
     str_chat_id = str(chat_id).replace("`", "").replace("'", "").replace('"', "").strip()
     creds = get_user_credits(str_chat_id)
@@ -2374,12 +2321,63 @@ async def process_video_generation(client, chat_id, video_type, prompt, duration
     current_image_bytes = await asyncio.to_thread(force_jpeg, current_image_bytes)
-    # پرامپت هوشمند
-    proc_msg = await update_status_msg(client, chat_id, proc_msg, "🧠 در حال درک تصویر و بهینه‌سازی دستور (پرامپت) شما توسط هوش مصنوعی...")
-    eng_prompt = await helper_optimize_video_prompt(current_image_bytes, prompt)
     if eng_prompt:
-        proc_msg = await update_status_msg(client, chat_id, proc_msg, f"✅ دستور شما بهینه شد:\n\n`{eng_prompt}`\n\n🎬 در حال ارسال برای ساخت ویدیو نهایی...")
         await asyncio.sleep(3)
     else:
         try:
@@ -2388,18 +2386,27 @@ async def process_video_generation(client, chat_id, video_type, prompt, duration
         except:
             eng_prompt = "cinematic motion, photorealistic, high detail, smooth animation, 8k"
-    op_name = "متحرک‌سازی تصاویر" if video_type == "animate" else "ساخت ویدیو"
-    proc_msg = await update_status_msg(client, chat_id, proc_msg, f"🎬 عملیات {op_name} آغاز شد.\n⏱ زمان نهایی: {duration_int} ثانیه")
     for loop_idx in range(loops_needed):
         new_clip_bytes = None
-        step_text_base = f"🎬 بخش {loop_idx + 1} از {loops_needed}"
-        # تلاش مجدد تا ۳ بار برای هر رندر ۵ ثانیه‌ای
         for attempt in range(3):
             run_id = str(uuid.uuid4())
-            step_text = f"{step_text_base} (تلاش {attempt + 1}/3):\n"
-            proc_msg = await update_status_msg(client, chat_id, proc_msg, step_text + "۱. 📤 ارسال دستور مستقیم به اکشن‌های پردازشی...")
             input_filename = f"{run_id}_input.jpg"
             with open(f"static/images/{input_filename}", "wb") as f:
@@ -2407,8 +2414,6 @@ async def process_video_generation(client, chat_id, video_type, prompt, duration
             image_public_url = f"{RUBIKA_SPACE_URL}/static/images/{input_filename}"
-            dispatch_url = f"https://api.github.com/repos/{GITHUB_USER}/{GITHUB_REPO}/dispatches"
-            dispatch_headers = {"Accept": "application/vnd.github.v3+json", "Authorization": f"token {GITHUB_TOKEN}"}
             dispatch_payload = {
                 "event_type": "generate-video",
                 "client_payload": {
@@ -2423,15 +2428,18 @@ async def process_video_generation(client, chat_id, video_type, prompt, duration
             try:
                 resp = await asyncio.to_thread(requests.post, dispatch_url, headers=dispatch_headers, json=dispatch_payload, timeout=20)
                 if resp.status_code != 204:
-                    proc_msg = await update_status_msg(client, chat_id, proc_msg, f"❌ خطای گیت‌هاب در پذیرش دستور: {resp.text}")
                     await asyncio.sleep(4)
                     continue
-            except Exception as e:
-                proc_msg = await update_status_msg(client, chat_id, proc_msg, f"❌ خطای اتصال به اکشن: {str(e)[:50]}")
                 await asyncio.sleep(4)
                 continue
-            proc_msg = await update_status_msg(client, chat_id, proc_msg, step_text + "۲. ⏳ سرور در حال رندر می‌باشد.\n(در صورت شلوغی سرور و خطای سهمیه، ربات تا ۳ بار اکشن جدید ایجاد می‌کند. منتظر دریافت فایل...)")
             waited = 0
             while waited < 180: # انتظار تا 180 ثانیه (3 دقیقه)
@@ -2455,33 +2463,32 @@ async def process_video_generation(client, chat_id, video_type, prompt, duration
             if new_clip_bytes:
                 break
             else:
-                proc_msg = await update_status_msg(client, chat_id, proc_msg, step_text + "⚠️ محدودیت زمانی در رندر یا خطای ترافیک. ایجاد درخواست و اکشن جدید...")
                 await asyncio.sleep(5)
         if not new_clip_bytes:
-            return await update_status_msg(client, chat_id, proc_msg, "❌ پس از ۳ بار تلاش، زمان رندر بیش از حد مجاز طول کشید یا درخواست محدود شد. عملیات متوقف شد.")
         if base_video_bytes is not None:
-            proc_msg = await update_status_msg(client, chat_id, proc_msg, step_text_base + "\n۳. 🔄 در حال متصل کردن بخش جدید به ویدیوهای قبلی (میکس لوکال)...")
             base_video_bytes = await asyncio.to_thread(local_merge_videos, base_video_bytes, new_clip_bytes)
         else:
             base_video_bytes = new_clip_bytes
         if loop_idx < loops_needed - 1:
             current_secs = (loop_idx + 1) * 5
-            proc_msg = await update_status_msg(client, chat_id, proc_msg, step_text_base + f"\n۴. 📸 فعلاً {current_secs} ثانیه ساخته شد. در حال استخراج فریم آخر جهت ساخت ادامه...")
             current_image_bytes = await asyncio.to_thread(helper_extract_last_frame, base_video_bytes)
             if not current_image_bytes:
                 await update_status_msg(client, chat_id, proc_msg, "⚠️ استخراج فریم با مشکل مواجه شد. عملیات در همین نقطه پایان یافت.")
                 break
-    proc_msg = await update_status_msg(client, chat_id, proc_msg, "🚀 ویدیو کاملاً آماده شد! در حال آپلود سریع...")
     try:
         file_name = f"video_{uuid.uuid4().hex}.mp4"
         await asyncio.to_thread(sync_write_file, file_name, base_video_bytes)
-        caption_text = f"🎞 ویدیو شما با موفقیت آماده شد!\n⏱ زمان: {duration_int} ثانیه\n✨ پرامپت: {prompt}"
         upload_result = False
         for up_att in range(3):

 async def helper_generate_image_for_video(prompt, action_name, width, height):
     headers = {"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64)"}
     for attempt in range(3):
         try:
             payload = {"prompt": prompt, "width": width, "height": height, "action_name": action_name}
                         run_id = data.get("run_id")
                         if run_id:
                             waited = 0
+                            while waited < 100:
                                 await asyncio.sleep(5)
                                 waited += 5
                                 try:
         await asyncio.sleep(5)
     return None
 async def process_video_generation(client, chat_id, video_type, prompt, duration_int, image_bytes, txt_model_action=None, width=1024, height=1024):
     str_chat_id = str(chat_id).replace("`", "").replace("'", "").replace('"', "").strip()
     creds = get_user_credits(str_chat_id)
     current_image_bytes = await asyncio.to_thread(force_jpeg, current_image_bytes)
+    # 🧠 استفاده از Gemma 4 از طریق گیت‌هاب برای بهینه‌سازی پرامپت
+    proc_msg = await update_status_msg(client, chat_id, proc_msg, "🧠 در حال درک تصویر و نگارش بهترین سناریو برای ویدیو توسط هوش مصنوعی...")
+    master_prompt = """You are an expert AI Animation Planner. Your absolute highest priority is to faithfully and creatively execute the user's specific request based on the provided image.
+    1. If the user prompt is empty or generic (like "animate this"), add subtle, high-quality, believable cinematic motion (e.g., slow zoom, water flowing, wind in hair).
+    2. If the user gives specific directions, focus ENTIRELY on executing that command perfectly. If the action is not visible in-frame, use cinematic camera movements to reveal it.
+    3. You must output ONLY a highly detailed, descriptive animation prompt in ENGLISH. Do not translate literally; ENHANCE the prompt for a text-to-video AI model.
+    4. MUST Include keywords at the end: cinematic, photorealistic, high detail, smooth motion, 8k.
+    CRITICAL RULE: DO NOT say "Here is the prompt" or give any conversational explanations. DO NOT output JSON. Output ONLY the raw English animation prompt text and NOTHING ELSE."""
+    prompt_for_ai = prompt if prompt else "لطفاً این تصویر را به یک ویدیوی سینمایی بسیار جذاب و واقع‌گرایانه متحرک کن."
+    combined_prompt = f"{master_prompt}\n\nUser request: {prompt_for_ai}"
+    gemma_run_id = f"gemma_{uuid.uuid4().hex[:8]}"
+    gemma_filename = f"{gemma_run_id}.jpg"
+    with open(f"static/images/{gemma_filename}", "wb") as f:
+        f.write(current_image_bytes)
+    gemma_image_url = f"{RUBIKA_SPACE_URL}/static/images/{gemma_filename}"
+    dispatch_url = f"https://api.github.com/repos/{GITHUB_USER}/{GITHUB_REPO}/dispatches"
+    dispatch_headers = {"Accept": "application/vnd.github.v3+json", "Authorization": f"token {GITHUB_TOKEN}"}
+    gemma_payload = {
+        "event_type": "chat-gemma",
+        "client_payload": {
+            "prompt": combined_prompt,
+            "file_url": gemma_image_url,
+            "file_mime": "image/jpeg",
+            "run_id": gemma_run_id,
+            "space_url": RUBIKA_SPACE_URL
+        }
+    }
+    eng_prompt = None
+    try:
+        resp = await asyncio.to_thread(requests.post, dispatch_url, headers=dispatch_headers, json=gemma_payload, timeout=20)
+        if resp.status_code == 204:
+            waited = 0
+            while waited < 90:
+                txt_path = f"static/images/{gemma_run_id}.txt"
+                if os.path.exists(txt_path):
+                    with open(txt_path, "r", encoding="utf-8") as f:
+                        eng_prompt = f.read().strip()
+                    os.remove(txt_path)
+                    break
+                await asyncio.sleep(3)
+                waited += 3
+    except Exception as e:
+        print("Gemma action error:", e)
+    try: os.remove(f"static/images/{gemma_filename}")
+    except: pass
     if eng_prompt:
+        eng_prompt = eng_prompt.replace("```text", "").replace("```", "").replace("```json", "").strip()
+        proc_msg = await update_status_msg(client, chat_id, proc_msg, f"✅ سناریوی ویدیوی شما بهینه‌سازی شد:\n\n`{eng_prompt}`")
         await asyncio.sleep(3)
     else:
         try:
         except:
             eng_prompt = "cinematic motion, photorealistic, high detail, smooth animation, 8k"
     for loop_idx in range(loops_needed):
         new_clip_bytes = None
         for attempt in range(3):
             run_id = str(uuid.uuid4())
+            # مدیریت هوشمند پیام‌های نمایشی بدون اصطلاحات فنی
+            if loops_needed == 1:
+                if attempt == 0:
+                    msg_txt = "🎬 در حال ارسال درخواست به سرورهای قدرتمند رندر ویدیو..."
+                else:
+                    msg_txt = "⚠️ به دلیل شلوغی سرور، در حال تلاش مجدد با یک مسیر آزادتر..."
+            else:
+                start_sec = loop_idx * 5
+                end_sec = (loop_idx + 1) * 5
+                if attempt == 0:
+                    msg_txt = f"🎬 در حال رندر ثانیه‌های {start_sec} تا {end_sec} از ویدیو..."
+                else:
+                    msg_txt = f"⚠️ تلاش مجدد برای رندر ثانیه‌های {start_sec} تا {end_sec}..."
+            proc_msg = await update_status_msg(client, chat_id, proc_msg, msg_txt)
             input_filename = f"{run_id}_input.jpg"
             with open(f"static/images/{input_filename}", "wb") as f:
             image_public_url = f"{RUBIKA_SPACE_URL}/static/images/{input_filename}"
             dispatch_payload = {
                 "event_type": "generate-video",
                 "client_payload": {
             try:
                 resp = await asyncio.to_thread(requests.post, dispatch_url, headers=dispatch_headers, json=dispatch_payload, timeout=20)
                 if resp.status_code != 204:
                     await asyncio.sleep(4)
                     continue
+            except Exception:
                 await asyncio.sleep(4)
                 continue
+            if loops_needed == 1:
+                wait_msg = "⏳ هوش مصنوعی در حال ساخت ویدیوی شماست.\n(این فرآیند معمولاً بین ۲ تا ۴ دقیقه زمان می‌برد. لطفاً صبور باشید...)"
+            else:
+                wait_msg = "⏳ هوش مصنوعی در حال پردازش و رندر این بخش می‌باشد...\n(ممکن است چند دقیقه زمان ببرد)"
+            proc_msg = await update_status_msg(client, chat_id, proc_msg, wait_msg)
             waited = 0
             while waited < 180: # انتظار تا 180 ثانیه (3 دقیقه)
             if new_clip_bytes:
                 break
             else:
                 await asyncio.sleep(5)
         if not new_clip_bytes:
+            return await update_status_msg(client, chat_id, proc_msg, "❌ متاسفانه به دلیل ترافیک سنگین سرورهای رندر، عملیات متوقف شد. لطفاً کمی بعد مجدداً تلاش کنید.")
         if base_video_bytes is not None:
+            proc_msg = await update_status_msg(client, chat_id, proc_msg, "🔄 در حال متصل کردن ویدیوهای ساخته شده به یکدیگر...")
             base_video_bytes = await asyncio.to_thread(local_merge_videos, base_video_bytes, new_clip_bytes)
         else:
             base_video_bytes = new_clip_bytes
         if loop_idx < loops_needed - 1:
             current_secs = (loop_idx + 1) * 5
+            proc_msg = await update_status_msg(client, chat_id, proc_msg, f"✅ {current_secs} ثانیه از ویدیو ساخته شد!\n📸 در حال آماده‌سازی برای ساخت ثانیه‌های بعدی...")
             current_image_bytes = await asyncio.to_thread(helper_extract_last_frame, base_video_bytes)
             if not current_image_bytes:
                 await update_status_msg(client, chat_id, proc_msg, "⚠️ استخراج فریم با مشکل مواجه شد. عملیات در همین نقطه پایان یافت.")
                 break
+    proc_msg = await update_status_msg(client, chat_id, proc_msg, "🚀 ویدیو کاملاً آماده شد! در حال آپلود سریع در سرور روبیکا...")
     try:
         file_name = f"video_{uuid.uuid4().hex}.mp4"
         await asyncio.to_thread(sync_write_file, file_name, base_video_bytes)
+        caption_text = f"🎞 ویدیو شما با موفقیت آماده شد!\n⏱ زمان: {duration_int} ثانیه\n✨ پرامپت بهینه شده:\n{eng_prompt}"
         upload_result = False
         for up_att in range(3):