Mix

Running

App Files Files Community

Mmyyyzsj committed on Mar 9

Commit

a6852ca

verified ·

1 Parent(s): 2695ae9

Create app.py

Browse files

Files changed (1) hide show

app.py +132 -0

app.py ADDED Viewed

	@@ -0,0 +1,132 @@

+import os
+import cv2
+import torch
+import gradio as gr
+import numpy as np
+from PIL import Image
+from insightface.app import FaceAnalysis
+from insightface.model_zoo import get_model
+from transformers import AutoModelForCausalLM, AutoTokenizer, AutoConfig
+import tempfile
+# 1. إعداد نماذج الرؤية (Moondream2) - النسخة المستقرة
+print("--- جاري تحميل نموذج الرؤية (Moondream2) ---")
+model_id = "vikhyatk/moondream2"
+revision = "2024-05-20"
+device = "cpu"
+try:
+    # --- الجزء الجديد لحل مشكلة AttributeError و pad_token_id ---
+    config = AutoConfig.from_pretrained(model_id, trust_remote_code=True)
+    if not hasattr(config, 'pad_token_id'):
+        # تعيين pad_token_id ليكون نفس قيمة eos_token_id لمنع خطأ PhiConfig
+        config.pad_token_id = config.eos_token_id
+    tokenizer = AutoTokenizer.from_pretrained(
+        model_id,
+        trust_remote_code=True
+    )
+    vision_model = AutoModelForCausalLM.from_pretrained(
+        model_id,
+        config=config,
+        revision=revision,
+        trust_remote_code=True
+    ).to(device)
+    vision_model.eval()
+    # -------------------------------------------------------
+except Exception as e:
+    print(f"⚠️ خطأ أثناء تحميل موديل الرؤية: {e}")
+# 2. إعداد محرك الـ Mix (Face Swap)
+print("--- جاري تحميل محرك تبديل الوجوه ---")
+face_app = FaceAnalysis(name='bufflere', providers=['CPUExecutionProvider'])
+face_app.prepare(ctx_id=0, det_size=(640, 640))
+# تحميل موديل التبديل (inswapper_128)
+swapper = get_model("inswapper_128.onnx", download=True, download_zip=True)
+def process_video(source_img, target_video, progress=gr.Progress()):
+    if source_img is None or target_video is None:
+        return None, "⚠️ من فضلك ارفع صورة الوجه وفيديو المشهد أولاً."
+    progress(0, desc="🔍 جاري تحليل ملامح الوجه...")
+    # تحويل الصورة لنمط OpenCV
+    face_img = cv2.cvtColor(np.array(source_img), cv2.COLOR_RGB2BGR)
+    source_faces = face_app.get(face_img)
+    if not source_faces:
+        return None, "❌ لم نجد وجهاً واضحاً في الصورة المرفوعة!"
+    source_face = source_faces[0]
+    # قراءة الفيديو المصدر
+    cap = cv2.VideoCapture(target_video)
+    fps = cap.get(cv2.CAP_PROP_FPS)
+    total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
+    width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+    height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+    # إنشاء ملف مؤقت للنتيجة
+    output_fd, output_path = tempfile.mkstemp(suffix='.mp4')
+    os.close(output_fd)
+    fourcc = cv2.VideoWriter_fourcc(*'mp4v')
+    out = cv2.VideoWriter(output_path, fourcc, fps, (width, height))
+    frame_count = 0
+    try:
+        while cap.isOpened():
+            ret, frame = cap.read()
+            if not ret:
+                break
+            # البحث عن الوجوه في كل فريم لتبديلها
+            target_faces = face_app.get(frame)
+            if target_faces:
+                for target_face in target_faces:
+                    # عملية التبديل السينمائي
+                    frame = swapper.get(frame, target_face, source_face, paste_back=True)
+            out.write(frame)
+            frame_count += 1
+            if frame_count % 5 == 0:
+                progress(frame_count / total_frames, desc=f"🎬 جاري المعالجة: {int((frame_count/total_frames)*100)}%")
+    except Exception as e:
+        return None, f"🔥 حدث خطأ فني: {str(e)}"
+    finally:
+        cap.release()
+        out.release()
+    return output_path, "✅ تم الخلط بنجاح! شاهد النتيجة الآن."
+# 3. User interface (Gradio UI)
+# Builds the Blocks app: an HTML header, then one row with two columns
+# (inputs + action button on one side, result video + status on the other).
+with gr.Blocks(theme=gr.themes.Soft(primary_hue="indigo")) as demo:
+    gr.HTML("""
+        <div style="text-align: center; padding: 20px;">
+            <h1 style="font-size: 2.5rem; font-weight: 900;">🎭 AI Face Mix Pro</h1>
+            <p style="font-size: 1.1rem; opacity: 0.8;">اجمع بين صورتك وأي مشهد فيديو باحترافية</p>
+        </div>
+    """)
+    with gr.Row():
+        with gr.Column():
+            # type="pil" hands process_video a PIL image, which it converts
+            # to an OpenCV array itself.
+            source_image = gr.Image(label="📸 صورتك الشخصية", type="pil")
+            target_video = gr.Video(label="🎬 فيديو المشهد")
+            mix_btn = gr.Button("🚀 ابدأ الخلط السحري", variant="primary")
+        with gr.Column():
+            output_video = gr.Video(label="✨ النتيجة النهائية")
+            # Read-only box that shows the status message returned by
+            # process_video.
+            status_text = gr.Textbox(label="📡 حالة المعالجة", interactive=False)
+    # Wire the button: the two inputs map to process_video's first two
+    # parameters, and its (path, message) return maps to the two outputs.
+    mix_btn.click(
+        fn=process_video,
+        inputs=[source_image, target_video],
+        outputs=[output_video, status_text]
+    )
+# Start the server only when run as a script; binds to all interfaces on
+# port 7860.
+if __name__ == "__main__":
+    demo.launch(server_name="0.0.0.0", server_port=7860)