Spaces:

thomson99
/

blenderbot

Runtime error

App Files Files Community

thomson99 committed on Jan 19, 2025

Commit

a7061b5

verified ·

1 Parent(s): ed8662b

Upload app.py

Browse files

Files changed (1) hide show

app.py +62 -66

app.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import gradio as gr
 import torch
-from diffusers import StableDiffusionPipeline, EulerAncestralDiscreteScheduler
 from PIL import Image
 import numpy as np
 from moviepy.editor import ImageSequenceClip
@@ -11,91 +11,87 @@ from tqdm import tqdm
 def create_video_from_text(text_prompt, duration=10, fps=30, resolution="480p", motion_scale=30):
     try:
         # تهيئة نموذج Stable Diffusion
-        model_id = "runwayml/stable-diffusion-v1-5"
-        device = "cpu"  # استخدام CPU
         pipe = StableDiffusionPipeline.from_pretrained(
             model_id,
-            torch_dtype=torch.float32,  # استخدام float32 للـ CPU
         )
-        pipe.scheduler = EulerAncestralDiscreteScheduler.from_config(pipe.scheduler.config)
-        pipe.enable_attention_slicing()
         pipe = pipe.to(device)
-        # إنشاء مجلد مؤقت لحفظ الصور
         temp_dir = tempfile.mkdtemp()
         frames = []
-        # تحديد حجم الصورة حسب الدقة المطلوبة
         if resolution == "480p":
-            size = (854, 480)
         elif resolution == "720p":
             size = (1280, 720)
-        else:  # 1080p
             size = (1920, 1080)
-        # تقليل عدد الإطارات للأداء على CPU
-        fps_reduced = 15  # تقليل معدل الإطارات
-        num_frames = int(duration * fps_reduced / 2)  # تقليل عدد الإطارات
-        print(f"جاري توليد {num_frames} إطار...")
-        # توليد الإطار الأول
-        generator = torch.Generator(device=device).manual_seed(42)
-        latents = torch.randn(
-            (1, pipe.unet.config.in_channels, 64, 64),
-            generator=generator,
-            device=device,
-            dtype=torch.float32
-        )
-        # توليد الصورة الأولى
-        image = pipe(
-            prompt=text_prompt,
-            latents=latents,
-            num_inference_steps=20,  # تقليل خطوات الاستدلال
-            guidance_scale=7.5,
-            generator=generator
-        ).images[0]
-        frames.append(np.array(image.resize(size)))
-        # توليد الإطارات المتتالية مع حركة تدريجية
-        for i in tqdm(range(1, num_frames)):
-            # إضافة اضطراب تدريجي للكمون
-            time_embed = torch.tensor([i / num_frames], device=device, dtype=torch.float32)
-            noise = torch.randn_like(latents) * (motion_scale / 100)
-            current_latents = latents + noise * time_embed.view(-1, 1, 1, 1)
-            # توليد الإطار الجديد
             image = pipe(
-                prompt=text_prompt,
-                latents=current_latents,
-                num_inference_steps=20,
-                guidance_scale=7.5,
-                generator=generator
             ).images[0]
-            frames.append(np.array(image.resize(size)))
         if not frames:
-            raise ValueError("فشل في توليد الإطارات")
         print("جاري إنشاء الفيديو...")
-        # تكرار الإطارات للوصول إلى FPS المطلوب
-        frames_extended = []
-        for frame in frames:
-            repeat_times = int(fps / fps_reduced)
-            frames_extended.extend([frame] * repeat_times)
-        # إنشاء الفيديو من الإطارات
-        clip = ImageSequenceClip(frames_extended, fps=fps)
-        # حفظ الفيديو في ملف مؤقت
         output_path = os.path.join(temp_dir, "output.mp4")
         clip.write_videofile(output_path, codec='libx264', fps=fps)
-        # تحرير الذاكرة
         pipe = None
         torch.cuda.empty_cache()
@@ -114,7 +110,6 @@ def video_generator(text_prompt, duration=10, resolution="480p", motion_scale=30
     print(f"بدء توليد فيديو متحرك بناءً على الوصف: {text_prompt}")
     print(f"المدة: {duration} ثواني")
     print(f"الدقة: {resolution}")
-    print(f"مقياس الحركة: {motion_scale}")
     try:
         result = create_video_from_text(
@@ -129,25 +124,26 @@ def video_generator(text_prompt, duration=10, resolution="480p", motion_scale=30
         print(f"حدث خطأ في المولد: {error_msg}")
         return f"حدث خطأ: {error_msg}"
-# إنشاء واجهة المستخدم باستخدام Gradio
 iface = gr.Interface(
     fn=video_generator,
     inputs=[
         gr.Textbox(label="وصف المشهد", placeholder="اكتب وصفاً للمشهد المتحرك الذي تريد إنشاءه..."),
-        gr.Slider(minimum=5, maximum=30, value=10, step=5, label="مدة الفيديو (بالثواني)"),
         gr.Radio(["480p", "720p", "1080p"], label="دقة الفيديو", value="480p"),
         gr.Slider(minimum=10, maximum=100, value=30, step=5, label="مقياس الحركة (%)")
     ],
     outputs=gr.Video(label="الفيديو المتحرك المُنشأ"),
-    title="مولد الفيديو المتحرك بالذكاء الاصطناعي",
     description="""
     قم بإدخال وصف للمشهد وسيقوم النظام بإنشاء فيديو متحرك باستخدام الذكاء الاصطناعي.
-    - استخدم مقياس الحركة للتحكم في مقدار الحركة في الفيديو (10% لحركة بسيطة، 100% لحركة كبيرة)
-    - اختر الدقة المناسبة (480p للسرعة، 1080p للجودة العالية)
-    - اكتب وصفاً تفصيلياً للمشهد للحصول على أفضل النتائج
-    ملاحظة: يتم تشغيل النموذج على CPU مما قد يؤدي إلى بطء في الأداء. للحصول على أداء أفضل، يُنصح باستخدام GPU.
     """,
     theme="huggingface",
     cache_examples=False

 import gradio as gr
 import torch
+from diffusers import StableDiffusionPipeline
 from PIL import Image
 import numpy as np
 from moviepy.editor import ImageSequenceClip
 def create_video_from_text(text_prompt, duration=10, fps=30, resolution="480p", motion_scale=30):
     try:
         # تهيئة نموذج Stable Diffusion
+        model_id = "CompVis/stable-diffusion-v1-4"  # نموذج أخف
+        device = "cpu"
         pipe = StableDiffusionPipeline.from_pretrained(
             model_id,
+            torch_dtype=torch.float32
         )
         pipe = pipe.to(device)
+        # تحسين الأداء
+        pipe.enable_attention_slicing()
+        pipe.enable_model_cpu_offload()
+        # إنشاء مجلد مؤقت
         temp_dir = tempfile.mkdtemp()
         frames = []
+        # تحديد الحجم
         if resolution == "480p":
+            size = (640, 480)  # حجم أصغر للأداء
         elif resolution == "720p":
             size = (1280, 720)
+        else:
             size = (1920, 1080)
+        # توليد 3 صور فقط
+        num_images = 3
+        print(f"جاري توليد {num_images} صور...")
+        for i in tqdm(range(num_images)):
+            # تعديل البرومبت لكل صورة
+            current_prompt = text_prompt
+            if i == 1:
+                current_prompt += " , slight movement"
+            elif i == 2:
+                current_prompt += " , more movement"
+            # توليد الصورة
             image = pipe(
+                prompt=current_prompt,
+                num_inference_steps=20,  # تقليل خطوات الاستدلال
+                guidance_scale=7.0
             ).images[0]
+            # تغيير الحجم
+            image = image.resize(size, Image.LANCZOS)
+            frames.append(np.array(image))
         if not frames:
+            raise ValueError("فشل في توليد الصور")
         print("جاري إنشاء الفيديو...")
+        # إنشاء الإطارات الوسيطة
+        final_frames = []
+        for i in range(len(frames)-1):
+            # إضافة الإطار الحالي
+            final_frames.append(frames[i])
+            # إنشاء إطارات وسيطة
+            num_transitions = 10  # عدد الإطارات الوسيطة
+            for t in range(num_transitions):
+                alpha = t / num_transitions
+                transition_frame = (1 - alpha) * frames[i] + alpha * frames[i+1]
+                final_frames.append(transition_frame.astype(np.uint8))
+        # إضافة الإطار الأخير
+        final_frames.append(frames[-1])
+        # تكرار الإطارات للوصول للمدة المطلوبة
+        target_frames = int(duration * fps)
+        if len(final_frames) < target_frames:
+            final_frames = final_frames * (target_frames // len(final_frames) + 1)
+        final_frames = final_frames[:target_frames]
+        # إنشاء الفيديو
+        clip = ImageSequenceClip(final_frames, fps=fps)
         output_path = os.path.join(temp_dir, "output.mp4")
         clip.write_videofile(output_path, codec='libx264', fps=fps)
+        # تنظيف الذاكرة
         pipe = None
         torch.cuda.empty_cache()
     print(f"بدء توليد فيديو متحرك بناءً على الوصف: {text_prompt}")
     print(f"المدة: {duration} ثواني")
     print(f"الدقة: {resolution}")
     try:
         result = create_video_from_text(
         print(f"حدث خطأ في المولد: {error_msg}")
         return f"حدث خطأ: {error_msg}"
+# إنشاء واجهة المستخدم
 iface = gr.Interface(
     fn=video_generator,
     inputs=[
         gr.Textbox(label="وصف المشهد", placeholder="اكتب وصفاً للمشهد المتحرك الذي تريد إنشاءه..."),
+        gr.Slider(minimum=3, maximum=15, value=5, step=1, label="مدة الفيديو (بالثواني)"),
         gr.Radio(["480p", "720p", "1080p"], label="دقة الفيديو", value="480p"),
         gr.Slider(minimum=10, maximum=100, value=30, step=5, label="مقياس الحركة (%)")
     ],
     outputs=gr.Video(label="الفيديو المتحرك المُنشأ"),
+    title="مولد الفيديو المتحرك بالذكاء الاصطناعي (نسخة سريعة)",
     description="""
     قم بإدخال وصف للمشهد وسيقوم النظام بإنشاء فيديو متحرك باستخدام الذكاء الاصطناعي.
+    نصائح للأداء الأفضل:
+    - استخدم دقة 480p للحصول على أسرع أداء
+    - اختر مدة قصيرة (3-5 ثواني) للتجربة الأولى
+    - اكتب وصفاً واضحاً وبسيطاً
+    ملاحظة: هذه نسخة مُحسنة للأداء على CPU. تم تبسيط عملية توليد الفيديو للحصول على نتائج أسرع.
     """,
     theme="huggingface",
     cache_examples=False