Spaces:

thomson99
/

blenderbot

Runtime error

App Files Files Community

thomson99 committed on Jan 19, 2025

Commit

ed8662b

verified ·

1 Parent(s): 513387b

Upload app.py

Browse files

Files changed (1) hide show

app.py +44 -38

app.py CHANGED Viewed

@@ -1,6 +1,5 @@
 import gradio as gr
 import torch
-from torch import autocast
 from diffusers import StableDiffusionPipeline, EulerAncestralDiscreteScheduler
 from PIL import Image
 import numpy as np
@@ -13,14 +12,15 @@ def create_video_from_text(text_prompt, duration=10, fps=30, resolution="480p",
     try:
         # تهيئة نموذج Stable Diffusion
         model_id = "runwayml/stable-diffusion-v1-5"
         pipe = StableDiffusionPipeline.from_pretrained(
             model_id,
-            torch_dtype=torch.float16,
-            safety_checker=None
         )
         pipe.scheduler = EulerAncestralDiscreteScheduler.from_config(pipe.scheduler.config)
         pipe.enable_attention_slicing()
-        pipe = pipe.to("cuda")
         # إنشاء مجلد مؤقت لحفظ الصور
         temp_dir = tempfile.mkdtemp()
@@ -34,58 +34,62 @@ def create_video_from_text(text_prompt, duration=10, fps=30, resolution="480p",
         else:  # 1080p
             size = (1920, 1080)
-        # عدد الإطارات المطلوبة
-        num_frames = int(duration * fps)
         print(f"جاري توليد {num_frames} إطار...")
         # توليد الإطار الأول
-        with autocast("cuda"):
-            # إنشاء الكمون الأولي
-            generator = torch.Generator(device="cuda").manual_seed(42)
-            latents = torch.randn(
-                (1, pipe.unet.config.in_channels, 64, 64),
-                generator=generator,
-                device="cuda",
-                dtype=torch.float16
-            )
-            # توليد الصورة الأولى
             image = pipe(
                 prompt=text_prompt,
-                latents=latents,
-                num_inference_steps=30,
                 guidance_scale=7.5,
                 generator=generator
             ).images[0]
             frames.append(np.array(image.resize(size)))
-        # توليد الإطارات المتتالية مع حركة تدريجية
-        for i in tqdm(range(1, num_frames)):
-            with autocast("cuda"):
-                # إضافة اضطراب تدريجي للكمون
-                time_embed = torch.tensor([i / num_frames]).to("cuda", dtype=torch.float16)
-                noise = torch.randn_like(latents) * (motion_scale / 100)
-                current_latents = latents + noise * time_embed.view(-1, 1, 1, 1)
-                # توليد الإطار الجديد
-                image = pipe(
-                    prompt=text_prompt,
-                    latents=current_latents,
-                    num_inference_steps=30,
-                    guidance_scale=7.5,
-                    generator=generator
-                ).images[0]
-                frames.append(np.array(image.resize(size)))
         if not frames:
             raise ValueError("فشل في توليد الإطارات")
         print("جاري إنشاء الفيديو...")
         # إنشاء الفيديو من الإطارات
-        clip = ImageSequenceClip(frames, fps=fps)
         # حفظ الفيديو في ملف مؤقت
         output_path = os.path.join(temp_dir, "output.mp4")
@@ -142,6 +146,8 @@ iface = gr.Interface(
     - استخدم مقياس الحركة للتحكم في مقدار الحركة في الفيديو (10% لحركة بسيطة، 100% لحركة كبيرة)
     - اختر الدقة المناسبة (480p للسرعة، 1080p للجودة العالية)
     - اكتب وصفاً تفصيلياً للمشهد للحصول على أفضل النتائج
     """,
     theme="huggingface",
     cache_examples=False

 import gradio as gr
 import torch
 from diffusers import StableDiffusionPipeline, EulerAncestralDiscreteScheduler
 from PIL import Image
 import numpy as np
     try:
         # تهيئة نموذج Stable Diffusion
         model_id = "runwayml/stable-diffusion-v1-5"
+        device = "cpu"  # استخدام CPU
         pipe = StableDiffusionPipeline.from_pretrained(
             model_id,
+            torch_dtype=torch.float32,  # استخدام float32 للـ CPU
         )
         pipe.scheduler = EulerAncestralDiscreteScheduler.from_config(pipe.scheduler.config)
         pipe.enable_attention_slicing()
+        pipe = pipe.to(device)
         # إنشاء مجلد مؤقت لحفظ الصور
         temp_dir = tempfile.mkdtemp()
         else:  # 1080p
             size = (1920, 1080)
+        # تقليل عدد الإطارات للأداء على CPU
+        fps_reduced = 15  # تقليل معدل الإطارات
+        num_frames = int(duration * fps_reduced / 2)  # تقليل عدد الإطارات
         print(f"جاري توليد {num_frames} إطار...")
         # توليد الإطار الأول
+        generator = torch.Generator(device=device).manual_seed(42)
+        latents = torch.randn(
+            (1, pipe.unet.config.in_channels, 64, 64),
+            generator=generator,
+            device=device,
+            dtype=torch.float32
+        )
+        # توليد الصورة الأولى
+        image = pipe(
+            prompt=text_prompt,
+            latents=latents,
+            num_inference_steps=20,  # تقليل خطوات الاستدلال
+            guidance_scale=7.5,
+            generator=generator
+        ).images[0]
+        frames.append(np.array(image.resize(size)))
+        # توليد الإطارات المتتالية مع حركة تدريجية
+        for i in tqdm(range(1, num_frames)):
+            # إضافة اضطراب تدريجي للكمون
+            time_embed = torch.tensor([i / num_frames], device=device, dtype=torch.float32)
+            noise = torch.randn_like(latents) * (motion_scale / 100)
+            current_latents = latents + noise * time_embed.view(-1, 1, 1, 1)
+            # توليد الإطار الجديد
             image = pipe(
                 prompt=text_prompt,
+                latents=current_latents,
+                num_inference_steps=20,
                 guidance_scale=7.5,
                 generator=generator
             ).images[0]
             frames.append(np.array(image.resize(size)))
         if not frames:
             raise ValueError("فشل في توليد الإطارات")
         print("جاري إنشاء الفيديو...")
+        # تكرار الإطارات للوصول إلى FPS المطلوب
+        frames_extended = []
+        for frame in frames:
+            repeat_times = int(fps / fps_reduced)
+            frames_extended.extend([frame] * repeat_times)
         # إنشاء الفيديو من الإطارات
+        clip = ImageSequenceClip(frames_extended, fps=fps)
         # حفظ الفيديو في ملف مؤقت
         output_path = os.path.join(temp_dir, "output.mp4")
     - استخدم مقياس الحركة للتحكم في مقدار الحركة في الفيديو (10% لحركة بسيطة، 100% لحركة كبيرة)
     - اختر الدقة المناسبة (480p للسرعة، 1080p للجودة العالية)
     - اكتب وصفاً تفصيلياً للمشهد للحصول على أفضل النتائج
+    ملاحظة: يتم تشغيل النموذج على CPU مما قد يؤدي إلى بطء في الأداء. للحصول على أداء أفضل، يُنصح باستخدام GPU.
     """,
     theme="huggingface",
     cache_examples=False