Spaces:

thomson99
/

blenderbot

Runtime error

App Files Community

thomson99 committed on Jan 19, 2025

Commit

513387b

verified ·

1 Parent(s): d94e7cf

Upload 2 files

Browse files

Files changed (2) hide show

app.py +28 -17
requirements.txt +4 -3

app.py CHANGED Viewed

@@ -1,25 +1,25 @@
 import gradio as gr
 import torch
 from torch import autocast
-from diffusers import StableDiffusionPipeline, DPMSolverMultistepScheduler
 from PIL import Image
 import numpy as np
 from moviepy.editor import ImageSequenceClip
 import os
 import tempfile
-import random
 from tqdm import tqdm
 def create_video_from_text(text_prompt, duration=10, fps=30, resolution="480p", motion_scale=30):
     try:
-        # تهيئة نموذج Stable Diffusion مع جدولة DPM-Solver
         model_id = "runwayml/stable-diffusion-v1-5"
         pipe = StableDiffusionPipeline.from_pretrained(
             model_id,
             torch_dtype=torch.float16,
             safety_checker=None
         )
-        pipe.scheduler = DPMSolverMultistepScheduler.from_config(pipe.scheduler.config)
         pipe = pipe.to("cuda")
         # إنشاء مجلد مؤقت لحفظ الصور
@@ -40,8 +40,11 @@ def create_video_from_text(text_prompt, duration=10, fps=30, resolution="480p",
         # توليد الإطار الأول
         with autocast("cuda"):
-            initial_latents = torch.randn(
-                (1, pipe.unet.in_channels, 64, 64),
                 device="cuda",
                 dtype=torch.float16
             )
@@ -49,9 +52,10 @@ def create_video_from_text(text_prompt, duration=10, fps=30, resolution="480p",
             # توليد الصورة الأولى
             image = pipe(
                 prompt=text_prompt,
-                latents=initial_latents,
-                num_inference_steps=50,
-                guidance_scale=7.5
             ).images[0]
             frames.append(np.array(image.resize(size)))
@@ -59,17 +63,18 @@ def create_video_from_text(text_prompt, duration=10, fps=30, resolution="480p",
         # توليد الإطارات المتتالية مع حركة تدريجية
         for i in tqdm(range(1, num_frames)):
             with autocast("cuda"):
-                # إضافة اضطراب صغير للكمون لإنشاء حركة سلسة
-                noise_scale = (i / num_frames) * motion_scale
-                noise = torch.randn_like(initial_latents) * 0.1 * noise_scale
-                current_latents = initial_latents + noise
                 # توليد الإطار الجديد
                 image = pipe(
                     prompt=text_prompt,
                     latents=current_latents,
-                    num_inference_steps=50,
-                    guidance_scale=7.5
                 ).images[0]
                 frames.append(np.array(image.resize(size)))
@@ -127,11 +132,17 @@ iface = gr.Interface(
         gr.Textbox(label="وصف المشهد", placeholder="اكتب وصفاً للمشهد المتحرك الذي تريد إنشاءه..."),
         gr.Slider(minimum=5, maximum=30, value=10, step=5, label="مدة الفيديو (بالثواني)"),
         gr.Radio(["480p", "720p", "1080p"], label="دقة الفيديو", value="480p"),
-        gr.Slider(minimum=10, maximum=50, value=30, step=5, label="مقياس الحركة")
     ],
     outputs=gr.Video(label="الفيديو المتحرك المُنشأ"),
     title="مولد الفيديو المتحرك بالذكاء الاصطناعي",
-    description="قم بإدخال وصف للمشهد وسيقوم النظام بإنشاء فيديو متحرك باستخدام الذكاء الاصطناعي. يمكنك التحكم في مقدار الحركة باستخدام شريط التمرير.",
     theme="huggingface",
     cache_examples=False
 )

 import gradio as gr
 import torch
 from torch import autocast
+from diffusers import StableDiffusionPipeline, EulerAncestralDiscreteScheduler
 from PIL import Image
 import numpy as np
 from moviepy.editor import ImageSequenceClip
 import os
 import tempfile
 from tqdm import tqdm
 def create_video_from_text(text_prompt, duration=10, fps=30, resolution="480p", motion_scale=30):
     try:
+        # تهيئة نموذج Stable Diffusion
         model_id = "runwayml/stable-diffusion-v1-5"
         pipe = StableDiffusionPipeline.from_pretrained(
             model_id,
             torch_dtype=torch.float16,
             safety_checker=None
         )
+        pipe.scheduler = EulerAncestralDiscreteScheduler.from_config(pipe.scheduler.config)
+        pipe.enable_attention_slicing()
         pipe = pipe.to("cuda")
         # إنشاء مجلد مؤقت لحفظ الصور
         # توليد الإطار الأول
         with autocast("cuda"):
+            # إنشاء الكمون الأولي
+            generator = torch.Generator(device="cuda").manual_seed(42)
+            latents = torch.randn(
+                (1, pipe.unet.config.in_channels, 64, 64),
+                generator=generator,
                 device="cuda",
                 dtype=torch.float16
             )
             # توليد الصورة الأولى
             image = pipe(
                 prompt=text_prompt,
+                latents=latents,
+                num_inference_steps=30,
+                guidance_scale=7.5,
+                generator=generator
             ).images[0]
             frames.append(np.array(image.resize(size)))
         # توليد الإطارات المتتالية مع حركة تدريجية
         for i in tqdm(range(1, num_frames)):
             with autocast("cuda"):
+                # إضافة اضطراب تدريجي للكمون
+                time_embed = torch.tensor([i / num_frames]).to("cuda", dtype=torch.float16)
+                noise = torch.randn_like(latents) * (motion_scale / 100)
+                current_latents = latents + noise * time_embed.view(-1, 1, 1, 1)
                 # توليد الإطار الجديد
                 image = pipe(
                     prompt=text_prompt,
                     latents=current_latents,
+                    num_inference_steps=30,
+                    guidance_scale=7.5,
+                    generator=generator
                 ).images[0]
                 frames.append(np.array(image.resize(size)))
         gr.Textbox(label="وصف المشهد", placeholder="اكتب وصفاً للمشهد المتحرك الذي تريد إنشاءه..."),
         gr.Slider(minimum=5, maximum=30, value=10, step=5, label="مدة الفيديو (بالثواني)"),
         gr.Radio(["480p", "720p", "1080p"], label="دقة الفيديو", value="480p"),
+        gr.Slider(minimum=10, maximum=100, value=30, step=5, label="مقياس الحركة (%)")
     ],
     outputs=gr.Video(label="الفيديو المتحرك المُنشأ"),
     title="مولد الفيديو المتحرك بالذكاء الاصطناعي",
+    description="""
+    قم بإدخال وصف للمشهد وسيقوم النظام بإنشاء فيديو متحرك باستخدام الذكاء الاصطناعي.
+    - استخدم مقياس الحركة للتحكم في مقدار الحركة في الفيديو (10% لحركة بسيطة، 100% لحركة كبيرة)
+    - اختر الدقة المناسبة (480p للسرعة، 1080p للجودة العالية)
+    - اكتب وصفاً تفصيلياً للمشهد للحصول على أفضل النتائج
+    """,
     theme="huggingface",
     cache_examples=False
 )

requirements.txt CHANGED Viewed

@@ -1,8 +1,9 @@
 gradio==3.50.2
 torch==2.0.1
-diffusers==0.19.3
-transformers==4.30.2
-accelerate==0.21.0
 pillow==9.5.0
 moviepy==1.0.3
 numpy==1.24.3

 gradio==3.50.2
 torch==2.0.1
+diffusers==0.24.0
+transformers==4.35.2
+accelerate==0.25.0
+huggingface-hub==0.19.4
 pillow==9.5.0
 moviepy==1.0.3
 numpy==1.24.3