Spaces:
Configuration error
Configuration error
Update app.py
Browse files
app.py
CHANGED
|
@@ -26,8 +26,9 @@ import torchvision
|
|
| 26 |
from PIL import Image
|
| 27 |
from transformers import CLIPVisionModelWithProjection, CLIPImageProcessor
|
| 28 |
from transformers.image_transforms import convert_to_rgb
|
|
|
|
| 29 |
|
| 30 |
-
|
| 31 |
def auto_inpainting(video_input, masked_video, mask, prompt, image, vae, text_encoder, image_encoder, diffusion, model, device, cfg_scale, img_cfg_scale, negative_prompt=""):
|
| 32 |
global use_fp16
|
| 33 |
image_prompt_embeds = None
|
|
@@ -82,7 +83,7 @@ def auto_inpainting(video_input, masked_video, mask, prompt, image, vae, text_en
|
|
| 82 |
video_clip = vae.decode(video_clip / 0.18215).sample # [16, 3, 256, 256]
|
| 83 |
return video_clip
|
| 84 |
|
| 85 |
-
|
| 86 |
def auto_inpainting_temp_split(video_input, masked_video, mask, prompt, image, vae, text_encoder, image_encoder, diffusion, model, device, scfg_scale, tcfg_scale, img_cfg_scale, negative_prompt=""):
|
| 87 |
global use_fp16
|
| 88 |
image_prompt_embeds = None
|
|
@@ -153,7 +154,7 @@ vae = None
|
|
| 153 |
text_encoder = None
|
| 154 |
image_encoder = None
|
| 155 |
clip_image_processor = None
|
| 156 |
-
|
| 157 |
def init_model():
|
| 158 |
global device
|
| 159 |
global output_path
|
|
@@ -212,7 +213,7 @@ init_model()
|
|
| 212 |
# ========================================
|
| 213 |
# Video Generation
|
| 214 |
# ========================================
|
| 215 |
-
|
| 216 |
def video_generation(text, image, scfg_scale, tcfg_scale, img_cfg_scale, diffusion):
|
| 217 |
with torch.no_grad():
|
| 218 |
print("begin generation", flush=True)
|
|
@@ -242,6 +243,7 @@ def video_generation(text, image, scfg_scale, tcfg_scale, img_cfg_scale, diffusi
|
|
| 242 |
# ========================================
|
| 243 |
# Video Prediction
|
| 244 |
# ========================================
|
|
|
|
| 245 |
def video_prediction(text, image, scfg_scale, tcfg_scale, img_cfg_scale, preframe, diffusion):
|
| 246 |
with torch.no_grad():
|
| 247 |
print("begin generation", flush=True)
|
|
@@ -278,7 +280,7 @@ def video_prediction(text, image, scfg_scale, tcfg_scale, img_cfg_scale, prefram
|
|
| 278 |
# ========================================
|
| 279 |
# Judge Generation or Prediction
|
| 280 |
# ========================================
|
| 281 |
-
|
| 282 |
def gen_or_pre(text_input, image_input, scfg_scale, tcfg_scale, img_cfg_scale, preframe_input, diffusion_step):
|
| 283 |
default_step = [25, 40, 50, 100, 125, 200, 250]
|
| 284 |
difference = [abs(item - diffusion_step) for item in default_step]
|
|
|
|
| 26 |
from PIL import Image
|
| 27 |
from transformers import CLIPVisionModelWithProjection, CLIPImageProcessor
|
| 28 |
from transformers.image_transforms import convert_to_rgb
|
| 29 |
+
import spaces
|
| 30 |
|
| 31 |
+
@spaces.GPU
|
| 32 |
def auto_inpainting(video_input, masked_video, mask, prompt, image, vae, text_encoder, image_encoder, diffusion, model, device, cfg_scale, img_cfg_scale, negative_prompt=""):
|
| 33 |
global use_fp16
|
| 34 |
image_prompt_embeds = None
|
|
|
|
| 83 |
video_clip = vae.decode(video_clip / 0.18215).sample # [16, 3, 256, 256]
|
| 84 |
return video_clip
|
| 85 |
|
| 86 |
+
@spaces.GPU
|
| 87 |
def auto_inpainting_temp_split(video_input, masked_video, mask, prompt, image, vae, text_encoder, image_encoder, diffusion, model, device, scfg_scale, tcfg_scale, img_cfg_scale, negative_prompt=""):
|
| 88 |
global use_fp16
|
| 89 |
image_prompt_embeds = None
|
|
|
|
| 154 |
text_encoder = None
|
| 155 |
image_encoder = None
|
| 156 |
clip_image_processor = None
|
| 157 |
+
@spaces.GPU
|
| 158 |
def init_model():
|
| 159 |
global device
|
| 160 |
global output_path
|
|
|
|
| 213 |
# ========================================
|
| 214 |
# Video Generation
|
| 215 |
# ========================================
|
| 216 |
+
@spaces.GPU
|
| 217 |
def video_generation(text, image, scfg_scale, tcfg_scale, img_cfg_scale, diffusion):
|
| 218 |
with torch.no_grad():
|
| 219 |
print("begin generation", flush=True)
|
|
|
|
| 243 |
# ========================================
|
| 244 |
# Video Prediction
|
| 245 |
# ========================================
|
| 246 |
+
@spaces.GPU
|
| 247 |
def video_prediction(text, image, scfg_scale, tcfg_scale, img_cfg_scale, preframe, diffusion):
|
| 248 |
with torch.no_grad():
|
| 249 |
print("begin generation", flush=True)
|
|
|
|
| 280 |
# ========================================
|
| 281 |
# Judge Generation or Prediction
|
| 282 |
# ========================================
|
| 283 |
+
@spaces.GPU
|
| 284 |
def gen_or_pre(text_input, image_input, scfg_scale, tcfg_scale, img_cfg_scale, preframe_input, diffusion_step):
|
| 285 |
default_step = [25, 40, 50, 100, 125, 200, 250]
|
| 286 |
difference = [abs(item - diffusion_step) for item in default_step]
|