r3gm commited on
Commit
107040a
·
verified ·
1 Parent(s): ac9412c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -2
app.py CHANGED
@@ -10,6 +10,8 @@ from PIL import Image
10
  import random
11
  import gc
12
  import copy
 
 
13
 
14
  from torchao.quantization import quantize_
15
  from torchao.quantization import Float8DynamicActivationFloat8WeightConfig
@@ -44,6 +46,8 @@ MAX_FRAMES_MODEL = 160
44
  MIN_DURATION = round(MIN_FRAMES_MODEL / FIXED_FPS, 1)
45
  MAX_DURATION = round(MAX_FRAMES_MODEL / FIXED_FPS, 1)
46
 
 
 
47
  SCHEDULER_MAP = {
48
  "FlowMatchEulerDiscrete": FlowMatchEulerDiscreteScheduler,
49
  "SASolver": SASolverScheduler,
@@ -61,6 +65,12 @@ pipe = WanImageToVideoPipeline.from_pretrained(
61
  original_scheduler = copy.deepcopy(pipe.scheduler)
62
  print(original_scheduler)
63
 
 
 
 
 
 
 
64
  quantize_(pipe.text_encoder, Int8WeightOnlyConfig())
65
  quantize_(pipe.transformer, Float8DynamicActivationFloat8WeightConfig())
66
  quantize_(pipe.transformer_2, Float8DynamicActivationFloat8WeightConfig())
@@ -299,11 +309,11 @@ def generate_video(
299
  return video_path, video_path, current_seed
300
 
301
 
302
- with gr.Blocks(theme=gr.themes.Soft(), delete_cache=(12800, 12800)) as demo:
303
  gr.Markdown("# WAMU V2 - Wan 2.2 I2V (14B) 🐢")
304
  gr.Markdown("## ℹ️ **A Note on Performance:** This version prioritizes a straightforward setup over maximum speed, so performance may vary.")
305
  gr.Markdown('Try the previous version: [WAMU v1](https://huggingface.co/spaces/r3gm/wan2-2-fp8da-aoti-preview2)')
306
- gr.Markdown("run Wan 2.2 in just 4-8 steps, fp8 quantization & AoT compilation - compatible with 🧨 diffusers and ZeroGPU")
307
  with gr.Row():
308
  with gr.Column():
309
  input_image_component = gr.Image(type="pil", label="Input Image")
 
10
  import random
11
  import gc
12
  import copy
13
+ import os
14
+ import shutil
15
 
16
  from torchao.quantization import quantize_
17
  from torchao.quantization import Float8DynamicActivationFloat8WeightConfig
 
46
  MIN_DURATION = round(MIN_FRAMES_MODEL / FIXED_FPS, 1)
47
  MAX_DURATION = round(MAX_FRAMES_MODEL / FIXED_FPS, 1)
48
 
49
+ CACHE_DIR = os.path.expanduser("~/.cache/huggingface/")
50
+
51
  SCHEDULER_MAP = {
52
  "FlowMatchEulerDiscrete": FlowMatchEulerDiscreteScheduler,
53
  "SASolver": SASolverScheduler,
 
65
  original_scheduler = copy.deepcopy(pipe.scheduler)
66
  print(original_scheduler)
67
 
68
+ if os.path.exists(CACHE_DIR):
69
+ shutil.rmtree(CACHE_DIR)
70
+ print("Deleted Hugging Face cache.")
71
+ else:
72
+ print("No hub cache found.")
73
+
74
  quantize_(pipe.text_encoder, Int8WeightOnlyConfig())
75
  quantize_(pipe.transformer, Float8DynamicActivationFloat8WeightConfig())
76
  quantize_(pipe.transformer_2, Float8DynamicActivationFloat8WeightConfig())
 
309
  return video_path, video_path, current_seed
310
 
311
 
312
+ with gr.Blocks(theme=gr.themes.Soft(), delete_cache=(3600, 10800)) as demo:
313
  gr.Markdown("# WAMU V2 - Wan 2.2 I2V (14B) 🐢")
314
  gr.Markdown("## ℹ️ **A Note on Performance:** This version prioritizes a straightforward setup over maximum speed, so performance may vary.")
315
  gr.Markdown('Try the previous version: [WAMU v1](https://huggingface.co/spaces/r3gm/wan2-2-fp8da-aoti-preview2)')
316
+ gr.Markdown("Run Wan 2.2 in just 4-8 steps, fp8 quantization & AoT compilation - compatible with 🧨 diffusers and ZeroGPU")
317
  with gr.Row():
318
  with gr.Column():
319
  input_image_component = gr.Image(type="pil", label="Input Image")