Spaces:

allenai
/

RefDecoder

Configuration error

App Files Files Community

xiangfan00 committed 3 days ago

Commit

307d7cf

1 Parent(s): efdefa8

Try increasing GPU duration

Browse files

Files changed (1) hide show

app.py +14 -15

app.py CHANGED Viewed

@@ -11,14 +11,17 @@ import gradio as gr
 import imageio
 import numpy as np
 import ftfy
 try:
     import spaces
 except ImportError:
     class _SpacesShim:
         @staticmethod
         def GPU(*args, **kwargs):
             def decorator(fn):
                 return fn
             return decorator
     spaces = _SpacesShim()
@@ -31,7 +34,6 @@ from transformers import CLIPVisionModel
 from src.models.Wan.autoencoder_wanT import AutoencoderKLWan
 from src.models.Wan.transformer_wan import WanDecoderTransformer
 ROOT = Path(__file__).resolve().parent
 if str(ROOT) not in sys.path:
     sys.path.insert(0, str(ROOT))
@@ -559,7 +561,7 @@ def decode_with_refdecoder(latents, reference_frame, vae, transformer):
     return video
-@spaces.GPU(duration=95)
 def generate_latents_on_gpu(image, prompt, seed):
     log_cuda_mem("start generate_latents_on_gpu")
     GENERATION_PIPE.to(DEVICE)
@@ -607,7 +609,10 @@ def decode_refdecoder_on_gpu(latents, reference_frame):
     REFDECODER_TRANSFORMER.to(DEVICE)
     try:
         video = decode_with_refdecoder(
-            latents, reference_frame, REFDECODER_VAE, REFDECODER_TRANSFORMER,
         )
         video = video.detach().cpu()
     finally:
@@ -991,8 +996,7 @@ button.download-ref:disabled {
 with gr.Blocks(title="RefDecoder I2V Demo", theme=gr.themes.Soft(), css=CUSTOM_CSS) as demo:
     with gr.Column(elem_classes="app-shell"):
-        gr.HTML(
-            """
             <script>
             (() => {
                 if (window.__refdecoderResizeBound) return;
@@ -1049,18 +1053,15 @@ with gr.Blocks(title="RefDecoder I2V Demo", theme=gr.themes.Soft(), css=CUSTOM_C
                     The app generates latents once, then renders them with Wan's original VAE and with RefDecoder.
                 </p>
             </div>
-            """
-        )
         with gr.Column(elem_classes=["panel-card", "compare-panel"]):
-            gr.HTML(
-                """
                 <div class="section-title">Inputs</div>
                 <div class="section-copy">
                     Upload a reference image, optionally add a prompt, and compare the decoders below.
                 </div>
-                """
-            )
             with gr.Row(equal_height=True):
                 with gr.Column(scale=3):
                     image_input = gr.Image(
@@ -1091,14 +1092,12 @@ with gr.Blocks(title="RefDecoder I2V Demo", theme=gr.themes.Soft(), css=CUSTOM_C
                     status_md = gr.Markdown(value="", elem_classes="run-status")
         with gr.Column(elem_classes="panel-card"):
-            gr.HTML(
-                """
                 <div class="section-title">Decoder Comparison</div>
                 <div class="section-copy">
                     Left side shows Wan Baseline. Right side shows RefDecoder. Drag the divider across the frame to compare them.
                 </div>
-                """
-            )
             compare_output = gr.HTML(value=build_compare_html(None, None))
             with gr.Row(elem_classes="download-row"):

 import imageio
 import numpy as np
 import ftfy
 try:
     import spaces
 except ImportError:
     class _SpacesShim:
         @staticmethod
         def GPU(*args, **kwargs):
             def decorator(fn):
                 return fn
             return decorator
     spaces = _SpacesShim()
 from src.models.Wan.autoencoder_wanT import AutoencoderKLWan
 from src.models.Wan.transformer_wan import WanDecoderTransformer
 ROOT = Path(__file__).resolve().parent
 if str(ROOT) not in sys.path:
     sys.path.insert(0, str(ROOT))
     return video
+@spaces.GPU(duration=150)
 def generate_latents_on_gpu(image, prompt, seed):
     log_cuda_mem("start generate_latents_on_gpu")
     GENERATION_PIPE.to(DEVICE)
     REFDECODER_TRANSFORMER.to(DEVICE)
     try:
         video = decode_with_refdecoder(
+            latents,
+            reference_frame,
+            REFDECODER_VAE,
+            REFDECODER_TRANSFORMER,
         )
         video = video.detach().cpu()
     finally:
 with gr.Blocks(title="RefDecoder I2V Demo", theme=gr.themes.Soft(), css=CUSTOM_CSS) as demo:
     with gr.Column(elem_classes="app-shell"):
+        gr.HTML("""
             <script>
             (() => {
                 if (window.__refdecoderResizeBound) return;
                     The app generates latents once, then renders them with Wan's original VAE and with RefDecoder.
                 </p>
             </div>
+            """)
         with gr.Column(elem_classes=["panel-card", "compare-panel"]):
+            gr.HTML("""
                 <div class="section-title">Inputs</div>
                 <div class="section-copy">
                     Upload a reference image, optionally add a prompt, and compare the decoders below.
                 </div>
+                """)
             with gr.Row(equal_height=True):
                 with gr.Column(scale=3):
                     image_input = gr.Image(
                     status_md = gr.Markdown(value="", elem_classes="run-status")
         with gr.Column(elem_classes="panel-card"):
+            gr.HTML("""
                 <div class="section-title">Decoder Comparison</div>
                 <div class="section-copy">
                     Left side shows Wan Baseline. Right side shows RefDecoder. Drag the divider across the frame to compare them.
                 </div>
+                """)
             compare_output = gr.HTML(value=build_compare_html(None, None))
             with gr.Row(elem_classes="download-row"):