SUPIR

Running on Zero

App Files Files Community

Fabrice-TIERCELIN committed 23 days ago

Commit

835c77e

verified ·

1 Parent(s): 829ee9e

Total second length

Browse files

Files changed (1) hide show

app.py +34 -9

app.py CHANGED Viewed

@@ -1100,18 +1100,19 @@ class CameraDropdown(gr.HTML):
 def generate_video_example_debug(input_image, prompt, camera_lora, resolution, radioanimated_mode, input_video, input_audio, progress=gr.Progress(track_tqdm=True)):
     allocation_time = None
     if input_image_debug_value[0] is not None or input_audio_debug_value[0] is not None or input_video_debug_value[0] is not None or prompt_debug_value[0] is not None or total_second_length_debug_value[0] is not None or allocation_time_debug_value[0] is not None or resolution_debug_value[0] is not None or factor_debug_value[0] is not None:
         input_image = input_image_debug_value[0]
         input_audio = input_audio_debug_value[0]
         input_video = input_video_debug_value[0]
         prompt = prompt_debug_value[0]
-        duration = total_second_length_debug_value[0]
         resolution = resolution_debug_value[0]
         allocation_time = allocation_time_debug_value[0]
-    return generate_video_example(input_image, prompt, camera_lora, resolution, radioanimated_mode, input_video, input_audio, allocation_time)
-def generate_video_example(input_image, prompt, camera_lora, resolution, radioanimated_mode, input_video, input_audio, allocation_time=None, progress=gr.Progress(track_tqdm=True)):
     w, h = apply_resolution(resolution)
@@ -1129,6 +1130,7 @@ def generate_video_example(input_image, prompt, camera_lora, resolution, radioan
             w,
             camera_lora,
             input_audio,
             allocation_time,
             progress
         )
@@ -1147,8 +1149,9 @@ def get_duration(
     width,
     camera_lora,
     audio_path,
-    allocation_time,
-    progress
 ):
     if allocation_time is not None:
         allocation_time
@@ -1185,6 +1188,7 @@ def generate_video(
     width: int = DEFAULT_1_STAGE_WIDTH,
     camera_lora: str = "No LoRA",
     audio_path = None,
     allocation_time = None,
     progress=gr.Progress(track_tqdm=True),
 ):
@@ -1219,6 +1223,9 @@ def generate_video(
         gr.Info("15s not avaiable when a LoRA or lipsync is activated, reducing to 10s for this generation")
         duration = 10
     if audio_path is None:
         print(f'generating with duration:{duration} and LoRA:{camera_lora} in {width}x{height}')
     else:
@@ -2283,18 +2290,36 @@ with gr.Blocks(title="LTX-2 Video Distilled 🎥🔈") as demo:
         examples=[
             [
                 "supergirl-2.png",
-                "A fuzzy puppet superhero character resembling a female puppet with blonde hair and a blue superhero suit sleeping in bed and just waking up, she gradually gets up, rubbing her eyes and looking at her dog that just popped on the bed. the scene feels chaotic, comedic, and emotional with expressive puppet reactions, cinematic lighting, smooth camera motion, shallow depth of field, and high-quality puppet-style animation",
                 "Static",
                 "16:9",
                 "Image-to-Video",
                 None,
                 "supergirl.m4a"
             ],
             [
                 "supergirl.png",
-                "A fuzzy puppet superhero character resembling a female puppet with blonde hair and a blue superhero suit stands inside an icy cave made of frozen walls and icicles, she looks panicked and frantic, rapidly turning her head left and right and scanning the cave while waving her arms and shouting angrily and desperately, mouthing the words “where the hell is my dog,” her movements exaggerated and puppet-like with high energy and urgency, suddenly a second puppet dog bursts into frame from the side, jumping up excitedly and tackling her affectionately while licking her face repeatedly, she freezes in surprise and then breaks into relief and laughter as the dog continues licking her, the scene feels chaotic, comedic, and emotional with expressive puppet reactions, cinematic lighting, smooth camera motion, shallow depth of field, and high-quality puppet-style animation",
                 "No LoRA",
-                "16:9",
                 "Image-to-Video",
                 None,
                 None,
@@ -2354,7 +2379,7 @@ with gr.Blocks(title="LTX-2 Video Distilled 🎥🔈") as demo:
         input_image_debug=gr.Image(type="filepath", label="Image Debug")
         input_audio_debug = gr.Audio(label="Audio Debug", type="filepath")
         input_video_debug=gr.Video(label="Video Debug")
-        total_second_length_debug=gr.Slider(label="Duration Debug", minimum=1, maximum=120, value=7, step=0.1)
         resolution_debug = gr.Dropdown(
                             choices=[
                                 ["16:9", "16:9"],

 def generate_video_example_debug(input_image, prompt, camera_lora, resolution, radioanimated_mode, input_video, input_audio, progress=gr.Progress(track_tqdm=True)):
     allocation_time = None
+    total_second_length = None
     if input_image_debug_value[0] is not None or input_audio_debug_value[0] is not None or input_video_debug_value[0] is not None or prompt_debug_value[0] is not None or total_second_length_debug_value[0] is not None or allocation_time_debug_value[0] is not None or resolution_debug_value[0] is not None or factor_debug_value[0] is not None:
         input_image = input_image_debug_value[0]
         input_audio = input_audio_debug_value[0]
         input_video = input_video_debug_value[0]
         prompt = prompt_debug_value[0]
+        total_second_length = total_second_length_debug_value[0]
         resolution = resolution_debug_value[0]
         allocation_time = allocation_time_debug_value[0]
+    return generate_video_example(input_image, prompt, camera_lora, resolution, radioanimated_mode, input_video, input_audio, total_second_length, allocation_time)
+def generate_video_example(input_image, prompt, camera_lora, resolution, radioanimated_mode, input_video, input_audio, total_second_length=5, allocation_time=None, progress=gr.Progress(track_tqdm=True)):
     w, h = apply_resolution(resolution)
             w,
             camera_lora,
             input_audio,
+            total_second_length,
             allocation_time,
             progress
         )
     width,
     camera_lora,
     audio_path,
+    total_second_length = None,
+    allocation_time = None,
+    progress = None
 ):
     if allocation_time is not None:
         allocation_time
     width: int = DEFAULT_1_STAGE_WIDTH,
     camera_lora: str = "No LoRA",
     audio_path = None,
+    total_second_length = None,
     allocation_time = None,
     progress=gr.Progress(track_tqdm=True),
 ):
         gr.Info("15s not avaiable when a LoRA or lipsync is activated, reducing to 10s for this generation")
         duration = 10
+    if total_second_length is not None:
+        duration = total_second_length
     if audio_path is None:
         print(f'generating with duration:{duration} and LoRA:{camera_lora} in {width}x{height}')
     else:
         examples=[
             [
                 "supergirl-2.png",
+                "A woman wakes up.",
                 "Static",
                 "16:9",
                 "Image-to-Video",
                 None,
                 "supergirl.m4a"
             ],
+            [
+                "supergirl-2.png",
+                "A woman speaks.",
+                "Static",
+                "16:9",
+                "Image-to-Video",
+                None,
+                None
+            ],
+            [
+                "supergirl-2.png",
+                "A woman speaks.",
+                "Static",
+                "16:9",
+                "Image-to-Video",
+                None,
+                None
+            ],
             [
                 "supergirl.png",
+                "A woman is stuck.",
                 "No LoRA",
+                "9:16",
                 "Image-to-Video",
                 None,
                 None,
         input_image_debug=gr.Image(type="filepath", label="Image Debug")
         input_audio_debug = gr.Audio(label="Audio Debug", type="filepath")
         input_video_debug=gr.Video(label="Video Debug")
+        total_second_length_debug=gr.Slider(label="Duration Debug", minimum=1, maximum=120, value=15, step=0.1)
         resolution_debug = gr.Dropdown(
                             choices=[
                                 ["16:9", "16:9"],