Spaces:

QHL067
/

CrossFlow

Paused

App Files Files Community

QHL067 committed on Mar 14, 2025

Commit

9666147

1 Parent(s): 9b01db5

addition

Browse files

Files changed (1) hide show

app.py +79 -3

app.py CHANGED Viewed

@@ -282,9 +282,9 @@ with gr.Blocks(css=css) as demo:
     with gr.Column(elem_id="col-container"):
         gr.Markdown("# CrossFlow")
         gr.Markdown("[CrossFlow](https://cross-flow.github.io/) directly transforms text representations into images for text-to-image generation, without the need for both the noise distribution and conditioning mechanism.")
         with gr.Tabs():
-            with gr.Tab("Linear interpolation"):
-                gr.Markdown("This allows interpolation in the input text latent space, as demonstrated here.")
                 gr.Markdown("This demo uses 256px images, 25 sampling steps (instead of 50), and 10 interpolations (instead of 50) to conserve GPU memory. For better results, see the original [code](https://github.com/qihao067/CrossFlow). (You may adjust them in Advanced Settings, but doing so may trigger OOM errors.)")
                 # gr.Markdown("CrossFlow directly transforms text representations into images for text-to-image generation, enabling interpolation in the input text latent space.")
@@ -354,7 +354,83 @@ with gr.Blocks(css=css) as demo:
             with gr.Tab("Arithmetic Operations"):
                 # The second tab is currently empty. You can add more components later.
-                gr.Markdown("This tab is intentionally left empty.")
     gr.on(
         triggers=[run_button.click, prompt1.submit, prompt2.submit],

     with gr.Column(elem_id="col-container"):
         gr.Markdown("# CrossFlow")
         gr.Markdown("[CrossFlow](https://cross-flow.github.io/) directly transforms text representations into images for text-to-image generation, without the need for both the noise distribution and conditioning mechanism.")
+        gr.Markdown("This direct mapping enables meaningful 'Linear Interpolation' and 'Arithmetic Operations' in the text latent space, as demonstrated here.")
         with gr.Tabs():
+            with gr.Tab("Linear Interpolation"):
                 gr.Markdown("This demo uses 256px images, 25 sampling steps (instead of 50), and 10 interpolations (instead of 50) to conserve GPU memory. For better results, see the original [code](https://github.com/qihao067/CrossFlow). (You may adjust them in Advanced Settings, but doing so may trigger OOM errors.)")
                 # gr.Markdown("CrossFlow directly transforms text representations into images for text-to-image generation, enabling interpolation in the input text latent space.")
             with gr.Tab("Arithmetic Operations"):
                 # Second tab: addition/subtraction between the text latents of two prompts.
+                gr.Markdown("This demo only supports addition or subtraction between two text latents ('Prompt_1 + Prompt_2' or 'Prompt_1 - Prompt_2'). For the other arithmetic operations, see the original [code](https://github.com/qihao067/CrossFlow).")
+                with gr.Row():
+                    prompt1 = gr.Text(
+                        label="Prompt_1",
+                        show_label=False,
+                        max_lines=1,
+                        placeholder="Enter your prompt for the first image",
+                        container=False,
+                    )
+                with gr.Row():
+                    prompt2 = gr.Text(
+                        label="Prompt_2",
+                        show_label=False,
+                        max_lines=1,
+                        placeholder="Enter your prompt for the second image",
+                        container=False,
+                    )
+                with gr.Row():
+                    operation_mode = gr.Radio(
+                        choices=["Addition", "Subtraction"],
+                        label="Operation Mode",
+                        value="Addition",
+                    )
+                with gr.Row():
+                    run_button = gr.Button("Run", scale=0, variant="primary")
+                # Create separate outputs for the first image, last image, and the animated GIF
+                first_image_output = gr.Image(label="Image of the first prompt", show_label=True)
+                last_image_output = gr.Image(label="Image of the second prompt", show_label=True)
+                gif_output = gr.Image(label="Linear interpolation", show_label=True)
+                with gr.Accordion("Advanced Settings", open=False):
+                    seed = gr.Slider(
+                        label="Seed",
+                        minimum=0,
+                        maximum=MAX_SEED,
+                        step=1,
+                        value=0,
+                    )
+                    randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                    with gr.Row():
+                        guidance_scale = gr.Slider(
+                            label="Guidance scale",
+                            minimum=0.0,
+                            maximum=10.0,
+                            step=0.1,
+                            value=7.0,  # Replace with defaults that work for your model
+                        )
+                    # with gr.Row():
+                    #     num_inference_steps = gr.Slider(
+                    #         label="Number of inference steps - 50 inference steps are recommended; but you can reduce to 20 if the demo fails.",
+                    #         minimum=1,
+                    #         maximum=50,
+                    #         step=1,
+                    #         value=55,  # Replace with defaults that work for your model
+                    #     )
+                    if operation_mode == "Addition":
+                        num_inference_steps = -1
+                    elif operation_mode == "Subtraction":
+                        num_inference_steps = -2
+                    else:
+                        num_inference_steps = 0
+                    with gr.Row():
+                        num_of_interpolation = gr.Slider(
+                            label="Number of images for interpolation - More images yield smoother transitions but require more resources and may fail.",
+                            minimum=5,
+                            maximum=50,
+                            step=1,
+                            value=50,  # Replace with defaults that work for your model
+                        )
+                gr.Examples(examples=examples, inputs=[prompt1, prompt2])
     gr.on(
         triggers=[run_button.click, prompt1.submit, prompt2.submit],