addition
Browse files
app.py
CHANGED
|
@@ -282,9 +282,9 @@ with gr.Blocks(css=css) as demo:
|
|
| 282 |
with gr.Column(elem_id="col-container"):
|
| 283 |
gr.Markdown("# CrossFlow")
|
| 284 |
gr.Markdown("[CrossFlow](https://cross-flow.github.io/) directly transforms text representations into images for text-to-image generation, without the need for both the noise distribution and conditioning mechanism.")
|
|
|
|
| 285 |
with gr.Tabs():
|
| 286 |
-
with gr.Tab("Linear
|
| 287 |
-
gr.Markdown("This allows interpolation in the input text latent space, as demonstrated here.")
|
| 288 |
gr.Markdown("This demo uses 256px images, 25 sampling steps (instead of 50), and 10 interpolations (instead of 50) to conserve GPU memory. For better results, see the original [code](https://github.com/qihao067/CrossFlow). (You may adjust them in Advanced Settings, but doing so may trigger OOM errors.)")
|
| 289 |
# gr.Markdown("CrossFlow directly transforms text representations into images for text-to-image generation, enabling interpolation in the input text latent space.")
|
| 290 |
|
|
@@ -354,7 +354,83 @@ with gr.Blocks(css=css) as demo:
|
|
| 354 |
|
| 355 |
with gr.Tab("Arithmetic Operations"):
|
| 356 |
# The second tab is currently empty. You can add more components later.
|
| 357 |
-
gr.Markdown("This
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 358 |
|
| 359 |
gr.on(
|
| 360 |
triggers=[run_button.click, prompt1.submit, prompt2.submit],
|
|
|
|
| 282 |
with gr.Column(elem_id="col-container"):
|
| 283 |
gr.Markdown("# CrossFlow")
|
| 284 |
gr.Markdown("[CrossFlow](https://cross-flow.github.io/) directly transforms text representations into images for text-to-image generation, without the need for both the noise distribution and conditioning mechanism.")
|
| 285 |
+
gr.Markdown("This direct mapping enables meaningful 'Linear Interpolation' and 'Arithmetic Operations' in the text latent space, as demonstrated here.")
|
| 286 |
with gr.Tabs():
|
| 287 |
+
with gr.Tab("Linear Interpolation"):
|
|
|
|
| 288 |
gr.Markdown("This demo uses 256px images, 25 sampling steps (instead of 50), and 10 interpolations (instead of 50) to conserve GPU memory. For better results, see the original [code](https://github.com/qihao067/CrossFlow). (You may adjust them in Advanced Settings, but doing so may trigger OOM errors.)")
|
| 289 |
# gr.Markdown("CrossFlow directly transforms text representations into images for text-to-image generation, enabling interpolation in the input text latent space.")
|
| 290 |
|
|
|
|
| 354 |
|
| 355 |
with gr.Tab("Arithmetic Operations"):
|
| 356 |
# The second tab is currently empty. You can add more components later.
|
| 357 |
+
gr.Markdown("This demo only supports addition or subtraction between two text latents ('Prompt_1 + Prompt_2' or 'Prompt_1 - Prompt_2'). For the other arithmetic operations, see the original [code](https://github.com/qihao067/CrossFlow).")
|
| 358 |
+
with gr.Row():
|
| 359 |
+
prompt1 = gr.Text(
|
| 360 |
+
label="Prompt_1",
|
| 361 |
+
show_label=False,
|
| 362 |
+
max_lines=1,
|
| 363 |
+
placeholder="Enter your prompt for the first image",
|
| 364 |
+
container=False,
|
| 365 |
+
)
|
| 366 |
+
|
| 367 |
+
with gr.Row():
|
| 368 |
+
prompt2 = gr.Text(
|
| 369 |
+
label="Prompt_2",
|
| 370 |
+
show_label=False,
|
| 371 |
+
max_lines=1,
|
| 372 |
+
placeholder="Enter your prompt for the second image",
|
| 373 |
+
container=False,
|
| 374 |
+
)
|
| 375 |
+
|
| 376 |
+
with gr.Row():
|
| 377 |
+
operation_mode = gr.Radio(
|
| 378 |
+
choices=["Addition", "Subtraction"],
|
| 379 |
+
label="Operation Mode",
|
| 380 |
+
value="Addition",
|
| 381 |
+
)
|
| 382 |
+
with gr.Row():
|
| 383 |
+
run_button = gr.Button("Run", scale=0, variant="primary")
|
| 384 |
+
|
| 385 |
+
# Create separate outputs for the first image, last image, and the animated GIF
|
| 386 |
+
first_image_output = gr.Image(label="Image of the first prompt", show_label=True)
|
| 387 |
+
last_image_output = gr.Image(label="Image of the second prompt", show_label=True)
|
| 388 |
+
gif_output = gr.Image(label="Linear interpolation", show_label=True)
|
| 389 |
+
|
| 390 |
+
with gr.Accordion("Advanced Settings", open=False):
|
| 391 |
+
seed = gr.Slider(
|
| 392 |
+
label="Seed",
|
| 393 |
+
minimum=0,
|
| 394 |
+
maximum=MAX_SEED,
|
| 395 |
+
step=1,
|
| 396 |
+
value=0,
|
| 397 |
+
)
|
| 398 |
+
|
| 399 |
+
randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
|
| 400 |
+
|
| 401 |
+
with gr.Row():
|
| 402 |
+
guidance_scale = gr.Slider(
|
| 403 |
+
label="Guidance scale",
|
| 404 |
+
minimum=0.0,
|
| 405 |
+
maximum=10.0,
|
| 406 |
+
step=0.1,
|
| 407 |
+
value=7.0, # Replace with defaults that work for your model
|
| 408 |
+
)
|
| 409 |
+
# with gr.Row():
|
| 410 |
+
# num_inference_steps = gr.Slider(
|
| 411 |
+
# label="Number of inference steps - 50 inference steps are recommended; but you can reduce to 20 if the demo fails.",
|
| 412 |
+
# minimum=1,
|
| 413 |
+
# maximum=50,
|
| 414 |
+
# step=1,
|
| 415 |
+
# value=55, # Replace with defaults that work for your model
|
| 416 |
+
# )
|
| 417 |
+
if operation_mode == "Addition":
|
| 418 |
+
num_inference_steps = -1
|
| 419 |
+
elif operation_mode == "Subtraction":
|
| 420 |
+
num_inference_steps = -2
|
| 421 |
+
else:
|
| 422 |
+
num_inference_steps = 0
|
| 423 |
+
|
| 424 |
+
with gr.Row():
|
| 425 |
+
num_of_interpolation = gr.Slider(
|
| 426 |
+
label="Number of images for interpolation - More images yield smoother transitions but require more resources and may fail.",
|
| 427 |
+
minimum=5,
|
| 428 |
+
maximum=50,
|
| 429 |
+
step=1,
|
| 430 |
+
value=50, # Replace with defaults that work for your model
|
| 431 |
+
)
|
| 432 |
+
|
| 433 |
+
gr.Examples(examples=examples, inputs=[prompt1, prompt2])
|
| 434 |
|
| 435 |
gr.on(
|
| 436 |
triggers=[run_button.click, prompt1.submit, prompt2.submit],
|