TaliDror committed on
Commit ·
8c65b86
1
Parent(s): 28e4085
improved UI
Browse files
app.py
CHANGED
|
@@ -514,9 +514,11 @@ def load_models():
|
|
| 514 |
def build_demo():
|
| 515 |
with gr.Blocks(title="AAS2F: Ambiguity-Aware Speech-to-Face Synthesis with Speaker-Conditioned Diffusion Models") as demo:
|
| 516 |
gr.Markdown("# AAS2F: Ambiguity-Aware Speech-to-Face Synthesis with Speaker-Conditioned Diffusion Models")
|
| 517 |
-
gr.Markdown(
|
| 518 |
-
|
| 519 |
-
|
|
|
|
|
|
|
| 520 |
|
| 521 |
with gr.Row():
|
| 522 |
with gr.Column():
|
|
|
|
| 514 |
def build_demo():
|
| 515 |
with gr.Blocks(title="AAS2F: Ambiguity-Aware Speech-to-Face Synthesis with Speaker-Conditioned Diffusion Models") as demo:
|
| 516 |
gr.Markdown("# AAS2F: Ambiguity-Aware Speech-to-Face Synthesis with Speaker-Conditioned Diffusion Models")
|
| 517 |
+
gr.Markdown(
|
| 518 |
+
"**Steps to use the demo:**\n\n"
|
| 519 |
+
"1. Upload or record a speech audio clip and generate face images conditioned on the speaker's voice. **Please provide at least 5 seconds of speech.** Note that it works best with **English** as the model is trained on English speech, but should work with other languages as well.\n"
|
| 520 |
+
"2. Click the 'Generate' button to start the generation process."
|
| 521 |
+
)
|
| 522 |
|
| 523 |
with gr.Row():
|
| 524 |
with gr.Column():
|