Spaces:
Paused
Paused
Update app.py
Browse files
app.py
CHANGED
|
@@ -216,33 +216,8 @@ controller = FoleyController()
|
|
| 216 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
| 217 |
|
| 218 |
with gr.Blocks(css=css) as demo:
|
| 219 |
-
|
| 220 |
-
'<h1 style="height: 136px; display: flex; align-items: center; justify-content: space-around;"><span style="height: 100%; width:136px;"><img src="file/foleycrafter.png" alt="logo" style="height: 100%; width:auto; object-fit: contain; margin: 0px 0px; padding: 0px 0px;"></span><strong style="font-size: 36px;">FoleyCrafter: Bring Silent Videos to Life with Lifelike and Synchronized Sounds</strong></h1>'
|
| 221 |
-
)
|
| 222 |
-
gr.HTML(
|
| 223 |
-
'<p id="authors" style="text-align:center; font-size:24px;"> \
|
| 224 |
-
<a href="https://github.com/ymzhang0319">Yiming Zhang</a><sup>1</sup>,  \
|
| 225 |
-
<a href="https://github.com/VocodexElysium">Yicheng Gu</a><sup>2</sup>,  \
|
| 226 |
-
<a href="https://zengyh1900.github.io/">Yanhong Zeng</a><sup>1 †</sup>,  \
|
| 227 |
-
<a href="https://github.com/LeoXing1996/">Zhening Xing</a><sup>1</sup>,  \
|
| 228 |
-
<a href="https://github.com/HeCheng0625">Yuancheng Wang</a><sup>2</sup>,  \
|
| 229 |
-
<a href="https://drwuz.com/">Zhizheng Wu</a><sup>2</sup>,  \
|
| 230 |
-
<a href="https://chenkai.site/">Kai Chen</a><sup>1 †</sup>\
|
| 231 |
-
<br>\
|
| 232 |
-
<span>\
|
| 233 |
-
<sup>1</sup>Shanghai AI Laboratory \
|
| 234 |
-
<sup>2</sup>Chinese University of Hong Kong, Shenzhen \
|
| 235 |
-
†Corresponding author\
|
| 236 |
-
</span>\
|
| 237 |
-
</p>'
|
| 238 |
-
)
|
| 239 |
with gr.Row():
|
| 240 |
-
gr.Markdown(
|
| 241 |
-
"<div align='center'><font size='5'><a href='https://foleycrafter.github.io/'>Project Page</a>  " # noqa
|
| 242 |
-
"<a href='https://arxiv.org/abs/2407.01494/'>Paper</a>  "
|
| 243 |
-
"<a href='https://github.com/open-mmlab/foleycrafter'>Code</a>  "
|
| 244 |
-
"<a href='https://huggingface.co/spaces/ymzhang319/FoleyCrafter'>Demo</a> </font></div>"
|
| 245 |
-
)
|
| 246 |
|
| 247 |
with gr.Column(variant="panel"):
|
| 248 |
with gr.Row(equal_height=False):
|
|
@@ -280,16 +255,6 @@ with gr.Blocks(css=css) as demo:
|
|
| 280 |
with gr.Column():
|
| 281 |
result_video = gr.Video(label="Generated Audio", interactive=False)
|
| 282 |
with gr.Row():
|
| 283 |
-
gr.Markdown(
|
| 284 |
-
"<div style='word-spacing: 6px;'><font size='5'><b>Tips</b>: <br> \
|
| 285 |
-
1. With strong temporal visual cues in input video, you can scale up the <b>Temporal Align Scale</b>. <br>\
|
| 286 |
-
2. <b>Visual content scale</b> is the level of semantic alignment with visual content.</font></div> \
|
| 287 |
-
")
|
| 288 |
-
# gr.HTML(
|
| 289 |
-
# '<p style="font-size: 16px;">**Tips**: <br> \
|
| 290 |
-
# 1. With strong temporal visual cues in input video, you can scale up the **Temporal Align Scale**. <br>\
|
| 291 |
-
# 2. **Visual content scale** is the level of semantic alignment with visual content.</p> \
|
| 292 |
-
# ')
|
| 293 |
|
| 294 |
generate_button.click(
|
| 295 |
fn=controller.foley,
|
|
|
|
| 216 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
| 217 |
|
| 218 |
with gr.Blocks(css=css) as demo:
|
| 219 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 220 |
with gr.Row():
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 221 |
|
| 222 |
with gr.Column(variant="panel"):
|
| 223 |
with gr.Row(equal_height=False):
|
|
|
|
| 255 |
with gr.Column():
|
| 256 |
result_video = gr.Video(label="Generated Audio", interactive=False)
|
| 257 |
with gr.Row():
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 258 |
|
| 259 |
generate_button.click(
|
| 260 |
fn=controller.foley,
|