Helios-14B-RealTime

Runtime error

BestWishYsh committed on Mar 6

Commit

c02899d

verified ·

1 Parent(s): 3621eec

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -34,20 +34,20 @@ pipe.to("cuda")
 # pipe.transformer.set_attention_backend("flash_hub")
 pipe.transformer.set_attention_backend("_flash_3_hub")
-@spaces.GPU(duration=1500)
-def compile_transformer():
-    with spaces.aoti_capture(pipe.transformer) as call:
-        pipe("arbitrary example prompt")
-    exported = torch.export.export(
-        pipe.transformer,
-        args=call.args,
-        kwargs=call.kwargs,
-    )
-    return spaces.aoti_compile(exported)
-compiled_transformer = compile_transformer()
-spaces.aoti_apply(compiled_transformer, pipe.transformer)
 # ---------------------------------------------------------------------------
 # Generation

 # pipe.transformer.set_attention_backend("flash_hub")
 pipe.transformer.set_attention_backend("_flash_3_hub")
+# @spaces.GPU(duration=1500)
+# def compile_transformer():
+#     with spaces.aoti_capture(pipe.transformer) as call:
+#         pipe("arbitrary example prompt")
+#     exported = torch.export.export(
+#         pipe.transformer,
+#         args=call.args,
+#         kwargs=call.kwargs,
+#     )
+#     return spaces.aoti_compile(exported)
+# compiled_transformer = compile_transformer()
+# spaces.aoti_apply(compiled_transformer, pipe.transformer)
 # ---------------------------------------------------------------------------
 # Generation