ACE-Step-1.5

Running on Zero

ChuxiJ committed on Feb 20

Commit

6813c41

1 Parent(s): b7a9cc9

fix: move @spaces.GPU decorators to local wrappers to fix ZeroGPU pickling error

On ZeroGPU, Gradio serializes (pickles) event handler functions to send
them to GPU worker processes. When fn= was a lambda capturing dit_handler,
Python tried to pickle the entire handler, including AceStepDiTModel, which
contains unpicklable local objects defined in __init__, causing:
'Can't pickle local object AceStepDiTModel.__init__'

Fix: Remove @_get_spaces_gpu_decorator from module-level functions and
instead apply it to local wrapper functions defined inside
setup_event_handlers(), passed directly as fn= (same pattern as the
working generation_wrapper).

Affected handlers:
- process_source_audio (Analyze button)
- handle_create_sample (Create Sample button)
- handle_format_sample (Format button)
- calculate_score_handler_with_selection (Score buttons)
- generate_lrc_handler (LRC buttons)

Files changed (3) hide show

acestep/gradio_ui/events/__init__.py +37 -13
acestep/gradio_ui/events/generation_handlers.py +0 -3
acestep/gradio_ui/events/results_handlers.py +0 -2

acestep/gradio_ui/events/__init__.py CHANGED Viewed

@@ -263,10 +263,14 @@ def setup_event_handlers(demo, dit_handler, llm_handler, dataset_handler, datase
     # ========== Format Button ==========
     # Note: cfg_scale and negative_prompt are not supported in format mode
-    generation_section["format_btn"].click(
-        fn=lambda caption, lyrics, bpm, duration, key_scale, time_sig, temp, top_k, top_p, debug: gen_h.handle_format_sample(
             llm_handler, caption, lyrics, bpm, duration, key_scale, time_sig, temp, top_k, top_p, debug
-        ),
         inputs=[
             generation_section["captions"],
             generation_section["lyrics"],
@@ -312,8 +316,16 @@ def setup_event_handlers(demo, dit_handler, llm_handler, dataset_handler, datase
     # ========== Process Source Audio Button ==========
     # Combines Convert to Codes + Transcribe in one step
     generation_section["process_src_btn"].click(
-        fn=lambda src, debug: gen_h.process_source_audio(dit_handler, llm_handler, src, debug),
         inputs=[
             generation_section["src_audio"],
             generation_section["constrained_decoding_debug"]
@@ -353,10 +365,14 @@ def setup_event_handlers(demo, dit_handler, llm_handler, dataset_handler, datase
     # ========== Create Sample Button (Simple Mode) ==========
     # Note: cfg_scale and negative_prompt are not supported in create_sample mode
-    generation_section["create_sample_btn"].click(
-        fn=lambda query, instrumental, vocal_lang, temp, top_k, top_p, debug: gen_h.handle_create_sample(
             llm_handler, query, instrumental, vocal_lang, temp, top_k, top_p, debug
-        ),
         inputs=[
             generation_section["simple_query_input"],
             generation_section["simple_instrumental_checkbox"],
@@ -593,10 +609,15 @@ def setup_event_handlers(demo, dit_handler, llm_handler, dataset_handler, datase
     # ========== Score Calculation Handlers ==========
     # Use default argument to capture btn_idx value at definition time (Python closure fix)
     def make_score_handler(idx):
-        return lambda scale, batch_idx, queue: res_h.calculate_score_handler_with_selection(
-            dit_handler, llm_handler, idx, scale, batch_idx, queue
-        )
     for btn_idx in range(1, 9):
         results_section[f"score_btn_{btn_idx}"].click(
@@ -616,9 +637,12 @@ def setup_event_handlers(demo, dit_handler, llm_handler, dataset_handler, datase
     # ========== LRC Timestamp Handlers ==========
     # Use default argument to capture btn_idx value at definition time (Python closure fix)
     def make_lrc_handler(idx):
-        return lambda batch_idx, queue, vocal_lang, infer_steps: res_h.generate_lrc_handler(
-            dit_handler, idx, batch_idx, queue, vocal_lang, infer_steps
-        )
     for btn_idx in range(1, 9):
         results_section[f"lrc_btn_{btn_idx}"].click(

     # ========== Format Button ==========
     # Note: cfg_scale and negative_prompt are not supported in format mode
+    @_get_spaces_gpu_decorator(duration=180)
+    def handle_format_sample_wrapper(caption, lyrics, bpm, duration, key_scale, time_sig, temp, top_k, top_p, debug):
+        return gen_h.handle_format_sample(
             llm_handler, caption, lyrics, bpm, duration, key_scale, time_sig, temp, top_k, top_p, debug
+        )
+    generation_section["format_btn"].click(
+        fn=handle_format_sample_wrapper,
         inputs=[
             generation_section["captions"],
             generation_section["lyrics"],
     # ========== Process Source Audio Button ==========
     # Combines Convert to Codes + Transcribe in one step
+    # Note: @spaces.GPU decorator must be on the function passed directly to fn=,
+    # not on a module-level function wrapped in a lambda. Lambdas capturing handler
+    # objects cause pickling errors on ZeroGPU because the model contains unpicklable
+    # local objects (e.g. AceStepDiTModel.__init__ lambdas).
+    @_get_spaces_gpu_decorator(duration=180)
+    def process_source_audio_wrapper(src, debug):
+        return gen_h.process_source_audio(dit_handler, llm_handler, src, debug)
     generation_section["process_src_btn"].click(
+        fn=process_source_audio_wrapper,
         inputs=[
             generation_section["src_audio"],
             generation_section["constrained_decoding_debug"]
     # ========== Create Sample Button (Simple Mode) ==========
     # Note: cfg_scale and negative_prompt are not supported in create_sample mode
+    @_get_spaces_gpu_decorator(duration=180)
+    def handle_create_sample_wrapper(query, instrumental, vocal_lang, temp, top_k, top_p, debug):
+        return gen_h.handle_create_sample(
             llm_handler, query, instrumental, vocal_lang, temp, top_k, top_p, debug
+        )
+    generation_section["create_sample_btn"].click(
+        fn=handle_create_sample_wrapper,
         inputs=[
             generation_section["simple_query_input"],
             generation_section["simple_instrumental_checkbox"],
     # ========== Score Calculation Handlers ==========
     # Use default argument to capture btn_idx value at definition time (Python closure fix)
+    # Note: @spaces.GPU decorator applied here (not on module-level function) to avoid
+    # pickling issues on ZeroGPU when handler objects are captured in closures.
     def make_score_handler(idx):
+        @_get_spaces_gpu_decorator(duration=240)
+        def score_handler(scale, batch_idx, queue):
+            return res_h.calculate_score_handler_with_selection(
+                dit_handler, llm_handler, idx, scale, batch_idx, queue
+            )
+        return score_handler
     for btn_idx in range(1, 9):
         results_section[f"score_btn_{btn_idx}"].click(
     # ========== LRC Timestamp Handlers ==========
     # Use default argument to capture btn_idx value at definition time (Python closure fix)
     def make_lrc_handler(idx):
+        @_get_spaces_gpu_decorator(duration=240)
+        def lrc_handler(batch_idx, queue, vocal_lang, infer_steps):
+            return res_h.generate_lrc_handler(
+                dit_handler, idx, batch_idx, queue, vocal_lang, infer_steps
+            )
+        return lrc_handler
     for btn_idx in range(1, 9):
         results_section[f"lrc_btn_{btn_idx}"].click(

acestep/gradio_ui/events/generation_handlers.py CHANGED Viewed

@@ -766,7 +766,6 @@ def handle_generation_mode_change(mode: str):
         think_checkbox_update,  # think_checkbox - disabled for cover/repaint modes
     )
-@_get_spaces_gpu_decorator(duration=180)
 def process_source_audio(dit_handler, llm_handler, src_audio, constrained_decoding_debug):
     """
     Process source audio: convert to codes and then transcribe.
@@ -819,7 +818,6 @@ def process_source_audio(dit_handler, llm_handler, src_audio, constrained_decodi
         True  # Set is_format_caption to True
     )
-@_get_spaces_gpu_decorator(duration=180)
 def handle_create_sample(
     llm_handler,
     query: str,
@@ -949,7 +947,6 @@ def handle_create_sample(
         result.status_message,  # status_output
     )
-@_get_spaces_gpu_decorator(duration=180)
 def handle_format_sample(
     llm_handler,
     caption: str,

         think_checkbox_update,  # think_checkbox - disabled for cover/repaint modes
     )
 def process_source_audio(dit_handler, llm_handler, src_audio, constrained_decoding_debug):
     """
     Process source audio: convert to codes and then transcribe.
         True  # Set is_format_caption to True
     )
 def handle_create_sample(
     llm_handler,
     query: str,
         result.status_message,  # status_output
     )
 def handle_format_sample(
     llm_handler,
     caption: str,

acestep/gradio_ui/events/results_handlers.py CHANGED Viewed

@@ -1058,7 +1058,6 @@ def calculate_score_handler(
         error_msg = t("messages.score_error", error=str(e)) + f"\n{traceback.format_exc()}"
         return error_msg
-@_get_spaces_gpu_decorator(duration=240)
 def calculate_score_handler_with_selection(
         dit_handler,
         llm_handler,
@@ -1172,7 +1171,6 @@ def calculate_score_handler_with_selection(
         batch_queue
     )
-@_get_spaces_gpu_decorator(duration=240)
 def generate_lrc_handler(dit_handler, sample_idx, current_batch_index, batch_queue, vocal_language, inference_steps):
     """
     Generate LRC timestamps for a specific audio sample.

         error_msg = t("messages.score_error", error=str(e)) + f"\n{traceback.format_exc()}"
         return error_msg
 def calculate_score_handler_with_selection(
         dit_handler,
         llm_handler,
         batch_queue
     )
 def generate_lrc_handler(dit_handler, sample_idx, current_batch_index, batch_queue, vocal_language, inference_steps):
     """
     Generate LRC timestamps for a specific audio sample.