Sayoyo committed on
Commit
750d963
·
2 Parent(s): 1fb8172 e012a1d

Merge branch 'fix/cot_caption'

Browse files
Files changed (1) hide show
  1. acestep/api_server.py +14 -6
acestep/api_server.py CHANGED
@@ -640,10 +640,21 @@ def create_app() -> FastAPI:
640
  # Determine if LLM is needed
641
  thinking = bool(req.thinking)
642
  sample_mode = bool(req.sample_mode)
643
- need_llm = thinking or sample_mode
 
 
 
 
 
 
 
 
 
 
 
644
 
645
- print(f"[api_server] Request params: req.thinking={req.thinking}, req.sample_mode={req.sample_mode}")
646
- print(f"[api_server] Determined: thinking={thinking}, sample_mode={sample_mode}, need_llm={need_llm}")
647
 
648
  # Ensure LLM is ready if needed
649
  if need_llm:
@@ -659,9 +670,6 @@ def create_app() -> FastAPI:
659
  time_signature = req.time_signature
660
  audio_duration = req.audio_duration
661
 
662
- # Check if sample_query (description) is provided for create_sample
663
- has_sample_query = bool(req.sample_query and req.sample_query.strip())
664
-
665
  if sample_mode or has_sample_query:
666
  if has_sample_query:
667
  # Use create_sample() with description query
 
640
  # Determine if LLM is needed
641
  thinking = bool(req.thinking)
642
  sample_mode = bool(req.sample_mode)
643
+ has_sample_query = bool(req.sample_query and req.sample_query.strip())
644
+ use_format = bool(req.use_format)
645
+ use_cot_caption = bool(req.use_cot_caption)
646
+ use_cot_language = bool(req.use_cot_language)
647
+
648
+ # LLM is needed for:
649
+ # - thinking mode (LM generates audio codes)
650
+ # - sample_mode (LM generates random caption/lyrics/metas)
651
+ # - sample_query/description (LM generates from description)
652
+ # - use_format (LM enhances caption/lyrics)
653
+ # - use_cot_caption or use_cot_language (LM enhances metadata)
654
+ need_llm = thinking or sample_mode or has_sample_query or use_format or use_cot_caption or use_cot_language
655
 
656
+ print(f"[api_server] Request params: req.thinking={req.thinking}, req.sample_mode={req.sample_mode}, req.use_cot_caption={req.use_cot_caption}, req.use_cot_language={req.use_cot_language}, req.use_format={req.use_format}")
657
+ print(f"[api_server] Determined: thinking={thinking}, sample_mode={sample_mode}, use_cot_caption={use_cot_caption}, use_cot_language={use_cot_language}, use_format={use_format}, need_llm={need_llm}")
658
 
659
  # Ensure LLM is ready if needed
660
  if need_llm:
 
670
  time_signature = req.time_signature
671
  audio_duration = req.audio_duration
672
 
 
 
 
673
  if sample_mode or has_sample_query:
674
  if has_sample_query:
675
  # Use create_sample() with description query