victor HF Staff committed on
Commit
749bf48
·
1 Parent(s): 8ee99c8

Fix: set attn_implementation=sdpa (flash_attn not installed)

Browse files
Files changed (1) hide show
  1. app.py +1 -0
app.py CHANGED
@@ -40,6 +40,7 @@ tts_model = AutoModelForCausalLM.from_pretrained(
40
  low_cpu_mem_usage=True,
41
  )
42
  tts_model.eval()
 
43
 
44
  logger.info("Loading audio tokenizer: %s", AUDIO_TOKENIZER_ID)
45
  audio_tokenizer = AutoModel.from_pretrained(
 
40
  low_cpu_mem_usage=True,
41
  )
42
  tts_model.eval()
43
+ tts_model._set_attention_implementation("sdpa") # flash_attn not installed; sdpa is always available
44
 
45
  logger.info("Loading audio tokenizer: %s", AUDIO_TOKENIZER_ID)
46
  audio_tokenizer = AutoModel.from_pretrained(