Spaces:
Running on Zero
Running on Zero
Fix: set the attention implementation to sdpa after loading the model (flash_attn is not installed)
Browse files
app.py
CHANGED
|
@@ -40,6 +40,7 @@ tts_model = AutoModelForCausalLM.from_pretrained(
|
|
| 40 |
low_cpu_mem_usage=True,
|
| 41 |
)
|
| 42 |
tts_model.eval()
|
|
|
|
| 43 |
|
| 44 |
logger.info("Loading audio tokenizer: %s", AUDIO_TOKENIZER_ID)
|
| 45 |
audio_tokenizer = AutoModel.from_pretrained(
|
|
|
|
| 40 |
low_cpu_mem_usage=True,
|
| 41 |
)
|
| 42 |
tts_model.eval()
|
| 43 |
+
tts_model._set_attention_implementation("sdpa") # flash_attn not installed; sdpa is always available
|
| 44 |
|
| 45 |
logger.info("Loading audio tokenizer: %s", AUDIO_TOKENIZER_ID)
|
| 46 |
audio_tokenizer = AutoModel.from_pretrained(
|