Spaces:

gijs
/

phi4_mm

Runtime error

Gijs Wijngaard committed on Aug 26

Commit

dc6e6db

1 Parent(s): eaf61fe

init

Files changed (1) hide show

app.py CHANGED Viewed

@@ -17,10 +17,12 @@ model = AutoModelForCausalLM.from_pretrained(
     MODEL_ID,
     device_map="cuda" if torch.cuda.is_available() else "cpu",
     torch_dtype="auto",
-    trust_remote_code=True,
     _attn_implementation="flash_attention_2",
 )
 generation_config = GenerationConfig.from_pretrained(MODEL_ID)
 @spaces.GPU

     MODEL_ID,
     device_map="cuda" if torch.cuda.is_available() else "cpu",
     torch_dtype="auto",
     _attn_implementation="flash_attention_2",
 )
+model.load_adapter(MODEL_ID, adapter_name="speech", device_map="cuda" if torch.cuda.is_available() else "cpu", adapter_kwargs={"subfolder": 'speech-lora'})
+model.set_adapter("speech")
 generation_config = GenerationConfig.from_pretrained(MODEL_ID)
 @spaces.GPU