Spaces:

Ibou17
/

AgentScan_AI

Running

Ibou17 committed on Apr 9

Commit

fed2739

1 Parent(s): e4d7f15

Force TinyLlama for CPU deployment

Files changed (1) hide show

app.py CHANGED Viewed

@@ -71,7 +71,7 @@ def generate_text(model, tokenizer, prompt, max_new_tokens=150, temperature=0.1)
 # Chargement au démarrage (utilise TinyLlama si pas de GPU pour éviter OOM)
 print("Chargement du modèle...")
 try:
-    if torch.cuda.is_available():
         model, tokenizer = load_model("biomistral", quantize=True)
         print(f"✅ BioMistral-7B chargé — GPU: {torch.cuda.get_device_name(0)}")
     else:
@@ -376,7 +376,7 @@ def run_pipeline(text, synth_lang="fr", agents_enabled=None):
     }
     gc.collect()
-    if torch.cuda.is_available():
         torch.cuda.empty_cache()
     return R

 # Chargement au démarrage (utilise TinyLlama si pas de GPU pour éviter OOM)
 print("Chargement du modèle...")
 try:
+    if False:  # Force TinyLlama on CPU
         model, tokenizer = load_model("biomistral", quantize=True)
         print(f"✅ BioMistral-7B chargé — GPU: {torch.cuda.get_device_name(0)}")
     else:
     }
     gc.collect()
+    if False:  # Force TinyLlama on CPU
         torch.cuda.empty_cache()
     return R