Spaces:

Ronaldodev
/

MobiLLM

Runtime error

Ronaldodev committed on Oct 28, 2025

Commit

dcdbd59

verified ·

1 Parent(s): 5e6267d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,11 +5,20 @@ from fastapi import FastAPI
 from pydantic import BaseModel
 import uvicorn
 import threading
 # --- 1. Charger le modèle ---
-model_name_or_path = "facebook/MobileLLM-Pro"  # ou ton chemin local si téléchargé
-tokenizer = AutoTokenizer.from_pretrained(model_name_or_path)
-model = AutoModelForCausalLM.from_pretrained(model_name_or_path, torch_dtype=torch.float16, device_map="auto")
 model.eval()
 # --- 2. Fonction de prédiction ---
@@ -28,7 +37,7 @@ def launch_gradio():
         title="MobileLLM-Pro Chat",
         description="Interface Gradio pour MobileLLM-Pro"
     )
-    iface.launch(server_name="0.0.0.0", server_port=7860)
 # --- 4. API FastAPI ---
 app = FastAPI()

 from pydantic import BaseModel
 import uvicorn
 import threading
+from huggingface_hub import notebook_login
+# --- 0. Authentification Hugging Face dans le Space ---
+notebook_login()  # ouvre une fenêtre pour te connecter si nécessaire
 # --- 1. Charger le modèle ---
+model_name_or_path = "facebook/MobileLLM-Pro"  # modèle gated
+tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, use_auth_token=True)
+model = AutoModelForCausalLM.from_pretrained(
+    model_name_or_path,
+    use_auth_token=True,
+    torch_dtype=torch.float16,
+    device_map="auto"
+)
 model.eval()
 # --- 2. Fonction de prédiction ---
         title="MobileLLM-Pro Chat",
         description="Interface Gradio pour MobileLLM-Pro"
     )
+    iface.launch(server_name="0.0.0.0", server_port=7860, share=True)  # share=True pour accéder depuis le web
 # --- 4. API FastAPI ---
 app = FastAPI()