Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -44,11 +44,13 @@ class LLMManager:
|
|
| 44 |
actual_gb = actual_size / (1024*1024*1024)
|
| 45 |
logging.info(f"📊 Tamaño descargado para {model_name}: {actual_gb:.2f} GB")
|
| 46 |
|
|
|
|
|
|
|
| 47 |
logging.info(f"🔄 Cargando {model_name} en RAM…")
|
| 48 |
llm_instance = Llama(
|
| 49 |
model_path=temp_path,
|
| 50 |
n_ctx=MAX_CONTEXT_TOKENS,
|
| 51 |
-
n_batch=
|
| 52 |
n_threads=2,
|
| 53 |
n_threads_batch=2,
|
| 54 |
use_mlock=True,
|
|
|
|
| 44 |
actual_gb = actual_size / (1024*1024*1024)
|
| 45 |
logging.info(f"📊 Tamaño descargado para {model_name}: {actual_gb:.2f} GB")
|
| 46 |
|
| 47 |
+
n_batch = model_config.get("n_batch", 96)
|
| 48 |
+
|
| 49 |
logging.info(f"🔄 Cargando {model_name} en RAM…")
|
| 50 |
llm_instance = Llama(
|
| 51 |
model_path=temp_path,
|
| 52 |
n_ctx=MAX_CONTEXT_TOKENS,
|
| 53 |
+
n_batch=n_batch,
|
| 54 |
n_threads=2,
|
| 55 |
n_threads_batch=2,
|
| 56 |
use_mlock=True,
|