Spaces:

kenlkehl
/

mm-ai-demo

Sleeping

kenlkehl committed on Nov 3

Commit

d9d81e4

verified ·

1 Parent(s): c4d8a31

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -276,7 +276,7 @@ def load_tagger_model(model_path: str) -> Tuple[str, str]:
             device=0 if state.device == "cuda" else -1,
             truncation=True,
             padding="max_length",
-            max_length=512
         )
         return f"✓ Tagger model loaded from {model_path}", ""
     except Exception as e:
@@ -336,8 +336,8 @@ def load_llm_model(model_path: str) -> Tuple[str, str]:
             state.llm_model = LLM(
                 model=model_path,
                 tensor_parallel_size=tp_size,
-                gpu_memory_utilization=0.40,
-                max_model_len=5000
             )
             state.llm_tokenizer = state.llm_model.get_tokenizer()
             return f"✓ LLM loaded from {model_path} (vLLM, tp={tp_size})", ""

             device=0 if state.device == "cuda" else -1,
             truncation=True,
             padding="max_length",
+            max_length=128
         )
         return f"✓ Tagger model loaded from {model_path}", ""
     except Exception as e:
             state.llm_model = LLM(
                 model=model_path,
                 tensor_parallel_size=tp_size,
+                gpu_memory_utilization=0.50,
+                max_model_len=15000
             )
             state.llm_tokenizer = state.llm_model.get_tokenizer()
             return f"✓ LLM loaded from {model_path} (vLLM, tp={tp_size})", ""