Spaces:
Paused
Paused
encryptd committed on
Commit ·
a619f72
1
Parent(s): 9530a76
prog update
Browse files
app.py
CHANGED
|
@@ -40,7 +40,11 @@ def start_vllm():
|
|
| 40 |
"--gpu-memory-utilization", str(GPU_UTILIZATION),
|
| 41 |
"--max-model-len", str(MAX_MODEL_LEN),
|
| 42 |
"--dtype", "bfloat16",
|
| 43 |
-
"--limit-mm-per-prompt", '{"image": 1}'
|
|
|
|
|
|
|
|
|
|
|
|
|
| 44 |
]
|
| 45 |
# Connect vLLM logs to the HF console logs
|
| 46 |
subprocess.Popen(command, stdout=sys.stdout, stderr=sys.stderr)
|
|
|
|
| 40 |
"--gpu-memory-utilization", str(GPU_UTILIZATION),
|
| 41 |
"--max-model-len", str(MAX_MODEL_LEN),
|
| 42 |
"--dtype", "bfloat16",
|
| 43 |
+
"--limit-mm-per-prompt", '{"image": 1}',
|
| 44 |
+
# === Fix for Qwen2-VL Image Processor Warning ===
|
| 45 |
+
"--mm-processor-kwargs", '{"use_fast": true}',
|
| 46 |
+
# Optional but helpful
|
| 47 |
+
"--enforce-eager"
|
| 48 |
]
|
| 49 |
# Connect vLLM logs to the HF console logs
|
| 50 |
subprocess.Popen(command, stdout=sys.stdout, stderr=sys.stderr)
|