Spaces:
Running
Running
File size: 322 Bytes
"""Shared constants for Modal deployments."""
# Model and hardware selection.
# NOTE(review): MODEL_NAME looks like a Hugging Face repo id and GPU_TYPE like
# a Modal GPU name; confirm against the code that consumes them.
MODEL_NAME: str = "mistralai/Mistral-7B-Instruct-v0.3"
GPU_TYPE: str = "a10g"

# vLLM settings.
# NOTE(review): presumably forwarded to the vLLM engine as max_model_len,
# dtype and gpu_memory_utilization; verify at the call site.
VLLM_MAX_MODEL_LEN: int = 8 * 1024  # 8192
VLLM_DTYPE: str = "half"
VLLM_GPU_MEMORY_UTILIZATION: float = 0.85

# Cost tracking, used for the provider comparison report.
# Approximate Modal A10G price: $0.000361 per second (about $1.30 per hour).
MODAL_A10G_COST_PER_SEC: float = 0.000361
|