DoloresAI-Merged / endpoint.json
busybisi's picture
Upload endpoint.json with huggingface_hub
fbbbc9e verified
{
  "compute": {
    "accelerator": "gpu",
    "instanceSize": "medium",
    "instanceType": "nvidia-a10g",
    "scaling": {
      "minReplica": 0,
      "maxReplica": 1
    }
  },
  "model": {
    "framework": "pytorch",
    "task": "text-generation",
    "image": {
      "huggingface": {}
    }
  },
  "env": {
    "PYTORCH_CUDA_ALLOC_CONF": "expandable_segments:True",
    "TRANSFORMERS_OFFLINE": "0",
    "HF_HUB_ENABLE_HF_TRANSFER": "1",
    "MODEL_LOAD_TIMEOUT": "600"
  }
}