Add config
Browse files- config.json +3 -18
config.json
CHANGED
|
@@ -12,37 +12,22 @@
|
|
| 12 |
},
|
| 13 |
"pipeline_tag": "text-classification",
|
| 14 |
"version": "1.0.0",
|
| 15 |
-
"last_updated": "2025-03-13
|
| 16 |
"last_updated_by": "latishab",
|
| 17 |
"formats_available": [
|
| 18 |
"pytorch",
|
| 19 |
"onnx",
|
| 20 |
-
"onnx_quantized"
|
| 21 |
-
"gguf"
|
| 22 |
],
|
| 23 |
"inference_config": {
|
| 24 |
"task_type": "text-classification",
|
| 25 |
"runtime": "2.1",
|
| 26 |
"framework": "pytorch",
|
| 27 |
"memory": "auto",
|
| 28 |
-
"conversion_config": {
|
| 29 |
-
"quantization": "int8",
|
| 30 |
-
"optimize_memory": true,
|
| 31 |
-
"optimize_inference": true
|
| 32 |
-
},
|
| 33 |
"deployment": {
|
| 34 |
"instance_type": "cpu-basic",
|
| 35 |
"min_replicas": 1,
|
| 36 |
-
"max_replicas": 3
|
| 37 |
-
"scaling_config": {
|
| 38 |
-
"cpu_utilization": 80,
|
| 39 |
-
"max_concurrent_requests": 100
|
| 40 |
-
}
|
| 41 |
-
},
|
| 42 |
-
"api_config": {
|
| 43 |
-
"timeout": 30,
|
| 44 |
-
"max_tokens": 256,
|
| 45 |
-
"max_batch_size": 32
|
| 46 |
}
|
| 47 |
}
|
| 48 |
}
|
|
|
|
| 12 |
},
|
| 13 |
"pipeline_tag": "text-classification",
|
| 14 |
"version": "1.0.0",
|
| 15 |
+
"last_updated": "2025-03-13 04:24:17",
|
| 16 |
"last_updated_by": "latishab",
|
| 17 |
"formats_available": [
|
| 18 |
"pytorch",
|
| 19 |
"onnx",
|
| 20 |
+
"onnx_quantized"
|
|
|
|
| 21 |
],
|
| 22 |
"inference_config": {
|
| 23 |
"task_type": "text-classification",
|
| 24 |
"runtime": "2.1",
|
| 25 |
"framework": "pytorch",
|
| 26 |
"memory": "auto",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 27 |
"deployment": {
|
| 28 |
"instance_type": "cpu-basic",
|
| 29 |
"min_replicas": 1,
|
| 30 |
+
"max_replicas": 3
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 31 |
}
|
| 32 |
}
|
| 33 |
}
|