{
  "inference": {
    "gpt2": {
      "instanceType": "ml.g4dn.xlarge",
      "numShard": 1
    },
    "google/flan-t5-xxl": {
      "instanceType": "ml.g5.12xlarge",
      "numShard": 4
    },
    "bigscience/bloom-7b1": {
      "instanceType": "ml.g5.12xlarge",
      "numShard": 4
    },
    "EleutherAI/gpt-neo-2.7B": {
      "instanceType": "ml.g5.xlarge",
      "numShard": 1
    },
    "tiiuae/falcon-40b-instruct": {
      "instanceType": "ml.g5.12xlarge",
      "numShard": 4
    },
    "EleutherAI/gpt-neox-20b": {
      "instanceType": "ml.g5.12xlarge",
      "numShard": 4
    },
    "bigcode/starcoder": {
      "instanceType": "ml.g5.12xlarge",
      "numShard": 4
    },
    "openlm-research/open_llama_13b": {
      "instanceType": "ml.g5.12xlarge",
      "numShard": 4
    },
    "amazon/FalconLite": {
      "instanceType": "ml.g5.12xlarge",
      "numShard": 4
    }
  },
  "training": {}
}