philschmid
/

sagemaker-models

Update model.json with amazon/FalconLite instance recommendation

by jinyolim - opened Aug 2, 2023

←

Files changed (1) hide show

model.json CHANGED Viewed

@@ -1,37 +1,41 @@
 {
-	"inference":{
-		"gpt2":{
-			"instanceType":"ml.g4dn.xlarge",
-			"numShard": 1
-		 },
-	   "google/flan-t5-xxl":{
-		  "instanceType":"ml.g5.12xlarge",
-		  "numShard": 4
-	   },
-	   "bigscience/bloom-7b1":{
-		"instanceType":"ml.g5.12xlarge",
-		"numShard": 4
-	 },
-	 "EleutherAI/gpt-neo-2.7B":{
-		"instanceType":"ml.g5.xlarge",
-		"numShard": 1
-	 },
-	 "tiiuae/falcon-40b-instruct":{
-		"instanceType":"ml.g5.12xlarge",
-		"numShard": 4
-	 },
-	 "EleutherAI/gpt-neox-20b":{
-		"instanceType":"ml.g5.12xlarge",
-		"numShard": 4
-	 },
-	 "bigcode/starcoder":{
-		"instanceType":"ml.g5.12xlarge",
-		"numShard": 4
-	 },
-	 "openlm-research/open_llama_13b":{
-		"instanceType":"ml.g5.12xlarge",
-		"numShard": 4
-	 }
-	},
-	"training":{}
- }

 {
+  "inference": {
+    "gpt2": {
+      "instanceType": "ml.g4dn.xlarge",
+      "numShard": 1
+    },
+    "google/flan-t5-xxl": {
+      "instanceType": "ml.g5.12xlarge",
+      "numShard": 4
+    },
+    "bigscience/bloom-7b1": {
+      "instanceType": "ml.g5.12xlarge",
+      "numShard": 4
+    },
+    "EleutherAI/gpt-neo-2.7B": {
+      "instanceType": "ml.g5.xlarge",
+      "numShard": 1
+    },
+    "tiiuae/falcon-40b-instruct": {
+      "instanceType": "ml.g5.12xlarge",
+      "numShard": 4
+    },
+    "EleutherAI/gpt-neox-20b": {
+      "instanceType": "ml.g5.12xlarge",
+      "numShard": 4
+    },
+    "bigcode/starcoder": {
+      "instanceType": "ml.g5.12xlarge",
+      "numShard": 4
+    },
+    "openlm-research/open_llama_13b": {
+      "instanceType": "ml.g5.12xlarge",
+      "numShard": 4
+    },
+    "amazon/FalconLite": {
+      "instanceType": "ml.g5.12xlarge",
+      "numShard": 4
+    }
+  },
+  "training": {}
+}