Upload folder using huggingface_hub

Browse files

Files changed (3) hide show

added_tokens.json +40 -0
generation_config.json +6 -4
quantize_config.json +103 -0

added_tokens.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "\t\t": 50294,
+  "\t\t\t": 50293,
+  "\t\t\t\t": 50292,
+  "\t\t\t\t\t": 50291,
+  "\t\t\t\t\t\t": 50290,
+  "\t\t\t\t\t\t\t": 50289,
+  "\t\t\t\t\t\t\t\t": 50288,
+  "\t\t\t\t\t\t\t\t\t": 50287,
+  "  ": 50286,
+  "   ": 50285,
+  "    ": 50284,
+  "     ": 50283,
+  "      ": 50282,
+  "       ": 50281,
+  "        ": 50280,
+  "         ": 50279,
+  "          ": 50278,
+  "           ": 50277,
+  "            ": 50276,
+  "             ": 50275,
+  "              ": 50274,
+  "               ": 50273,
+  "                ": 50272,
+  "                 ": 50271,
+  "                  ": 50270,
+  "                   ": 50269,
+  "                    ": 50268,
+  "                     ": 50267,
+  "                      ": 50266,
+  "                       ": 50265,
+  "                        ": 50264,
+  "                         ": 50263,
+  "                          ": 50262,
+  "                           ": 50261,
+  "                            ": 50260,
+  "                             ": 50259,
+  "                              ": 50258,
+  "                               ": 50257
+}

generation_config.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
-  "_from_model_config": true,
-  "bos_token_id": 1,
-  "eos_token_id": 50256,
-  "transformers_version": "4.33.0.dev0"
+  "max_new_tokens": 150,
+  "temperature": 0.9,
+  "top_p": 0.9,
+  "do_sample": true,
+  "num_beams": 1,
+  "early_stopping": true
 }

quantize_config.json ADDED Viewed

	@@ -0,0 +1,103 @@

+{
+    "per_channel": false,
+    "reduce_range": false,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Cast",
+                "Equal",
+                "Sqrt",
+                "Softmax",
+                "Neg",
+                "Reshape",
+                "ReduceMean",
+                "Where",
+                "MatMul",
+                "Slice",
+                "Shape",
+                "Unsqueeze",
+                "Gather",
+                "Sub",
+                "Squeeze",
+                "Mul",
+                "Split",
+                "Expand",
+                "ConstantOfShape",
+                "Concat",
+                "Constant",
+                "Transpose",
+                "Range",
+                "Pow",
+                "Tanh",
+                "Add",
+                "Div"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Cast",
+                "Equal",
+                "Sqrt",
+                "Softmax",
+                "Neg",
+                "Reshape",
+                "ReduceMean",
+                "Where",
+                "MatMul",
+                "Slice",
+                "Shape",
+                "Gather",
+                "Unsqueeze",
+                "Sub",
+                "Squeeze",
+                "Mul",
+                "Split",
+                "Expand",
+                "ConstantOfShape",
+                "Concat",
+                "Constant",
+                "Transpose",
+                "Range",
+                "Pow",
+                "Tanh",
+                "Add",
+                "If",
+                "Div"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Cast",
+                "Equal",
+                "Sqrt",
+                "Softmax",
+                "Neg",
+                "Reshape",
+                "ReduceMean",
+                "Where",
+                "MatMul",
+                "Slice",
+                "Shape",
+                "Unsqueeze",
+                "Gather",
+                "Sub",
+                "Squeeze",
+                "Mul",
+                "Split",
+                "Expand",
+                "ConstantOfShape",
+                "Concat",
+                "Constant",
+                "Transpose",
+                "Range",
+                "Pow",
+                "Tanh",
+                "Add",
+                "Div"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}