onnx-community/InternLM2-ONNX · InternLM2 - 1.8B, 7B AWQ-int4 ONNX export

Files changed (18) hide show

{internlm2-1.8b-cpu-int4 → internlm2-1.8b-cpu-int4-awq}/genai_config.json RENAMED Viewed

@@ -27,7 +27,7 @@
         },
         "eos_token_id": 2,
         "pad_token_id": 2,
-        "type": "internlm2",
         "vocab_size": 92544
     },
     "search": {

         },
         "eos_token_id": 2,
         "pad_token_id": 2,
+        "type": "llama",
         "vocab_size": 92544
     },
     "search": {

{internlm2-7b-cpu-int4 → internlm2-1.8b-cpu-int4-awq}/model.onnx RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f7c952a2498956d1b1580f0687ffc8d56ea103ef3e11b13dcecb53632c7652de
-size 240378

 version https://git-lfs.github.com/spec/v1
+oid sha256:90f55a90d9e73491e9aa0dbb88098a20b8def5f9c6c129f9b2effb42f9f0fac0
+size 179593

{internlm2-1.8b-cpu-int4 → internlm2-1.8b-cpu-int4-awq}/model.onnx.data RENAMED Viewed

File without changes

{internlm2-1.8b-cpu-int4 → internlm2-1.8b-cpu-int4-awq}/special_tokens_map.json RENAMED Viewed

File without changes

{internlm2-1.8b-cpu-int4 → internlm2-1.8b-cpu-int4-awq}/tokenization_internlm2.py RENAMED Viewed

File without changes

{internlm2-1.8b-cpu-int4 → internlm2-1.8b-cpu-int4-awq}/tokenization_internlm2_fast.py RENAMED Viewed

File without changes

{internlm2-1.8b-cpu-int4 → internlm2-1.8b-cpu-int4-awq}/tokenizer.json RENAMED Viewed

File without changes

{internlm2-1.8b-cpu-int4 → internlm2-1.8b-cpu-int4-awq}/tokenizer.model RENAMED Viewed

File without changes

{internlm2-7b-cpu-int4 → internlm2-1.8b-cpu-int4-awq}/tokenizer_config.json RENAMED Viewed

@@ -38,9 +38,9 @@
   "decode_with_prefix_space": false,
   "eos_token": "</s>",
   "extra_special_tokens": {},
-  "model_max_length": 32768,
   "pad_token": "</s>",
   "sp_model_kwargs": null,
   "tokenizer_class": "InternLM2Tokenizer",
   "unk_token": "<unk>"
-}

   "decode_with_prefix_space": false,
   "eos_token": "</s>",
   "extra_special_tokens": {},
+  "model_max_length": 1000000000000000019884624838656,
   "pad_token": "</s>",
   "sp_model_kwargs": null,
   "tokenizer_class": "InternLM2Tokenizer",
   "unk_token": "<unk>"
+}

{internlm2-7b-cpu-int4 → internlm2-7b-cpu-int4-awq}/genai_config.json RENAMED Viewed

@@ -27,7 +27,7 @@
         },
         "eos_token_id": 2,
         "pad_token_id": 2,
-        "type": "internlm2",
         "vocab_size": 92544
     },
     "search": {

         },
         "eos_token_id": 2,
         "pad_token_id": 2,
+        "type": "llama",
         "vocab_size": 92544
     },
     "search": {

{internlm2-1.8b-cpu-int4 → internlm2-7b-cpu-int4-awq}/model.onnx RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2659c5468b3da32b1cd56910e1b3fca6ba2de0a04229fc3efd531a32d3abaea3
-size 180164

 version https://git-lfs.github.com/spec/v1
+oid sha256:862b2f22bc845237107303a06832042c9d4641fab30a740b7ef6dfed99b146c8
+size 239348

{internlm2-7b-cpu-int4 → internlm2-7b-cpu-int4-awq}/model.onnx.data RENAMED Viewed

File without changes

{internlm2-7b-cpu-int4 → internlm2-7b-cpu-int4-awq}/special_tokens_map.json RENAMED Viewed

File without changes

{internlm2-7b-cpu-int4 → internlm2-7b-cpu-int4-awq}/tokenization_internlm2.py RENAMED Viewed

File without changes

{internlm2-7b-cpu-int4 → internlm2-7b-cpu-int4-awq}/tokenization_internlm2_fast.py RENAMED Viewed

File without changes

{internlm2-7b-cpu-int4 → internlm2-7b-cpu-int4-awq}/tokenizer.json RENAMED Viewed

File without changes

{internlm2-7b-cpu-int4 → internlm2-7b-cpu-int4-awq}/tokenizer.model RENAMED Viewed

File without changes

{internlm2-1.8b-cpu-int4 → internlm2-7b-cpu-int4-awq}/tokenizer_config.json RENAMED Viewed

@@ -27,20 +27,14 @@
       "special": true
     }
   },
-  "auto_map": {
-    "AutoTokenizer": [
-      "tokenization_internlm2.InternLM2Tokenizer",
-      "tokenization_internlm2_fast.InternLM2TokenizerFast"
-    ]
-  },
   "bos_token": "<s>",
   "clean_up_tokenization_spaces": false,
   "decode_with_prefix_space": false,
   "eos_token": "</s>",
   "extra_special_tokens": {},
-  "model_max_length": 32768,
   "pad_token": "</s>",
   "sp_model_kwargs": null,
-  "tokenizer_class": "InternLM2Tokenizer",
   "unk_token": "<unk>"
-}

       "special": true
     }
   },
   "bos_token": "<s>",
   "clean_up_tokenization_spaces": false,
   "decode_with_prefix_space": false,
   "eos_token": "</s>",
   "extra_special_tokens": {},
+  "model_max_length": 1000000000000000019884624838656,
   "pad_token": "</s>",
   "sp_model_kwargs": null,
+  "tokenizer_class": "LlamaTokenizer",
   "unk_token": "<unk>"
+}