TinyPixel committed on Sep 26, 2023

Commit

2511eb9

1 Parent(s): a3a34fe

Upload LlamaForCausalLM

Files changed (17) hide show

config.json CHANGED Viewed

@@ -1,32 +1,27 @@
 {
-  "_name_or_path": "TinyPixel/CodeLlama-7B-bf16-sharded",
   "architectures": [
     "LlamaForCausalLM"
   ],
-  "auto_map": {
-    "AutoConfig": "TheBloke/CodeLlama-7B-fp16--configuration_llama.LlamaConfig",
-    "AutoModel": "TheBloke/CodeLlama-7B-fp16--modeling_llama.LlamaModel",
-    "AutoModelForCausalLM": "TheBloke/CodeLlama-7B-fp16--modeling_llama.LlamaForCausalLM",
-    "AutoModelForSequenceClassification": "TheBloke/CodeLlama-7B-fp16--modeling_llama.LlamaForSequenceClassification"
-  },
   "bos_token_id": 1,
   "eos_token_id": 2,
   "hidden_act": "silu",
   "hidden_size": 4096,
   "initializer_range": 0.02,
   "intermediate_size": 11008,
-  "max_position_embeddings": 16384,
   "model_type": "llama",
   "num_attention_heads": 32,
   "num_hidden_layers": 32,
   "num_key_value_heads": 32,
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-05,
   "rope_scaling": null,
-  "rope_theta": 1000000,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.34.0.dev0",
   "use_cache": true,
-  "vocab_size": 32016
 }

 {
+  "_name_or_path": "TinyPixel/Llama-2-7B-bf16-sharded",
   "architectures": [
     "LlamaForCausalLM"
   ],
   "bos_token_id": 1,
   "eos_token_id": 2,
   "hidden_act": "silu",
   "hidden_size": 4096,
   "initializer_range": 0.02,
   "intermediate_size": 11008,
+  "max_position_embeddings": 2048,
   "model_type": "llama",
   "num_attention_heads": 32,
   "num_hidden_layers": 32,
   "num_key_value_heads": 32,
+  "pad_token_id": 0,
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-05,
   "rope_scaling": null,
+  "rope_theta": 10000.0,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.34.0.dev0",
   "use_cache": true,
+  "vocab_size": 32000
 }

generation_config.json CHANGED Viewed

@@ -2,5 +2,6 @@
   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
   "transformers_version": "4.34.0.dev0"
 }

   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
+  "pad_token_id": 0,
   "transformers_version": "4.34.0.dev0"
 }

pytorch_model-00001-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:042783ee2c07e45120eedb42f96be030d1cd084835dd968de441b9b2c87cbbbf
-size 981620399

 version https://git-lfs.github.com/spec/v1
+oid sha256:13dca03043e2204329753053c8d85e9bc232d340c4a80566a76b193ca260e846
+size 981489327

pytorch_model-00002-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dd05dd202623c79d171398d0fccb78bb0d70ae926c1183e805d8549ab0421654
 size 966844269

 version https://git-lfs.github.com/spec/v1
+oid sha256:26e4072c445f0d7bcdb66eeae88ae74e8550a18c7f040873781e27a288bd4d0e
 size 966844269

pytorch_model-00003-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b22be5dff46a9e9afca04efbabef54d92268fbca1eb6fee95ebfe3fde6cc0994
 size 966827273

 version https://git-lfs.github.com/spec/v1
+oid sha256:ebc453a7bde53abb560d627117f11e3bd933acd79f9bd87986e3c53285ae136f
 size 966827273

pytorch_model-00004-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8fbfd0a91ff7b6ab3ac6fcbd6bb8c1a53e69c9a1762f20b8d8c0be92bcab0e9a
 size 989912603

 version https://git-lfs.github.com/spec/v1
+oid sha256:65a78480f23fbacf5607dbf303ed3c52af899a0d4d47f12e1dc362e7bed35036
 size 989912603

pytorch_model-00005-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e48675ec64c70e7fadb2304e1688baa0730e9eba45cde080ef0cc6bb0ca6c5cf
 size 943758939

 version https://git-lfs.github.com/spec/v1
+oid sha256:d485f1350eb0b87b5aff649625d095d7e9e8bc584f851eb7889ecf1f9bfd8ac4
 size 943758939

pytorch_model-00006-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a12f2215484496ce13aa5daeb7b43c8215be61230cf4e40b03301f475b0aa819
 size 989895607

 version https://git-lfs.github.com/spec/v1
+oid sha256:ee0078a1b12120eb0c95c44792dfbbbbab333bcc78b2de0382ce9488b49e1aee
 size 989895607

pytorch_model-00007-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dddb6e1f0fcb6c73f4c3a4afe6d7d4e6873b9bf8adb1ca0b8c2fbe6fc1418dea
 size 966844269

 version https://git-lfs.github.com/spec/v1
+oid sha256:ec72061d9c7a3a9063e45bbe6115841f1fa596638443d7e6edab9a6d82019fcf
 size 966844269

pytorch_model-00008-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0fff0cf9a21f088a6a4b91f2252c8b5a9ae0192f5a43bc52f2c16a8eb58614d0
 size 966827273

 version https://git-lfs.github.com/spec/v1
+oid sha256:0f8a31054f3a98f36bae88dcc15b8b65ec95987e9a5da6d98d8dc2497d61a945
 size 966827273

pytorch_model-00009-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:952992a568c53e9312fcfc269d1402e7a5858c96ed4c2d109ae5906d2fc1b631
 size 989912667

 version https://git-lfs.github.com/spec/v1
+oid sha256:93e5a0f05b1797b76d61edc3ad7b133603b56a2be647b2267cafbfde69e8022c
 size 989912667

pytorch_model-00010-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f208e8b750cc66b20f9bf2c2f254c192d1e114673fdb256a56b31afbc3bc6a7
 size 943758939

 version https://git-lfs.github.com/spec/v1
+oid sha256:c74df24f96e90ee7faa3783bba447c98cc8a2a3b1ff5289b94879274e4e17c1b
 size 943758939

pytorch_model-00011-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b8ed814aaa3d212c2455da73827edf6c8862caa2cf8a388abbdd2a79220232be
 size 989895607

 version https://git-lfs.github.com/spec/v1
+oid sha256:baa7bb3d343c41be9f630e936b1da919c77681251bd2ec44f25febe8fad333d5
 size 989895607

pytorch_model-00012-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:859a16927e9b301f6635f948e723d1f4df0733b6859d9b92e52aa90e77fc96d8
 size 966844269

 version https://git-lfs.github.com/spec/v1
+oid sha256:bb3f88238a2405549949fc58f5bffc9f9af524d8dcf7d848b459769384b0a8dd
 size 966844269

pytorch_model-00013-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:11a04c052f1cca3dcbd3aec93646a6b43b8335d59ca08ca5280fa223335d572b
 size 966827273

 version https://git-lfs.github.com/spec/v1
+oid sha256:beed225f18d508e6807fffe35dca5bc85fab88fdb18ec094040b0ed6b73125a3
 size 966827273

pytorch_model-00014-of-00014.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b22baafa8b6507ee3ee359229362ab44bbf59d22b182eebc098561b016fb7f3b
-size 847426845

 version https://git-lfs.github.com/spec/v1
+oid sha256:b7fccbb47e99f74efbc81bcde41ae8d8442066bb6416278bce9dcd22a2854549
+size 847295773

pytorch_model.bin.index.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "metadata": {
-    "total_size": 13477093376
   },
   "weight_map": {
     "lm_head.weight": "pytorch_model-00014-of-00014.bin",

 {
   "metadata": {
+    "total_size": 13476831232
   },
   "weight_map": {
     "lm_head.weight": "pytorch_model-00014-of-00014.bin",