Upload LlamaForCausalLM

Files changed (4) hide show

config.json CHANGED Viewed

@@ -22,5 +22,5 @@
   "torch_dtype": "float16",
   "transformers_version": "4.34.0.dev0",
   "use_cache": true,
-  "vocab_size": 32016
 }

   "torch_dtype": "float16",
   "transformers_version": "4.34.0.dev0",
   "use_cache": true,
+  "vocab_size": 42414
 }

pytorch_model-00001-of-00002.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d0f36d62f1ba2fa5891ec8801c97e94d39ecfa4a0264a3e7c7b246426c0d18fd
-size 9976754202

 version https://git-lfs.github.com/spec/v1
+oid sha256:a206bc33ad9407f02e9819a4ecc2f6cb2f5d597317e96f31352ffdfb5f638933
+size 9971739657

pytorch_model-00002-of-00002.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31563012efe341673ff59ad934c7cfac37d98760b511e13be704afc855eb7172
-size 3500442883

 version https://git-lfs.github.com/spec/v1
+oid sha256:8922244af2d785fea6c862d5364b863bb5939907bd106e5284b0042cb7bc09b0
+size 3675818233

pytorch_model.bin.index.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "metadata": {
-    "total_size": 13477093376
   },
   "weight_map": {
     "lm_head.weight": "pytorch_model-00002-of-00002.bin",
@@ -149,11 +149,11 @@
     "model.layers.22.self_attn.o_proj.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.22.self_attn.q_proj.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.22.self_attn.v_proj.weight": "pytorch_model-00001-of-00002.bin",
-    "model.layers.23.input_layernorm.weight": "pytorch_model-00001-of-00002.bin",
-    "model.layers.23.mlp.down_proj.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.23.mlp.gate_proj.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.23.mlp.up_proj.weight": "pytorch_model-00001-of-00002.bin",
-    "model.layers.23.post_attention_layernorm.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.23.self_attn.k_proj.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.23.self_attn.o_proj.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.23.self_attn.q_proj.weight": "pytorch_model-00001-of-00002.bin",

 {
   "metadata": {
+    "total_size": 13647454208
   },
   "weight_map": {
     "lm_head.weight": "pytorch_model-00002-of-00002.bin",
     "model.layers.22.self_attn.o_proj.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.22.self_attn.q_proj.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.22.self_attn.v_proj.weight": "pytorch_model-00001-of-00002.bin",
+    "model.layers.23.input_layernorm.weight": "pytorch_model-00002-of-00002.bin",
+    "model.layers.23.mlp.down_proj.weight": "pytorch_model-00002-of-00002.bin",
     "model.layers.23.mlp.gate_proj.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.23.mlp.up_proj.weight": "pytorch_model-00001-of-00002.bin",
+    "model.layers.23.post_attention_layernorm.weight": "pytorch_model-00002-of-00002.bin",
     "model.layers.23.self_attn.k_proj.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.23.self_attn.o_proj.weight": "pytorch_model-00001-of-00002.bin",
     "model.layers.23.self_attn.q_proj.weight": "pytorch_model-00001-of-00002.bin",