Upload LlamaForCausalLM

Files changed (10) hide show

config.json CHANGED Viewed

@@ -1,12 +1,16 @@
 {
-  "_name_or_path": "unsloth/Meta-Llama-3.1-8B-bnb-4bit",
   "architectures": [
     "LlamaForCausalLM"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
   "bos_token_id": 128000,
-  "eos_token_id": 128001,
   "hidden_act": "silu",
   "hidden_size": 4096,
   "initializer_range": 0.02,
@@ -17,23 +21,7 @@
   "num_attention_heads": 32,
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,
-  "pad_token_id": 128004,
   "pretraining_tp": 1,
-  "quantization_config": {
-    "_load_in_4bit": true,
-    "_load_in_8bit": false,
-    "bnb_4bit_compute_dtype": "bfloat16",
-    "bnb_4bit_quant_storage": "uint8",
-    "bnb_4bit_quant_type": "nf4",
-    "bnb_4bit_use_double_quant": true,
-    "llm_int8_enable_fp32_cpu_offload": false,
-    "llm_int8_has_fp16_weight": false,
-    "llm_int8_skip_modules": null,
-    "llm_int8_threshold": 6.0,
-    "load_in_4bit": true,
-    "load_in_8bit": false,
-    "quant_method": "bitsandbytes"
-  },
   "rms_norm_eps": 1e-05,
   "rope_scaling": {
     "factor": 8.0,
@@ -44,9 +32,8 @@
   },
   "rope_theta": 500000.0,
   "tie_word_embeddings": false,
-  "torch_dtype": "float16",
   "transformers_version": "4.44.0",
-  "unsloth_version": "2024.8",
   "use_cache": true,
   "vocab_size": 128256
 }

 {
+  "_name_or_path": "meta-llama/Meta-Llama-3.1-8B-Instruct",
   "architectures": [
     "LlamaForCausalLM"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
   "bos_token_id": 128000,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009
+  ],
   "hidden_act": "silu",
   "hidden_size": 4096,
   "initializer_range": 0.02,
   "num_attention_heads": 32,
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-05,
   "rope_scaling": {
     "factor": 8.0,
   },
   "rope_theta": 500000.0,
   "tie_word_embeddings": false,
+  "torch_dtype": "float32",
   "transformers_version": "4.44.0",
   "use_cache": true,
   "vocab_size": 128256
 }

generation_config.json CHANGED Viewed

@@ -1,10 +1,11 @@
 {
-  "_from_model_config": true,
   "bos_token_id": 128000,
   "do_sample": true,
-  "eos_token_id": 128001,
-  "max_length": 131072,
-  "pad_token_id": 128004,
   "temperature": 0.6,
   "top_p": 0.9,
   "transformers_version": "4.44.0"

 {
   "bos_token_id": 128000,
   "do_sample": true,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009
+  ],
   "temperature": 0.6,
   "top_p": 0.9,
   "transformers_version": "4.44.0"

model-00001-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:85de022225908eebafe3533958236e330ccc97f3735a69051bf115e98f0f71b1
 size 4886466168

 version https://git-lfs.github.com/spec/v1
+oid sha256:d14cc5f2a03a721e186beb267fff867da0ed2cf8a60d498e4ee2cd618d1adfdf
 size 4886466168

model-00002-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:483bdfd75328c6016993acc4694ef5ca2f6029c8576d2e4f72d5018d0bcf1162
 size 4832007448

 version https://git-lfs.github.com/spec/v1
+oid sha256:1ca31d2466b53fce44243bd1fb61db6b20607c13c65e3dcd4df388d65f379e46
 size 4832007448

model-00003-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f0dd25ad96c0ed4fa1f7be62e89842d74b3cee101d6623883e38131b968f8a50
 size 4999813112

 version https://git-lfs.github.com/spec/v1
+oid sha256:86611f1f29bc67abfe500b522864396fba696c1b9273dde9033db3c181f36c2a
 size 4999813112

model-00004-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2db579a08620445091b88f359e586d69811cd35f85d67a5c3c40977ae87be505
 size 4999813128

 version https://git-lfs.github.com/spec/v1
+oid sha256:e0bc28b473b551116c26efcda66e8b9d0f185e822e3db676d8838933e0a1aee6
 size 4999813128

model-00005-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9133b7d4636287b879826a25c59a820a7c632fd0c232faedacf27e982cec9bcc
 size 4832007496

 version https://git-lfs.github.com/spec/v1
+oid sha256:cfa3c0cbd972e657a25bd36f73001e71a6c340362c7f00ee408eaf542cc12692
 size 4832007496

model-00006-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1785d03a4be712e6d45b198cc51ddfdfeab9aacda5f4497afc975c86c3874126
 size 4999813120

 version https://git-lfs.github.com/spec/v1
+oid sha256:e43ce2f34685956c120bb869d344a620fb7329100e45bc862baac8864b7f656f
 size 4999813120

model-00007-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2aed5abe69104c5784d3d53e0afe545b478acf8729dfbffe07dabe62ce2aae16
 size 2571158184

 version https://git-lfs.github.com/spec/v1
+oid sha256:4cc38bf86f7fbb6d3c107ce84ebdadb4d5fc118a875767d4bdd48960f7555d73
 size 2571158184

model.safetensors.index.json CHANGED Viewed

The diff for this file is too large to render. See raw diff