ChrisMoe committed on
Commit
e586e6f
·
verified ·
1 Parent(s): d8ad7db

(Trained with Unsloth)

Browse files
config.json CHANGED
@@ -4,7 +4,7 @@
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
- "torch_dtype": "float16",
8
  "eos_token_id": 151645,
9
  "head_dim": 128,
10
  "hidden_act": "silu",
@@ -57,7 +57,7 @@
57
  "num_key_value_heads": 8,
58
  "pad_token_id": 151654,
59
  "quantization_config": {
60
- "bnb_4bit_compute_dtype": "float16",
61
  "bnb_4bit_quant_type": "nf4",
62
  "bnb_4bit_use_double_quant": true,
63
  "llm_int8_enable_fp32_cpu_offload": false,
 
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
+ "torch_dtype": "bfloat16",
8
  "eos_token_id": 151645,
9
  "head_dim": 128,
10
  "hidden_act": "silu",
 
57
  "num_key_value_heads": 8,
58
  "pad_token_id": 151654,
59
  "quantization_config": {
60
+ "bnb_4bit_compute_dtype": "bfloat16",
61
  "bnb_4bit_quant_type": "nf4",
62
  "bnb_4bit_use_double_quant": true,
63
  "llm_int8_enable_fp32_cpu_offload": false,
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d98c9ae6e07097bfa49fca81ca20fd4c2439c989143417e16c2a0f6cb3d77f77
3
- size 4828897876
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db9d80bfd08559eba0880ce54921f8e7cb82730a8d23695507991dd7d8587820
3
+ size 4828898032
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16c3a004b23371ef2cf248a2baf4869d3969dbcf37e792b48008d73036872855
3
  size 1244659840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20c2d6366ab85c90786ccdd829cd2b9e7d30ef3b2ebbb998280e7e4014b542ff
3
  size 1244659840
model.safetensors.index.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "metadata": {
3
  "total_parameters": 8190735360,
4
- "total_size": 6073360284
5
  },
6
  "weight_map": {
7
  "lm_head.weight": "model-00002-of-00002.safetensors",
 
1
  {
2
  "metadata": {
3
  "total_parameters": 8190735360,
4
+ "total_size": 6073360296
5
  },
6
  "weight_map": {
7
  "lm_head.weight": "model-00002-of-00002.safetensors",