minpeter committed on
Commit
b22692a
·
verified ·
1 Parent(s): 1cba57e

Training in progress, step 157

Browse files
Files changed (3) hide show
  1. config.json +1 -2
  2. model.safetensors +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_flash_attn_2_enabled": true,
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
@@ -24,7 +23,7 @@
24
  "rope_scaling": null,
25
  "rope_theta": 10000.0,
26
  "tie_word_embeddings": true,
27
- "torch_dtype": "float32",
28
  "transformers_version": "4.52.4",
29
  "use_cache": true,
30
  "vocab_size": 32018
 
1
  {
 
2
  "architectures": [
3
  "LlamaForCausalLM"
4
  ],
 
23
  "rope_scaling": null,
24
  "rope_theta": 10000.0,
25
  "tie_word_embeddings": true,
26
+ "torch_dtype": "bfloat16",
27
  "transformers_version": "4.52.4",
28
  "use_cache": true,
29
  "vocab_size": 32018
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9b5f21005e5dddb39867b15f39d7498996648347517c34f20c4f3de66f686a3b
3
- size 78437072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:590b2a4708bce14ae5c96b69a18f6b99fc5a29a5045dca788cdf67aaada33fcb
3
+ size 39224640
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb82c98b2b446ef4c244934e8fa2b402c4da56ecbd53e95ef252289afcd1be1c
3
  size 5777
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af5c076571bb7d9ea155891bc4a361ba9ceadcc8894ade1661dfed89779db703
3
  size 5777