Training in progress, step 157

Files changed (3) hide show

config.json CHANGED Viewed

@@ -1,4 +1,5 @@
 {
   "architectures": [
     "LlamaForCausalLM"
   ],
@@ -26,6 +27,5 @@
   "torch_dtype": "float32",
   "transformers_version": "4.52.4",
   "use_cache": true,
-  "use_flash_attention_2": true,
   "vocab_size": 32018
 }

 {
+  "_flash_attn_2_enabled": true,
   "architectures": [
     "LlamaForCausalLM"
   ],
   "torch_dtype": "float32",
   "transformers_version": "4.52.4",
   "use_cache": true,
   "vocab_size": 32018
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4af859c74e95b8b2916dd646eaa59fea4d7af8a5f84d958fd806f0a10eb3b405
 size 78437072

 version https://git-lfs.github.com/spec/v1
+oid sha256:9b5f21005e5dddb39867b15f39d7498996648347517c34f20c4f3de66f686a3b
 size 78437072

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b71c3a3068b9872c85cfc89abaff4a667cfb3946d5b420e2a8863844f34aeae8
 size 5777

 version https://git-lfs.github.com/spec/v1
+oid sha256:bb82c98b2b446ef4c244934e8fa2b402c4da56ecbd53e95ef252289afcd1be1c
 size 5777