Training in progress, epoch 1
Browse files- README.md +2 -2
- adapter_config.json +3 -3
- adapter_model.safetensors +1 -1
- runs/Sep05_02-11-22_4a02d2f90a3e/events.out.tfevents.1757038294.4a02d2f90a3e.977.0 +3 -0
- runs/Sep05_02-13-45_4a02d2f90a3e/events.out.tfevents.1757038436.4a02d2f90a3e.2157.0 +3 -0
- runs/Sep05_02-16-00_4a02d2f90a3e/events.out.tfevents.1757038582.4a02d2f90a3e.2731.0 +3 -0
- training_args.bin +1 -1
README.md
CHANGED
|
@@ -35,10 +35,10 @@ This model was trained with SFT.
|
|
| 35 |
### Framework versions
|
| 36 |
|
| 37 |
- TRL: 0.21.0
|
| 38 |
-
- Transformers: 4.
|
| 39 |
- Pytorch: 2.8.0+cu126
|
| 40 |
- Datasets: 4.0.0
|
| 41 |
-
- Tokenizers: 0.
|
| 42 |
|
| 43 |
## Citations
|
| 44 |
|
|
|
|
| 35 |
### Framework versions
|
| 36 |
|
| 37 |
- TRL: 0.21.0
|
| 38 |
+
- Transformers: 4.56.0
|
| 39 |
- Pytorch: 2.8.0+cu126
|
| 40 |
- Datasets: 4.0.0
|
| 41 |
+
- Tokenizers: 0.22.0
|
| 42 |
|
| 43 |
## Citations
|
| 44 |
|
adapter_config.json
CHANGED
|
@@ -26,13 +26,13 @@
|
|
| 26 |
"rank_pattern": {},
|
| 27 |
"revision": null,
|
| 28 |
"target_modules": [
|
|
|
|
| 29 |
"o_proj",
|
| 30 |
"q_proj",
|
|
|
|
| 31 |
"down_proj",
|
| 32 |
-
"up_proj",
|
| 33 |
"k_proj",
|
| 34 |
-
"
|
| 35 |
-
"gate_proj"
|
| 36 |
],
|
| 37 |
"task_type": "CAUSAL_LM",
|
| 38 |
"use_dora": false,
|
|
|
|
| 26 |
"rank_pattern": {},
|
| 27 |
"revision": null,
|
| 28 |
"target_modules": [
|
| 29 |
+
"v_proj",
|
| 30 |
"o_proj",
|
| 31 |
"q_proj",
|
| 32 |
+
"gate_proj",
|
| 33 |
"down_proj",
|
|
|
|
| 34 |
"k_proj",
|
| 35 |
+
"up_proj"
|
|
|
|
| 36 |
],
|
| 37 |
"task_type": "CAUSAL_LM",
|
| 38 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2468152240
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb40ae3befec2e9207fc57f0b5e5a0e46290b18ea53c1aa75548a34e3398116c
|
| 3 |
size 2468152240
|
runs/Sep05_02-11-22_4a02d2f90a3e/events.out.tfevents.1757038294.4a02d2f90a3e.977.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6967c62b76a9c19a45347fd7290020182255caad2508ee4e590eb4bf11c91588
|
| 3 |
+
size 16472
|
runs/Sep05_02-13-45_4a02d2f90a3e/events.out.tfevents.1757038436.4a02d2f90a3e.2157.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:64627e39f7fe41fb7ab668c3c5ca1c0a55a1765d488ce4e59e3aa51084faaab0
|
| 3 |
+
size 7525
|
runs/Sep05_02-16-00_4a02d2f90a3e/events.out.tfevents.1757038582.4a02d2f90a3e.2731.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06b1b58555f2ffacdb7678e723867d9e0448231263a5e0b9100c4a8e24ef60a0
|
| 3 |
+
size 7538
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 6225
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f6f2f9d36b07018159c9dcf1b4c02b6bfa3197507ec278ee261a8e7fbbf748ec
|
| 3 |
size 6225
|