EC2 Default User
committed on
Commit
·
e35a331
1
Parent(s):
82520b5
update model
Browse files
- 4step/{added_tokens.json → epoch1/added_tokens.json} +0 -0
- 4step/{config.json → epoch1/config.json} +0 -0
- 4step/{generation_config.json → epoch1/generation_config.json} +0 -0
- 4step/{merges.txt → epoch1/merges.txt} +0 -0
- 4step/{model-00001-of-00004.safetensors → epoch1/model-00001-of-00004.safetensors} +0 -0
- 4step/{model-00002-of-00004.safetensors → epoch1/model-00002-of-00004.safetensors} +0 -0
- 4step/{model-00003-of-00004.safetensors → epoch1/model-00003-of-00004.safetensors} +0 -0
- 4step/{model-00004-of-00004.safetensors → epoch1/model-00004-of-00004.safetensors} +0 -0
- 4step/{model.safetensors.index.json → epoch1/model.safetensors.index.json} +0 -0
- 4step/{special_tokens_map.json → epoch1/special_tokens_map.json} +0 -0
- 4step/{tokenizer.json → epoch1/tokenizer.json} +0 -0
- 4step/{tokenizer_config.json → epoch1/tokenizer_config.json} +0 -0
- 4step/{vocab.json → epoch1/vocab.json} +0 -0
- 4step/epoch2/added_tokens.json +3 -0
- 4step/epoch2/config.json +3 -0
- 4step/epoch2/generation_config.json +3 -0
- 4step/epoch2/merges.txt +0 -0
- 4step/epoch2/model-00001-of-00004.safetensors +3 -0
- 4step/epoch2/model-00002-of-00004.safetensors +3 -0
- 4step/epoch2/model-00003-of-00004.safetensors +3 -0
- 4step/epoch2/model-00004-of-00004.safetensors +3 -0
- 4step/epoch2/model.safetensors.index.json +3 -0
- 4step/epoch2/special_tokens_map.json +3 -0
- 4step/epoch2/tokenizer.json +3 -0
- 4step/epoch2/tokenizer_config.json +3 -0
- 4step/epoch2/vocab.json +3 -0
- 4step/epoch3/added_tokens.json +3 -0
- 4step/epoch3/cfg.yaml +32 -0
- 4step/epoch3/config.json +3 -0
- 4step/epoch3/generation_config.json +3 -0
- 4step/epoch3/log.txt +0 -0
- 4step/epoch3/merges.txt +0 -0
- 4step/epoch3/model-00001-of-00004.safetensors +3 -0
- 4step/epoch3/model-00002-of-00004.safetensors +3 -0
- 4step/epoch3/model-00003-of-00004.safetensors +3 -0
- 4step/epoch3/model-00004-of-00004.safetensors +3 -0
- 4step/epoch3/model.safetensors.index.json +3 -0
- 4step/epoch3/special_tokens_map.json +3 -0
- 4step/epoch3/tokenizer.json +3 -0
- 4step/epoch3/tokenizer_config.json +3 -0
- 4step/epoch3/vocab.json +3 -0
4step/{added_tokens.json → epoch1/added_tokens.json}
RENAMED
|
File without changes
|
4step/{config.json → epoch1/config.json}
RENAMED
|
File without changes
|
4step/{generation_config.json → epoch1/generation_config.json}
RENAMED
|
File without changes
|
4step/{merges.txt → epoch1/merges.txt}
RENAMED
|
File without changes
|
4step/{model-00001-of-00004.safetensors → epoch1/model-00001-of-00004.safetensors}
RENAMED
|
File without changes
|
4step/{model-00002-of-00004.safetensors → epoch1/model-00002-of-00004.safetensors}
RENAMED
|
File without changes
|
4step/{model-00003-of-00004.safetensors → epoch1/model-00003-of-00004.safetensors}
RENAMED
|
File without changes
|
4step/{model-00004-of-00004.safetensors → epoch1/model-00004-of-00004.safetensors}
RENAMED
|
File without changes
|
4step/{model.safetensors.index.json → epoch1/model.safetensors.index.json}
RENAMED
|
File without changes
|
4step/{special_tokens_map.json → epoch1/special_tokens_map.json}
RENAMED
|
File without changes
|
4step/{tokenizer.json → epoch1/tokenizer.json}
RENAMED
|
File without changes
|
4step/{tokenizer_config.json → epoch1/tokenizer_config.json}
RENAMED
|
File without changes
|
4step/{vocab.json → epoch1/vocab.json}
RENAMED
|
File without changes
|
4step/epoch2/added_tokens.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d78c8be18a2b65adade583f4f8354edb141ae6a0d0fe6589bad9a9ac1eda11b
|
| 3 |
+
size 691
|
4step/epoch2/config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5101c3e74437558e0f0bb91d8624187915c61d026c754b201e0b0c3fb613bdc8
|
| 3 |
+
size 739
|
4step/epoch2/generation_config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c5df43ff9c1194f0e3a5d81c3f1356d9745b7a7592d281bbc416c6c0ba92922
|
| 3 |
+
size 248
|
4step/epoch2/merges.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
4step/epoch2/model-00001-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8182a130f6be989b87a55b86e51121d3e21df6681b2d81c608016736cc152f92
|
| 3 |
+
size 4874829416
|
4step/epoch2/model-00002-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:405a82169044445ce2245d0500fbac31d10d787cadf6136f117cb54ad9cabc34
|
| 3 |
+
size 4932751008
|
4step/epoch2/model-00003-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25498b42de6d7a8b4e4ebf7d72c2d1f4294858f25d146125835b3bb5ec158af1
|
| 3 |
+
size 4330865200
|
4step/epoch2/model-00004-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0fe7dafb94c0d5375cb3811e9a0e19d875777ff0069930b0362ef16b978867b
|
| 3 |
+
size 1087163520
|
4step/epoch2/model.safetensors.index.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d677d897cad6756ca7fb81985640e8610d22a20f9cd4fe706ed14e76869f1cce
|
| 3 |
+
size 27752
|
4step/epoch2/special_tokens_map.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cac6b1eaf1d425b4ab1087ef648d766ebc8f5b410ad28a783130cc6ad6141a06
|
| 3 |
+
size 895
|
4step/epoch2/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06797a9ae432d4cb6427bd384738a4547b000198d5ddce86f3e721007d34cff0
|
| 3 |
+
size 11422634
|
4step/epoch2/tokenizer_config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:990b97d80492f771fd974bd3afb0936a43334b69f81ed2b8a364e04a49360a11
|
| 3 |
+
size 7812
|
4step/epoch2/vocab.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910
|
| 3 |
+
size 2776833
|
4step/epoch3/added_tokens.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d78c8be18a2b65adade583f4f8354edb141ae6a0d0fe6589bad9a9ac1eda11b
|
| 3 |
+
size 691
|
4step/epoch3/cfg.yaml
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model_id: Qwen/Qwen2.5-7B-Instruct
|
| 2 |
+
model_family: qwen2.5
|
| 3 |
+
LoRA:
|
| 4 |
+
r: 0
|
| 5 |
+
alpha: 128
|
| 6 |
+
dropout: 0.05
|
| 7 |
+
used_policy: true
|
| 8 |
+
used_strategy: true
|
| 9 |
+
step_token: <step>,</step>
|
| 10 |
+
answer_token: <answer>,</answer>
|
| 11 |
+
loss_type: grad_ascent
|
| 12 |
+
tune_vision_tower: false
|
| 13 |
+
tune_mm_projector: true
|
| 14 |
+
tune_language_model: true
|
| 15 |
+
data_path: ./dataset/safety_reasoning_v2_4step.json
|
| 16 |
+
split: with_strategy_policy_4step
|
| 17 |
+
batch_size: 2
|
| 18 |
+
gradient_accumulation_steps: 8
|
| 19 |
+
max_grad_norm: 1.0
|
| 20 |
+
num_epochs: 3
|
| 21 |
+
max_length: 3072
|
| 22 |
+
save_dir: models/final_ft_${num_epochs}_epochs_lr${lr}_${model_family}_${split}
|
| 23 |
+
save_steps: 165
|
| 24 |
+
lr: 1.0e-05
|
| 25 |
+
weight_decay: 0.01
|
| 26 |
+
seed: 233
|
| 27 |
+
workers: 4
|
| 28 |
+
lr_scheduler_type: cosine
|
| 29 |
+
warmup_ratio: 0.0
|
| 30 |
+
max_train_steps: -1
|
| 31 |
+
report_to: wandb
|
| 32 |
+
resume_from_checkpoint: ''
|
4step/epoch3/config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5101c3e74437558e0f0bb91d8624187915c61d026c754b201e0b0c3fb613bdc8
|
| 3 |
+
size 739
|
4step/epoch3/generation_config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c5df43ff9c1194f0e3a5d81c3f1356d9745b7a7592d281bbc416c6c0ba92922
|
| 3 |
+
size 248
|
4step/epoch3/log.txt
ADDED
|
File without changes
|
4step/epoch3/merges.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
4step/epoch3/model-00001-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03112b2fce70b792ee41288aea2ca5b5fb9a48e40e247db4934e83232051bc4b
|
| 3 |
+
size 4874829416
|
4step/epoch3/model-00002-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8aa2cccfe6e56fb44b4d813242a9f3c7aad90acf49cd1c36b9d06102f38e1929
|
| 3 |
+
size 4932751008
|
4step/epoch3/model-00003-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:732d6152aa25d0befa852d76688d597a899164b2090a41549a39e4f28bda0223
|
| 3 |
+
size 4330865200
|
4step/epoch3/model-00004-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac7225d25be346c600f636172bb8ba64a07dff62ba6f088e5005a795f3978c44
|
| 3 |
+
size 1087163520
|
4step/epoch3/model.safetensors.index.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d677d897cad6756ca7fb81985640e8610d22a20f9cd4fe706ed14e76869f1cce
|
| 3 |
+
size 27752
|
4step/epoch3/special_tokens_map.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cac6b1eaf1d425b4ab1087ef648d766ebc8f5b410ad28a783130cc6ad6141a06
|
| 3 |
+
size 895
|
4step/epoch3/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06797a9ae432d4cb6427bd384738a4547b000198d5ddce86f3e721007d34cff0
|
| 3 |
+
size 11422634
|
4step/epoch3/tokenizer_config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:990b97d80492f771fd974bd3afb0936a43334b69f81ed2b8a364e04a49360a11
|
| 3 |
+
size 7812
|
4step/epoch3/vocab.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910
|
| 3 |
+
size 2776833
|