varsunk committed on
Commit
581ef5a
·
verified ·
1 Parent(s): d94ee72

Training in progress, step 10

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: Qwen2.5-7B-Instruct-GRPO-test
5
  tags:
6
  - generated_from_trainer
7
- - grpo
8
  - trl
 
9
  licence: license
10
  ---
11
 
 
4
  model_name: Qwen2.5-7B-Instruct-GRPO-test
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
+ - grpo
9
  licence: license
10
  ---
11
 
adapter_config.json CHANGED
@@ -25,8 +25,8 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "v_proj",
29
- "q_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "trainable_token_indices": null,
 
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
+ "q_proj",
29
+ "v_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4dcfae68cd903244cc70730451fce118e6a511f5f27e0beec2346aa50af1ff6
3
  size 10107280
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:917933eb12ac118ed87e23112d687f031f6f8d7ff747a9ca1f9e734bbad1e5ec
3
  size 10107280
runs/Jul03_21-41-36_3cde1693ecac/events.out.tfevents.1751578936.3cde1693ecac.893.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc7f2122d7fb37065e5c2ca6de00040790706b4959f102ec8f30cc3454d4e738
3
+ size 8366
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e852e502cbb3a73a806419799c9a8ee08516cacc09a22c4849b55ccea122399c
3
  size 6456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:177c299fcdc2fde97aa979449f07f12aeae51eae4812e7ecd16210a41d1fe53b
3
  size 6456