sabbbbir committed on
Commit
51157f2
·
verified ·
1 Parent(s): 936ec58

Auto-push: step 10

Browse files
README.md CHANGED
@@ -3,8 +3,8 @@ library_name: transformers
3
  model_name: ckpt
4
  tags:
5
  - generated_from_trainer
6
- - trl
7
  - sft
 
8
  licence: license
9
  ---
10
 
 
3
  model_name: ckpt
4
  tags:
5
  - generated_from_trainer
 
6
  - sft
7
+ - trl
8
  licence: license
9
  ---
10
 
checkpoint-5/README.md CHANGED
@@ -1,9 +1,9 @@
1
  ---
2
- base_model: /root/.cache/huggingface/hub/models--sabbbbir--qwen-models/snapshots/c033e06a30d9a2afd45137e926cb77015c470e25/checkpoints/qwen3_6_27b
3
  library_name: peft
4
  pipeline_tag: text-generation
5
  tags:
6
- - base_model:adapter:/root/.cache/huggingface/hub/models--sabbbbir--qwen-models/snapshots/c033e06a30d9a2afd45137e926cb77015c470e25/checkpoints/qwen3_6_27b
7
  - lora
8
  - sft
9
  - transformers
 
1
  ---
2
+ base_model: /root/.cache/huggingface/hub/models--sabbbbir--qwen-models/snapshots/936ec5831cd1882184f34c45189997d741c42657/checkpoints/qwen3_6_27b
3
  library_name: peft
4
  pipeline_tag: text-generation
5
  tags:
6
+ - base_model:adapter:/root/.cache/huggingface/hub/models--sabbbbir--qwen-models/snapshots/936ec5831cd1882184f34c45189997d741c42657/checkpoints/qwen3_6_27b
7
  - lora
8
  - sft
9
  - transformers
checkpoint-5/adapter_config.json CHANGED
@@ -3,7 +3,7 @@
3
  "alpha_pattern": {},
4
  "arrow_config": null,
5
  "auto_mapping": null,
6
- "base_model_name_or_path": "/root/.cache/huggingface/hub/models--sabbbbir--qwen-models/snapshots/c033e06a30d9a2afd45137e926cb77015c470e25/checkpoints/qwen3_6_27b",
7
  "bias": "none",
8
  "corda_config": null,
9
  "ensure_weight_tying": false,
@@ -30,12 +30,12 @@
30
  "revision": null,
31
  "target_modules": [
32
  "k_proj",
33
- "o_proj",
34
  "q_proj",
35
  "v_proj",
36
- "down_proj",
37
- "up_proj",
38
- "gate_proj"
39
  ],
40
  "target_parameters": null,
41
  "task_type": "CAUSAL_LM",
 
3
  "alpha_pattern": {},
4
  "arrow_config": null,
5
  "auto_mapping": null,
6
+ "base_model_name_or_path": "/root/.cache/huggingface/hub/models--sabbbbir--qwen-models/snapshots/936ec5831cd1882184f34c45189997d741c42657/checkpoints/qwen3_6_27b",
7
  "bias": "none",
8
  "corda_config": null,
9
  "ensure_weight_tying": false,
 
30
  "revision": null,
31
  "target_modules": [
32
  "k_proj",
33
+ "up_proj",
34
  "q_proj",
35
  "v_proj",
36
+ "gate_proj",
37
+ "o_proj",
38
+ "down_proj"
39
  ],
40
  "target_parameters": null,
41
  "task_type": "CAUSAL_LM",
checkpoint-5/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1be4301920225e6f992d3c015ce91938db711d44d0319ca26df04a79d49ff6fc
3
  size 79759520
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17d5d9a33d06ed70307a4bfb4c9671ee18b026e8fd4eeb4a2dff0dcc1eed91fd
3
  size 79759520
checkpoint-5/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8844756f56ee07e66e536d65757b2fab3d661a8b051f9d4f80f7122d995f21e
3
  size 81547303
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:172f44adbf9ed597fe62009c000161823bada70ee2cb4307ed08a63094c49aa6
3
  size 81547303
checkpoint-5/trainer_state.json CHANGED
@@ -11,9 +11,9 @@
11
  "log_history": [
12
  {
13
  "epoch": 0.02661343978709248,
14
- "grad_norm": 120.0,
15
  "learning_rate": 5e-05,
16
- "loss": 58.57597045898437,
17
  "step": 5
18
  }
19
  ],
 
11
  "log_history": [
12
  {
13
  "epoch": 0.02661343978709248,
14
+ "grad_norm": 117.0,
15
  "learning_rate": 5e-05,
16
+ "loss": 58.58668212890625,
17
  "step": 5
18
  }
19
  ],