Add files using upload-large-folder tool
Browse files- qwen25_0.5b_lora_official_5e-05/checkpoint-117744/adapter_config.json +2 -2
- qwen25_0.5b_lora_official_5e-05/checkpoint-117744/adapter_model.safetensors +1 -1
- qwen25_0.5b_lora_official_5e-05/checkpoint-117744/optimizer.pt +1 -1
- qwen25_0.5b_lora_official_5e-05/checkpoint-117744/rng_state.pth +1 -1
- qwen25_0.5b_lora_official_5e-05/checkpoint-117744/trainer_state.json +0 -0
- qwen25_0.5b_qlora_official_5e-05/adapter_config.json +4 -4
- qwen25_0.5b_qlora_official_5e-05/adapter_model.safetensors +1 -1
- qwen25_0.5b_qlora_official_5e-05/checkpoint-117744/adapter_config.json +4 -4
- qwen25_0.5b_qlora_official_5e-05/checkpoint-117744/adapter_model.safetensors +1 -1
- qwen25_0.5b_qlora_official_5e-05/checkpoint-117744/optimizer.pt +1 -1
- qwen25_0.5b_qlora_official_5e-05/checkpoint-117744/rng_state.pth +1 -1
- qwen25_0.5b_qlora_official_5e-05/checkpoint-117744/trainer_state.json +0 -0
- qwen25_0.5b_qlora_official_5e-05/checkpoint-58872/adapter_config.json +4 -4
- qwen25_0.5b_qlora_official_5e-05/checkpoint-58872/adapter_model.safetensors +1 -1
- qwen25_0.5b_qlora_official_5e-05/checkpoint-58872/optimizer.pt +1 -1
- qwen25_0.5b_qlora_official_5e-05/checkpoint-58872/rng_state.pth +1 -1
- qwen25_0.5b_qlora_official_5e-05/checkpoint-58872/trainer_state.json +0 -0
- qwen25_0.5b_qlora_official_5e-05/complete_results.json +0 -0
qwen25_0.5b_lora_official_5e-05/checkpoint-117744/adapter_config.json
CHANGED
|
@@ -26,10 +26,10 @@
|
|
| 26 |
"revision": null,
|
| 27 |
"target_modules": [
|
| 28 |
"down_proj",
|
| 29 |
-
"
|
| 30 |
"q_proj",
|
| 31 |
"k_proj",
|
| 32 |
-
"
|
| 33 |
"gate_proj"
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
|
|
|
| 26 |
"revision": null,
|
| 27 |
"target_modules": [
|
| 28 |
"down_proj",
|
| 29 |
+
"up_proj",
|
| 30 |
"q_proj",
|
| 31 |
"k_proj",
|
| 32 |
+
"v_proj",
|
| 33 |
"gate_proj"
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
qwen25_0.5b_lora_official_5e-05/checkpoint-117744/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 576045776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55ef7746abef55de9befcbfd9bde8562bc3069f2116df3552e0305bf4f898e78
|
| 3 |
size 576045776
|
qwen25_0.5b_lora_official_5e-05/checkpoint-117744/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 65122891
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:17611afa1dd91467d43bda2d2fac911c861f34644d6c67343fca6f8ed8b80060
|
| 3 |
size 65122891
|
qwen25_0.5b_lora_official_5e-05/checkpoint-117744/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14645
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86daa5470675396d4b6962790fbd7e535011cc46c86c81cec32ffcf78cb5f972
|
| 3 |
size 14645
|
qwen25_0.5b_lora_official_5e-05/checkpoint-117744/trainer_state.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
qwen25_0.5b_qlora_official_5e-05/adapter_config.json
CHANGED
|
@@ -25,12 +25,12 @@
|
|
| 25 |
"rank_pattern": {},
|
| 26 |
"revision": null,
|
| 27 |
"target_modules": [
|
| 28 |
-
"q_proj",
|
| 29 |
-
"up_proj",
|
| 30 |
"down_proj",
|
| 31 |
-
"v_proj",
|
| 32 |
"gate_proj",
|
| 33 |
-
"
|
|
|
|
|
|
|
|
|
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
| 36 |
"trainable_token_indices": null,
|
|
|
|
| 25 |
"rank_pattern": {},
|
| 26 |
"revision": null,
|
| 27 |
"target_modules": [
|
|
|
|
|
|
|
| 28 |
"down_proj",
|
|
|
|
| 29 |
"gate_proj",
|
| 30 |
+
"q_proj",
|
| 31 |
+
"v_proj",
|
| 32 |
+
"k_proj",
|
| 33 |
+
"up_proj"
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
| 36 |
"trainable_token_indices": null,
|
qwen25_0.5b_qlora_official_5e-05/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 32478192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d4ce4dbb8e62cc443704b1f1437112a10f488e7c2f9cc1465866eb20b8fdb164
|
| 3 |
size 32478192
|
qwen25_0.5b_qlora_official_5e-05/checkpoint-117744/adapter_config.json
CHANGED
|
@@ -25,12 +25,12 @@
|
|
| 25 |
"rank_pattern": {},
|
| 26 |
"revision": null,
|
| 27 |
"target_modules": [
|
| 28 |
-
"q_proj",
|
| 29 |
-
"up_proj",
|
| 30 |
"down_proj",
|
| 31 |
-
"v_proj",
|
| 32 |
"gate_proj",
|
| 33 |
-
"
|
|
|
|
|
|
|
|
|
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
| 36 |
"trainable_token_indices": null,
|
|
|
|
| 25 |
"rank_pattern": {},
|
| 26 |
"revision": null,
|
| 27 |
"target_modules": [
|
|
|
|
|
|
|
| 28 |
"down_proj",
|
|
|
|
| 29 |
"gate_proj",
|
| 30 |
+
"q_proj",
|
| 31 |
+
"v_proj",
|
| 32 |
+
"k_proj",
|
| 33 |
+
"up_proj"
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
| 36 |
"trainable_token_indices": null,
|
qwen25_0.5b_qlora_official_5e-05/checkpoint-117744/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 32478192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d4ce4dbb8e62cc443704b1f1437112a10f488e7c2f9cc1465866eb20b8fdb164
|
| 3 |
size 32478192
|
qwen25_0.5b_qlora_official_5e-05/checkpoint-117744/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 65122891
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:99c81924ccd383dc2e8f7e14e8af90c09e5e608b60600f1effc3cb3cf8c509a1
|
| 3 |
size 65122891
|
qwen25_0.5b_qlora_official_5e-05/checkpoint-117744/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14645
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86daa5470675396d4b6962790fbd7e535011cc46c86c81cec32ffcf78cb5f972
|
| 3 |
size 14645
|
qwen25_0.5b_qlora_official_5e-05/checkpoint-117744/trainer_state.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
qwen25_0.5b_qlora_official_5e-05/checkpoint-58872/adapter_config.json
CHANGED
|
@@ -25,12 +25,12 @@
|
|
| 25 |
"rank_pattern": {},
|
| 26 |
"revision": null,
|
| 27 |
"target_modules": [
|
| 28 |
-
"q_proj",
|
| 29 |
-
"up_proj",
|
| 30 |
"down_proj",
|
| 31 |
-
"v_proj",
|
| 32 |
"gate_proj",
|
| 33 |
-
"
|
|
|
|
|
|
|
|
|
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
| 36 |
"trainable_token_indices": null,
|
|
|
|
| 25 |
"rank_pattern": {},
|
| 26 |
"revision": null,
|
| 27 |
"target_modules": [
|
|
|
|
|
|
|
| 28 |
"down_proj",
|
|
|
|
| 29 |
"gate_proj",
|
| 30 |
+
"q_proj",
|
| 31 |
+
"v_proj",
|
| 32 |
+
"k_proj",
|
| 33 |
+
"up_proj"
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
| 36 |
"trainable_token_indices": null,
|
qwen25_0.5b_qlora_official_5e-05/checkpoint-58872/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 32478192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa9310da96e80178328afe21d54cd0ecf5a77c9863c2bc4f971e0f3a4d53b37f
|
| 3 |
size 32478192
|
qwen25_0.5b_qlora_official_5e-05/checkpoint-58872/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 65122891
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb68bee0db8f52773ee2df54015a455d1bf748ead0b00ab9d19ace1ffd7330d2
|
| 3 |
size 65122891
|
qwen25_0.5b_qlora_official_5e-05/checkpoint-58872/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14645
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a36e171992f098f3068f8b089a8a7bd86863eb6f5c67b464c1ea453a0da73fcb
|
| 3 |
size 14645
|
qwen25_0.5b_qlora_official_5e-05/checkpoint-58872/trainer_state.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
qwen25_0.5b_qlora_official_5e-05/complete_results.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|