llm001 L05 sft: 3 epoch
Browse files
- README.md +1 -1
- model.safetensors +1 -1
- training_args.bin +1 -1
README.md
CHANGED
|
@@ -23,7 +23,7 @@ SFT(有监督微调)版本:基于complexly/olmo3-190m-zh-continue,
|
|
| 23 |
## 训练配置
|
| 24 |
- Learning Rate:5.0e-5
|
| 25 |
- Warmup:5%
|
| 26 |
-
- Epochs:
|
| 27 |
- Max Seq Length:2048
|
| 28 |
- 使用 assistant_only_loss(仅对 assistant 部分计算 loss)
|
| 29 |
- per_device_train_batch_size: 24
|
|
|
|
| 23 |
## 训练配置
|
| 24 |
- Learning Rate:5.0e-5
|
| 25 |
- Warmup:5%
|
| 26 |
+
- Epochs:3 epoch
|
| 27 |
- Max Seq Length:2048
|
| 28 |
- 使用 assistant_only_loss(仅对 assistant 部分计算 loss)
|
| 29 |
- per_device_train_batch_size: 24
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 374038864
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e6767a84cd2fdd2e445f504e1e6753048ac01dd02a91e1113a7bd9cfb520392b
|
| 3 |
size 374038864
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:959ee926c718d5a1f3b65131f377b4022c9e09fc931de84a79b6b7d108766cf6
|
| 3 |
size 5368
|