OpensourceThai/Wilai
Browse files
- README.md +2 -2
- config.json +1 -1
- generation_config.json +1 -1
- pytorch_model.bin +1 -1
- runs/Sep08_03-09-32_e7c9d734d21f/events.out.tfevents.1757300975.e7c9d734d21f.597.0 +3 -0
- training_args.bin +1 -1
README.md
CHANGED
|
@@ -40,7 +40,7 @@ The following hyperparameters were used during training:
|
|
| 40 |
- optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
|
| 41 |
- lr_scheduler_type: linear
|
| 42 |
- lr_scheduler_warmup_steps: 100
|
| 43 |
-
- num_epochs:
|
| 44 |
- mixed_precision_training: Native AMP
|
| 45 |
|
| 46 |
### Training results
|
|
@@ -49,7 +49,7 @@ The following hyperparameters were used during training:
|
|
| 49 |
|
| 50 |
### Framework versions
|
| 51 |
|
| 52 |
-
- Transformers 4.56.
|
| 53 |
- Pytorch 2.8.0+cu126
|
| 54 |
- Datasets 4.0.0
|
| 55 |
- Tokenizers 0.22.0
|
|
|
|
| 40 |
- optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
|
| 41 |
- lr_scheduler_type: linear
|
| 42 |
- lr_scheduler_warmup_steps: 100
|
| 43 |
+
- num_epochs: 5
|
| 44 |
- mixed_precision_training: Native AMP
|
| 45 |
|
| 46 |
### Training results
|
|
|
|
| 49 |
|
| 50 |
### Framework versions
|
| 51 |
|
| 52 |
+
- Transformers 4.56.1
|
| 53 |
- Pytorch 2.8.0+cu126
|
| 54 |
- Datasets 4.0.0
|
| 55 |
- Tokenizers 0.22.0
|
config.json
CHANGED
|
@@ -17,7 +17,7 @@
|
|
| 17 |
"pad_token_id": 0,
|
| 18 |
"rope": true,
|
| 19 |
"top_k": 2,
|
| 20 |
-
"transformers_version": "4.56.
|
| 21 |
"use_flashattn": true,
|
| 22 |
"vocab_size": 48000
|
| 23 |
}
|
|
|
|
| 17 |
"pad_token_id": 0,
|
| 18 |
"rope": true,
|
| 19 |
"top_k": 2,
|
| 20 |
+
"transformers_version": "4.56.1",
|
| 21 |
"use_flashattn": true,
|
| 22 |
"vocab_size": 48000
|
| 23 |
}
|
generation_config.json
CHANGED
|
@@ -8,5 +8,5 @@
|
|
| 8 |
"pad_token_id": 0,
|
| 9 |
"temperature": 0.7,
|
| 10 |
"top_p": 0.9,
|
| 11 |
-
"transformers_version": "4.56.
|
| 12 |
}
|
|
|
|
| 8 |
"pad_token_id": 0,
|
| 9 |
"temperature": 0.7,
|
| 10 |
"top_p": 0.9,
|
| 11 |
+
"transformers_version": "4.56.1"
|
| 12 |
}
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 664188751
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5e1b15b691eb1a8abe0cf263fb2c66702cb3dc4476cfa945152e8abc3646db74
|
| 3 |
size 664188751
|
runs/Sep08_03-09-32_e7c9d734d21f/events.out.tfevents.1757300975.e7c9d734d21f.597.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f449bd9967575caa81f4d885b20a0988dd96d88e5c96ee766eea3c17d845f97b
|
| 3 |
+
size 38223
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5777
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:260edcef99f5c590cea91a68c06afb3fbf2b22114a949275810607d6481f8261
|
| 3 |
size 5777
|