End of training
Browse files
- README.md +14 -1
- tokenizer_config.json +1 -1
README.md
CHANGED
|
@@ -48,7 +48,7 @@ The following hyperparameters were used during training:
|
|
| 48 |
- seed: 42
|
| 49 |
- optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
|
| 50 |
- lr_scheduler_type: linear
|
| 51 |
-
- num_epochs:
|
| 52 |
- mixed_precision_training: Native AMP
|
| 53 |
|
| 54 |
### Training results
|
|
@@ -57,6 +57,19 @@ The following hyperparameters were used during training:
|
|
| 57 |
|:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:---:|
|
| 58 |
| 0.0 | 1.0 | 224 | nan | 0.0 | 0.0 | 0.0 |
|
| 59 |
| 0.0 | 2.0 | 448 | nan | 0.0 | 0.0 | 0.0 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 60 |
|
| 61 |
|
| 62 |
### Framework versions
|
|
|
|
| 48 |
- seed: 42
|
| 49 |
- optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
|
| 50 |
- lr_scheduler_type: linear
|
| 51 |
+
- num_epochs: 15
|
| 52 |
- mixed_precision_training: Native AMP
|
| 53 |
|
| 54 |
### Training results
|
|
|
|
| 57 |
|:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:---:|
|
| 58 |
| 0.0 | 1.0 | 224 | nan | 0.0 | 0.0 | 0.0 |
|
| 59 |
| 0.0 | 2.0 | 448 | nan | 0.0 | 0.0 | 0.0 |
|
| 60 |
+
| 0.0 | 3.0 | 672 | nan | 0.0 | 0.0 | 0.0 |
|
| 61 |
+
| 0.0 | 4.0 | 896 | nan | 0.0 | 0.0 | 0.0 |
|
| 62 |
+
| 0.0 | 5.0 | 1120 | nan | 0.0 | 0.0 | 0.0 |
|
| 63 |
+
| 0.0 | 6.0 | 1344 | nan | 0.0 | 0.0 | 0.0 |
|
| 64 |
+
| 0.0 | 7.0 | 1568 | nan | 0.0 | 0.0 | 0.0 |
|
| 65 |
+
| 0.0 | 8.0 | 1792 | nan | 0.0 | 0.0 | 0.0 |
|
| 66 |
+
| 0.0 | 9.0 | 2016 | nan | 0.0 | 0.0 | 0.0 |
|
| 67 |
+
| 0.0 | 10.0 | 2240 | nan | 0.0 | 0.0 | 0.0 |
|
| 68 |
+
| 0.0 | 11.0 | 2464 | nan | 0.0 | 0.0 | 0.0 |
|
| 69 |
+
| 0.0 | 12.0 | 2688 | nan | 0.0 | 0.0 | 0.0 |
|
| 70 |
+
| 0.0 | 13.0 | 2912 | nan | 0.0 | 0.0 | 0.0 |
|
| 71 |
+
| 0.0 | 14.0 | 3136 | nan | 0.0 | 0.0 | 0.0 |
|
| 72 |
+
| 0.0 | 15.0 | 3360 | nan | 0.0 | 0.0 | 0.0 |
|
| 73 |
|
| 74 |
|
| 75 |
### Framework versions
|
tokenizer_config.json
CHANGED
|
@@ -932,7 +932,7 @@
|
|
| 932 |
"eos_token": "</s>",
|
| 933 |
"extra_ids": 100,
|
| 934 |
"extra_special_tokens": {},
|
| 935 |
-
"max_length":
|
| 936 |
"model_max_length": 512,
|
| 937 |
"pad_token": "<pad>",
|
| 938 |
"sp_model_kwargs": {},
|
|
|
|
| 932 |
"eos_token": "</s>",
|
| 933 |
"extra_ids": 100,
|
| 934 |
"extra_special_tokens": {},
|
| 935 |
+
"max_length": 224,
|
| 936 |
"model_max_length": 512,
|
| 937 |
"pad_token": "<pad>",
|
| 938 |
"sp_model_kwargs": {},
|