BenjaminPittsley committed on
Commit
c3162b6
·
verified ·
1 Parent(s): 7d4c384

Model save

Browse files
Files changed (2) hide show
  1. README.md +9 -11
  2. generation_config.json +2 -4
README.md CHANGED
@@ -33,16 +33,14 @@ More information needed
33
  ### Training hyperparameters
34
 
35
  The following hyperparameters were used during training:
36
- - learning_rate: 5e-05
37
- - train_batch_size: 8
38
- - eval_batch_size: 16
39
  - seed: 42
40
- - gradient_accumulation_steps: 2
41
- - total_train_batch_size: 16
42
- - optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
43
  - lr_scheduler_type: linear
44
- - lr_scheduler_warmup_steps: 100
45
- - num_epochs: 5
46
  - mixed_precision_training: Native AMP
47
 
48
  ### Training results
@@ -51,7 +49,7 @@ The following hyperparameters were used during training:
51
 
52
  ### Framework versions
53
 
54
- - Transformers 4.57.1
55
- - Pytorch 2.8.0+cu126
56
  - Datasets 4.4.1
57
- - Tokenizers 0.22.1
 
33
  ### Training hyperparameters
34
 
35
  The following hyperparameters were used during training:
36
+ - learning_rate: 0.0003
37
+ - train_batch_size: 2
38
+ - eval_batch_size: 8
39
  - seed: 42
40
+ - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
 
 
41
  - lr_scheduler_type: linear
42
+ - lr_scheduler_warmup_ratio: 0.1
43
+ - num_epochs: 50
44
  - mixed_precision_training: Native AMP
45
 
46
  ### Training results
 
49
 
50
  ### Framework versions
51
 
52
+ - Transformers 4.53.3
53
+ - Pytorch 2.6.0+cu124
54
  - Datasets 4.4.1
55
+ - Tokenizers 0.21.2
generation_config.json CHANGED
@@ -1,9 +1,7 @@
1
  {
2
  "_from_model_config": true,
3
  "decoder_start_token_id": 0,
4
- "eos_token_id": [
5
- 1
6
- ],
7
  "pad_token_id": 0,
8
- "transformers_version": "4.57.1"
9
  }
 
1
  {
2
  "_from_model_config": true,
3
  "decoder_start_token_id": 0,
4
+ "eos_token_id": 1,
 
 
5
  "pad_token_id": 0,
6
+ "transformers_version": "4.53.3"
7
  }