Training in progress, epoch 1
Browse files
hyperparameters.yaml
CHANGED
|
@@ -87,14 +87,14 @@ include_tokens_per_second: false
|
|
| 87 |
jit_mode_eval: false
|
| 88 |
label_names: null
|
| 89 |
label_smoothing_factor: 0.0
|
| 90 |
-
learning_rate: 1.
|
| 91 |
length_column_name: length
|
| 92 |
load_best_model_at_end: true
|
| 93 |
local_rank: 0
|
| 94 |
log_level: passive
|
| 95 |
log_level_replica: warning
|
| 96 |
log_on_each_node: true
|
| 97 |
-
logging_dir: model_runs/donut_experiment_bayesian_trial_0/runs/
|
| 98 |
logging_first_step: false
|
| 99 |
logging_nan_inf_filter: true
|
| 100 |
logging_steps: 100
|
|
@@ -109,7 +109,7 @@ metric_for_best_model: loss
|
|
| 109 |
mp_parameters: ''
|
| 110 |
neftune_noise_alpha: null
|
| 111 |
no_cuda: false
|
| 112 |
-
num_train_epochs:
|
| 113 |
optim: !!python/object/apply:transformers.training_args.OptimizerNames
|
| 114 |
- adamw_torch
|
| 115 |
optim_args: null
|
|
@@ -157,4 +157,4 @@ use_legacy_prediction_loop: false
|
|
| 157 |
use_mps_device: false
|
| 158 |
warmup_ratio: 0.0
|
| 159 |
warmup_steps: 0
|
| 160 |
-
weight_decay: 0.
|
|
|
|
| 87 |
jit_mode_eval: false
|
| 88 |
label_names: null
|
| 89 |
label_smoothing_factor: 0.0
|
| 90 |
+
learning_rate: 1.2045081648781836e-05
|
| 91 |
length_column_name: length
|
| 92 |
load_best_model_at_end: true
|
| 93 |
local_rank: 0
|
| 94 |
log_level: passive
|
| 95 |
log_level_replica: warning
|
| 96 |
log_on_each_node: true
|
| 97 |
+
logging_dir: model_runs/donut_experiment_bayesian_trial_0/runs/May30_15-29-21_ip-172-16-168-165.ec2.internal
|
| 98 |
logging_first_step: false
|
| 99 |
logging_nan_inf_filter: true
|
| 100 |
logging_steps: 100
|
|
|
|
| 109 |
mp_parameters: ''
|
| 110 |
neftune_noise_alpha: null
|
| 111 |
no_cuda: false
|
| 112 |
+
num_train_epochs: 5
|
| 113 |
optim: !!python/object/apply:transformers.training_args.OptimizerNames
|
| 114 |
- adamw_torch
|
| 115 |
optim_args: null
|
|
|
|
| 157 |
use_mps_device: false
|
| 158 |
warmup_ratio: 0.0
|
| 159 |
warmup_steps: 0
|
| 160 |
+
weight_decay: 0.008800425083056953
|
hyperparameters_tuned.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"learning_rate": 1.
|
|
|
|
| 1 |
+
{"learning_rate": 1.2045081648781836e-05, "weight_decay": 0.008800425083056953, "num_train_epochs": 5}
|
metrics.jsonl
CHANGED
|
@@ -1,2 +1 @@
|
|
| 1 |
-
{"eval_loss": 0.
|
| 2 |
-
{"eval_loss": 0.47436320781707764, "eval_bleu": 0.0691840661962562, "eval_precisions": [0.8295218295218295, 0.7735849056603774, 0.7247956403269755, 0.6838709677419355], "eval_brevity_penalty": 0.09212440522976928, "eval_length_ratio": 0.29545454545454547, "eval_translation_length": 481, "eval_reference_length": 1628, "eval_cer": 0.7526673269798355, "eval_wer": 0.82323955242213, "eval_runtime": 71.6494, "eval_samples_per_second": 0.796, "eval_steps_per_second": 0.796, "epoch": 2.0}
|
|
|
|
| 1 |
+
{"eval_loss": 0.6227948665618896, "eval_bleu": 0.04856205045021571, "eval_precisions": [0.7096774193548387, 0.6053921568627451, 0.5612535612535613, 0.5102040816326531], "eval_brevity_penalty": 0.08199678262097645, "eval_length_ratio": 0.2856265356265356, "eval_translation_length": 465, "eval_reference_length": 1628, "eval_cer": 0.775094682355145, "eval_wer": 0.8591598980283793, "eval_runtime": 187.5635, "eval_samples_per_second": 0.304, "eval_steps_per_second": 0.304, "epoch": 1.0}
|
|
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 809103512
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:727f7c42a1e454798ad4c84ec87ef1dd197a4148290db837d0d86c003f128542
|
| 3 |
size 809103512
|
runs/May30_15-29-21_ip-172-16-168-165.ec2.internal/events.out.tfevents.1717082961.ip-172-16-168-165.ec2.internal.8916.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a00329ca35c2cb96744bbd74bcd59f96bb5d3047dd56e7f4f8fc25e872c5b5d9
|
| 3 |
+
size 10299
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5240
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78cdc1eb0aab87935dcb50385d3f8cd3ccb575e79c07b0a2828bd81d4871de6e
|
| 3 |
size 5240
|