| { |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 0.7568296795952782, |
| "eval_steps": 187, |
| "global_step": 8976, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.0, |
| "grad_norm": 8.5, |
| "learning_rate": 1e-05, |
| "loss": 1.9119, |
| "step": 1 |
| }, |
| { |
| "epoch": 0.02, |
| "grad_norm": 4.59375, |
| "learning_rate": 1e-05, |
| "loss": 1.7164, |
| "step": 187 |
| }, |
| { |
| "epoch": 0.02, |
| "eval_validation_privacy_sources_loss": 1.0334585905075073, |
| "eval_validation_privacy_sources_runtime": 212.2756, |
| "eval_validation_privacy_sources_samples_per_second": 1.804, |
| "eval_validation_privacy_sources_steps_per_second": 0.904, |
| "step": 187 |
| }, |
| { |
| "epoch": 0.02, |
| "eval_validation_agenda_digitale_loss": 1.5160526037216187, |
| "eval_validation_agenda_digitale_runtime": 188.4106, |
| "eval_validation_agenda_digitale_samples_per_second": 1.805, |
| "eval_validation_agenda_digitale_steps_per_second": 0.902, |
| "step": 187 |
| }, |
| { |
| "epoch": 0.02, |
| "eval_validation_leggepertutti_loss": 1.3417482376098633, |
| "eval_validation_leggepertutti_runtime": 35.8837, |
| "eval_validation_leggepertutti_samples_per_second": 1.811, |
| "eval_validation_leggepertutti_steps_per_second": 0.92, |
| "step": 187 |
| }, |
| { |
| "epoch": 0.02, |
| "eval_validation_altalexprivacy_loss": 1.3672271966934204, |
| "eval_validation_altalexprivacy_runtime": 58.6063, |
| "eval_validation_altalexprivacy_samples_per_second": 1.809, |
| "eval_validation_altalexprivacy_steps_per_second": 0.904, |
| "step": 187 |
| }, |
| { |
| "epoch": 0.02, |
| "eval_validation_mc4_it_loss": 1.9217756986618042, |
| "eval_validation_mc4_it_runtime": 78.6277, |
| "eval_validation_mc4_it_samples_per_second": 1.806, |
| "eval_validation_mc4_it_steps_per_second": 0.903, |
| "step": 187 |
| }, |
| { |
| "epoch": 0.02, |
| "eval_validation_dolma_loss": 1.9627543687820435, |
| "eval_validation_dolma_runtime": 54.0088, |
| "eval_validation_dolma_samples_per_second": 1.815, |
| "eval_validation_dolma_steps_per_second": 0.907, |
| "step": 187 |
| }, |
| { |
| "epoch": 0.03, |
| "grad_norm": 3.859375, |
| "learning_rate": 1e-05, |
| "loss": 1.6579, |
| "step": 374 |
| }, |
| { |
| "epoch": 0.03, |
| "eval_validation_privacy_sources_loss": 0.9830030798912048, |
| "eval_validation_privacy_sources_runtime": 210.811, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 374 |
| }, |
| { |
| "epoch": 0.03, |
| "eval_validation_agenda_digitale_loss": 1.4846152067184448, |
| "eval_validation_agenda_digitale_runtime": 187.1837, |
| "eval_validation_agenda_digitale_samples_per_second": 1.816, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 374 |
| }, |
| { |
| "epoch": 0.03, |
| "eval_validation_leggepertutti_loss": 1.3172152042388916, |
| "eval_validation_leggepertutti_runtime": 35.7866, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 374 |
| }, |
| { |
| "epoch": 0.03, |
| "eval_validation_altalexprivacy_loss": 1.3326139450073242, |
| "eval_validation_altalexprivacy_runtime": 58.3381, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 374 |
| }, |
| { |
| "epoch": 0.03, |
| "eval_validation_mc4_it_loss": 1.8915678262710571, |
| "eval_validation_mc4_it_runtime": 78.169, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 374 |
| }, |
| { |
| "epoch": 0.03, |
| "eval_validation_dolma_loss": 1.9608409404754639, |
| "eval_validation_dolma_runtime": 53.9716, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 374 |
| }, |
| { |
| "epoch": 0.05, |
| "grad_norm": 3.484375, |
| "learning_rate": 1e-05, |
| "loss": 1.6402, |
| "step": 561 |
| }, |
| { |
| "epoch": 0.05, |
| "eval_validation_privacy_sources_loss": 0.9559596180915833, |
| "eval_validation_privacy_sources_runtime": 210.7246, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 561 |
| }, |
| { |
| "epoch": 0.05, |
| "eval_validation_agenda_digitale_loss": 1.4720743894577026, |
| "eval_validation_agenda_digitale_runtime": 187.11, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 561 |
| }, |
| { |
| "epoch": 0.05, |
| "eval_validation_leggepertutti_loss": 1.3074837923049927, |
| "eval_validation_leggepertutti_runtime": 35.7797, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 561 |
| }, |
| { |
| "epoch": 0.05, |
| "eval_validation_altalexprivacy_loss": 1.3142317533493042, |
| "eval_validation_altalexprivacy_runtime": 58.315, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 561 |
| }, |
| { |
| "epoch": 0.05, |
| "eval_validation_mc4_it_loss": 1.87451171875, |
| "eval_validation_mc4_it_runtime": 78.1299, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 561 |
| }, |
| { |
| "epoch": 0.05, |
| "eval_validation_dolma_loss": 1.956404447555542, |
| "eval_validation_dolma_runtime": 53.9194, |
| "eval_validation_dolma_samples_per_second": 1.818, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 561 |
| }, |
| { |
| "epoch": 0.06, |
| "grad_norm": 9.625, |
| "learning_rate": 1e-05, |
| "loss": 1.6284, |
| "step": 748 |
| }, |
| { |
| "epoch": 0.06, |
| "eval_validation_privacy_sources_loss": 0.933682918548584, |
| "eval_validation_privacy_sources_runtime": 210.799, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 748 |
| }, |
| { |
| "epoch": 0.06, |
| "eval_validation_agenda_digitale_loss": 1.4578524827957153, |
| "eval_validation_agenda_digitale_runtime": 187.08, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 748 |
| }, |
| { |
| "epoch": 0.06, |
| "eval_validation_leggepertutti_loss": 1.2905200719833374, |
| "eval_validation_leggepertutti_runtime": 35.7738, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 748 |
| }, |
| { |
| "epoch": 0.06, |
| "eval_validation_altalexprivacy_loss": 1.2977306842803955, |
| "eval_validation_altalexprivacy_runtime": 58.3215, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 748 |
| }, |
| { |
| "epoch": 0.06, |
| "eval_validation_mc4_it_loss": 1.8592724800109863, |
| "eval_validation_mc4_it_runtime": 78.1141, |
| "eval_validation_mc4_it_samples_per_second": 1.818, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 748 |
| }, |
| { |
| "epoch": 0.06, |
| "eval_validation_dolma_loss": 1.9574466943740845, |
| "eval_validation_dolma_runtime": 53.9297, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 748 |
| }, |
| { |
| "epoch": 0.08, |
| "grad_norm": 3.390625, |
| "learning_rate": 1e-05, |
| "loss": 1.6082, |
| "step": 935 |
| }, |
| { |
| "epoch": 0.08, |
| "eval_validation_privacy_sources_loss": 0.919241726398468, |
| "eval_validation_privacy_sources_runtime": 210.6302, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.912, |
| "step": 935 |
| }, |
| { |
| "epoch": 0.08, |
| "eval_validation_agenda_digitale_loss": 1.4438046216964722, |
| "eval_validation_agenda_digitale_runtime": 187.0727, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 935 |
| }, |
| { |
| "epoch": 0.08, |
| "eval_validation_leggepertutti_loss": 1.2822848558425903, |
| "eval_validation_leggepertutti_runtime": 35.7909, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 935 |
| }, |
| { |
| "epoch": 0.08, |
| "eval_validation_altalexprivacy_loss": 1.2801928520202637, |
| "eval_validation_altalexprivacy_runtime": 58.3369, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 935 |
| }, |
| { |
| "epoch": 0.08, |
| "eval_validation_mc4_it_loss": 1.8457767963409424, |
| "eval_validation_mc4_it_runtime": 78.1714, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 935 |
| }, |
| { |
| "epoch": 0.08, |
| "eval_validation_dolma_loss": 1.9588344097137451, |
| "eval_validation_dolma_runtime": 53.9317, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 935 |
| }, |
| { |
| "epoch": 0.09, |
| "grad_norm": 3.46875, |
| "learning_rate": 1e-05, |
| "loss": 1.5989, |
| "step": 1122 |
| }, |
| { |
| "epoch": 0.09, |
| "eval_validation_privacy_sources_loss": 0.9032600522041321, |
| "eval_validation_privacy_sources_runtime": 210.7002, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 1122 |
| }, |
| { |
| "epoch": 0.09, |
| "eval_validation_agenda_digitale_loss": 1.433292031288147, |
| "eval_validation_agenda_digitale_runtime": 187.0521, |
| "eval_validation_agenda_digitale_samples_per_second": 1.818, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 1122 |
| }, |
| { |
| "epoch": 0.09, |
| "eval_validation_leggepertutti_loss": 1.2763991355895996, |
| "eval_validation_leggepertutti_runtime": 35.7627, |
| "eval_validation_leggepertutti_samples_per_second": 1.818, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 1122 |
| }, |
| { |
| "epoch": 0.09, |
| "eval_validation_altalexprivacy_loss": 1.2663257122039795, |
| "eval_validation_altalexprivacy_runtime": 58.3197, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 1122 |
| }, |
| { |
| "epoch": 0.09, |
| "eval_validation_mc4_it_loss": 1.8358547687530518, |
| "eval_validation_mc4_it_runtime": 78.1183, |
| "eval_validation_mc4_it_samples_per_second": 1.818, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 1122 |
| }, |
| { |
| "epoch": 0.09, |
| "eval_validation_dolma_loss": 2.0097882747650146, |
| "eval_validation_dolma_runtime": 53.9266, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 1122 |
| }, |
| { |
| "epoch": 0.11, |
| "grad_norm": 3.40625, |
| "learning_rate": 1e-05, |
| "loss": 1.6161, |
| "step": 1309 |
| }, |
| { |
| "epoch": 0.11, |
| "eval_validation_privacy_sources_loss": 0.8906105160713196, |
| "eval_validation_privacy_sources_runtime": 210.7431, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 1309 |
| }, |
| { |
| "epoch": 0.11, |
| "eval_validation_agenda_digitale_loss": 1.4252179861068726, |
| "eval_validation_agenda_digitale_runtime": 187.1263, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 1309 |
| }, |
| { |
| "epoch": 0.11, |
| "eval_validation_leggepertutti_loss": 1.2690521478652954, |
| "eval_validation_leggepertutti_runtime": 35.7673, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 1309 |
| }, |
| { |
| "epoch": 0.11, |
| "eval_validation_altalexprivacy_loss": 1.258312463760376, |
| "eval_validation_altalexprivacy_runtime": 58.3303, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 1309 |
| }, |
| { |
| "epoch": 0.11, |
| "eval_validation_mc4_it_loss": 1.8263970613479614, |
| "eval_validation_mc4_it_runtime": 78.147, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 1309 |
| }, |
| { |
| "epoch": 0.11, |
| "eval_validation_dolma_loss": 1.9555673599243164, |
| "eval_validation_dolma_runtime": 53.9288, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 1309 |
| }, |
| { |
| "epoch": 0.13, |
| "grad_norm": 3.25, |
| "learning_rate": 1e-05, |
| "loss": 1.5911, |
| "step": 1496 |
| }, |
| { |
| "epoch": 0.13, |
| "eval_validation_privacy_sources_loss": 0.8815954327583313, |
| "eval_validation_privacy_sources_runtime": 210.7215, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 1496 |
| }, |
| { |
| "epoch": 0.13, |
| "eval_validation_agenda_digitale_loss": 1.4188568592071533, |
| "eval_validation_agenda_digitale_runtime": 187.0962, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 1496 |
| }, |
| { |
| "epoch": 0.13, |
| "eval_validation_leggepertutti_loss": 1.269508957862854, |
| "eval_validation_leggepertutti_runtime": 35.7762, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 1496 |
| }, |
| { |
| "epoch": 0.13, |
| "eval_validation_altalexprivacy_loss": 1.2556049823760986, |
| "eval_validation_altalexprivacy_runtime": 58.3467, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 1496 |
| }, |
| { |
| "epoch": 0.13, |
| "eval_validation_mc4_it_loss": 1.8174842596054077, |
| "eval_validation_mc4_it_runtime": 78.1412, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 1496 |
| }, |
| { |
| "epoch": 0.13, |
| "eval_validation_dolma_loss": 1.9592047929763794, |
| "eval_validation_dolma_runtime": 53.9471, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 1496 |
| }, |
| { |
| "epoch": 0.14, |
| "grad_norm": 3.359375, |
| "learning_rate": 1e-05, |
| "loss": 1.5694, |
| "step": 1683 |
| }, |
| { |
| "epoch": 0.14, |
| "eval_validation_privacy_sources_loss": 0.8737432956695557, |
| "eval_validation_privacy_sources_runtime": 210.8196, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 1683 |
| }, |
| { |
| "epoch": 0.14, |
| "eval_validation_agenda_digitale_loss": 1.4132717847824097, |
| "eval_validation_agenda_digitale_runtime": 187.1554, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 1683 |
| }, |
| { |
| "epoch": 0.14, |
| "eval_validation_leggepertutti_loss": 1.2630620002746582, |
| "eval_validation_leggepertutti_runtime": 35.7934, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 1683 |
| }, |
| { |
| "epoch": 0.14, |
| "eval_validation_altalexprivacy_loss": 1.247528076171875, |
| "eval_validation_altalexprivacy_runtime": 58.3547, |
| "eval_validation_altalexprivacy_samples_per_second": 1.816, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 1683 |
| }, |
| { |
| "epoch": 0.14, |
| "eval_validation_mc4_it_loss": 1.8103784322738647, |
| "eval_validation_mc4_it_runtime": 78.1665, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 1683 |
| }, |
| { |
| "epoch": 0.14, |
| "eval_validation_dolma_loss": 1.956905722618103, |
| "eval_validation_dolma_runtime": 53.9622, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 1683 |
| }, |
| { |
| "epoch": 0.16, |
| "grad_norm": 3.1875, |
| "learning_rate": 1e-05, |
| "loss": 1.563, |
| "step": 1870 |
| }, |
| { |
| "epoch": 0.16, |
| "eval_validation_privacy_sources_loss": 0.8650386929512024, |
| "eval_validation_privacy_sources_runtime": 210.8215, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 1870 |
| }, |
| { |
| "epoch": 0.16, |
| "eval_validation_agenda_digitale_loss": 1.4071804285049438, |
| "eval_validation_agenda_digitale_runtime": 187.1502, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 1870 |
| }, |
| { |
| "epoch": 0.16, |
| "eval_validation_leggepertutti_loss": 1.2562586069107056, |
| "eval_validation_leggepertutti_runtime": 35.7742, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 1870 |
| }, |
| { |
| "epoch": 0.16, |
| "eval_validation_altalexprivacy_loss": 1.240662932395935, |
| "eval_validation_altalexprivacy_runtime": 58.3499, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 1870 |
| }, |
| { |
| "epoch": 0.16, |
| "eval_validation_mc4_it_loss": 1.8042465448379517, |
| "eval_validation_mc4_it_runtime": 78.1652, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 1870 |
| }, |
| { |
| "epoch": 0.16, |
| "eval_validation_dolma_loss": 1.9527182579040527, |
| "eval_validation_dolma_runtime": 53.948, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 1870 |
| }, |
| { |
| "epoch": 0.17, |
| "grad_norm": 3.171875, |
| "learning_rate": 1e-05, |
| "loss": 1.5747, |
| "step": 2057 |
| }, |
| { |
| "epoch": 0.17, |
| "eval_validation_privacy_sources_loss": 0.8606281876564026, |
| "eval_validation_privacy_sources_runtime": 210.8197, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 2057 |
| }, |
| { |
| "epoch": 0.17, |
| "eval_validation_agenda_digitale_loss": 1.401216983795166, |
| "eval_validation_agenda_digitale_runtime": 187.1929, |
| "eval_validation_agenda_digitale_samples_per_second": 1.816, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 2057 |
| }, |
| { |
| "epoch": 0.17, |
| "eval_validation_leggepertutti_loss": 1.249880075454712, |
| "eval_validation_leggepertutti_runtime": 35.7828, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 2057 |
| }, |
| { |
| "epoch": 0.17, |
| "eval_validation_altalexprivacy_loss": 1.2347912788391113, |
| "eval_validation_altalexprivacy_runtime": 58.3271, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 2057 |
| }, |
| { |
| "epoch": 0.17, |
| "eval_validation_mc4_it_loss": 1.7988897562026978, |
| "eval_validation_mc4_it_runtime": 78.1637, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 2057 |
| }, |
| { |
| "epoch": 0.17, |
| "eval_validation_dolma_loss": 1.9512945413589478, |
| "eval_validation_dolma_runtime": 53.9545, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 2057 |
| }, |
| { |
| "epoch": 0.19, |
| "grad_norm": 3.703125, |
| "learning_rate": 1e-05, |
| "loss": 1.5631, |
| "step": 2244 |
| }, |
| { |
| "epoch": 0.19, |
| "eval_validation_privacy_sources_loss": 0.8552854061126709, |
| "eval_validation_privacy_sources_runtime": 210.7654, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 2244 |
| }, |
| { |
| "epoch": 0.19, |
| "eval_validation_agenda_digitale_loss": 1.3981597423553467, |
| "eval_validation_agenda_digitale_runtime": 187.0896, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 2244 |
| }, |
| { |
| "epoch": 0.19, |
| "eval_validation_leggepertutti_loss": 1.249776840209961, |
| "eval_validation_leggepertutti_runtime": 35.7701, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 2244 |
| }, |
| { |
| "epoch": 0.19, |
| "eval_validation_altalexprivacy_loss": 1.2317657470703125, |
| "eval_validation_altalexprivacy_runtime": 58.3402, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 2244 |
| }, |
| { |
| "epoch": 0.19, |
| "eval_validation_mc4_it_loss": 1.7936795949935913, |
| "eval_validation_mc4_it_runtime": 78.1539, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 2244 |
| }, |
| { |
| "epoch": 0.19, |
| "eval_validation_dolma_loss": 1.949507474899292, |
| "eval_validation_dolma_runtime": 53.9287, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 2244 |
| }, |
| { |
| "epoch": 0.2, |
| "grad_norm": 3.28125, |
| "learning_rate": 1e-05, |
| "loss": 1.5502, |
| "step": 2431 |
| }, |
| { |
| "epoch": 0.2, |
| "eval_validation_privacy_sources_loss": 0.8490111231803894, |
| "eval_validation_privacy_sources_runtime": 210.7371, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 2431 |
| }, |
| { |
| "epoch": 0.2, |
| "eval_validation_agenda_digitale_loss": 1.391976237297058, |
| "eval_validation_agenda_digitale_runtime": 187.0694, |
| "eval_validation_agenda_digitale_samples_per_second": 1.818, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 2431 |
| }, |
| { |
| "epoch": 0.2, |
| "eval_validation_leggepertutti_loss": 1.2457927465438843, |
| "eval_validation_leggepertutti_runtime": 35.7756, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 2431 |
| }, |
| { |
| "epoch": 0.2, |
| "eval_validation_altalexprivacy_loss": 1.2249823808670044, |
| "eval_validation_altalexprivacy_runtime": 58.3391, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 2431 |
| }, |
| { |
| "epoch": 0.2, |
| "eval_validation_mc4_it_loss": 1.7877947092056274, |
| "eval_validation_mc4_it_runtime": 78.1519, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 2431 |
| }, |
| { |
| "epoch": 0.2, |
| "eval_validation_dolma_loss": 1.9478541612625122, |
| "eval_validation_dolma_runtime": 53.9392, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 2431 |
| }, |
| { |
| "epoch": 0.22, |
| "grad_norm": 3.109375, |
| "learning_rate": 1e-05, |
| "loss": 1.5612, |
| "step": 2618 |
| }, |
| { |
| "epoch": 0.22, |
| "eval_validation_privacy_sources_loss": 0.8443201184272766, |
| "eval_validation_privacy_sources_runtime": 210.7053, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 2618 |
| }, |
| { |
| "epoch": 0.22, |
| "eval_validation_agenda_digitale_loss": 1.3874356746673584, |
| "eval_validation_agenda_digitale_runtime": 187.0741, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 2618 |
| }, |
| { |
| "epoch": 0.22, |
| "eval_validation_leggepertutti_loss": 1.242628574371338, |
| "eval_validation_leggepertutti_runtime": 35.7724, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 2618 |
| }, |
| { |
| "epoch": 0.22, |
| "eval_validation_altalexprivacy_loss": 1.22023606300354, |
| "eval_validation_altalexprivacy_runtime": 58.3215, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 2618 |
| }, |
| { |
| "epoch": 0.22, |
| "eval_validation_mc4_it_loss": 1.783267617225647, |
| "eval_validation_mc4_it_runtime": 78.1277, |
| "eval_validation_mc4_it_samples_per_second": 1.818, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 2618 |
| }, |
| { |
| "epoch": 0.22, |
| "eval_validation_dolma_loss": 1.9474639892578125, |
| "eval_validation_dolma_runtime": 53.9215, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 2618 |
| }, |
| { |
| "epoch": 0.24, |
| "grad_norm": 9.0, |
| "learning_rate": 1e-05, |
| "loss": 1.5625, |
| "step": 2805 |
| }, |
| { |
| "epoch": 0.24, |
| "eval_validation_privacy_sources_loss": 0.8386737108230591, |
| "eval_validation_privacy_sources_runtime": 210.6496, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 2805 |
| }, |
| { |
| "epoch": 0.24, |
| "eval_validation_agenda_digitale_loss": 1.3825620412826538, |
| "eval_validation_agenda_digitale_runtime": 186.9852, |
| "eval_validation_agenda_digitale_samples_per_second": 1.818, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 2805 |
| }, |
| { |
| "epoch": 0.24, |
| "eval_validation_leggepertutti_loss": 1.2439346313476562, |
| "eval_validation_leggepertutti_runtime": 35.762, |
| "eval_validation_leggepertutti_samples_per_second": 1.818, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 2805 |
| }, |
| { |
| "epoch": 0.24, |
| "eval_validation_altalexprivacy_loss": 1.2144984006881714, |
| "eval_validation_altalexprivacy_runtime": 58.2929, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 2805 |
| }, |
| { |
| "epoch": 0.24, |
| "eval_validation_mc4_it_loss": 1.7777953147888184, |
| "eval_validation_mc4_it_runtime": 78.0862, |
| "eval_validation_mc4_it_samples_per_second": 1.819, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 2805 |
| }, |
| { |
| "epoch": 0.24, |
| "eval_validation_dolma_loss": 1.9426158666610718, |
| "eval_validation_dolma_runtime": 53.8932, |
| "eval_validation_dolma_samples_per_second": 1.818, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 2805 |
| }, |
| { |
| "epoch": 0.25, |
| "grad_norm": 3.09375, |
| "learning_rate": 1e-05, |
| "loss": 1.5659, |
| "step": 2992 |
| }, |
| { |
| "epoch": 0.25, |
| "eval_validation_privacy_sources_loss": 0.8341156840324402, |
| "eval_validation_privacy_sources_runtime": 210.6733, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 2992 |
| }, |
| { |
| "epoch": 0.25, |
| "eval_validation_agenda_digitale_loss": 1.3803825378417969, |
| "eval_validation_agenda_digitale_runtime": 187.0096, |
| "eval_validation_agenda_digitale_samples_per_second": 1.818, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 2992 |
| }, |
| { |
| "epoch": 0.25, |
| "eval_validation_leggepertutti_loss": 1.2398289442062378, |
| "eval_validation_leggepertutti_runtime": 35.7578, |
| "eval_validation_leggepertutti_samples_per_second": 1.818, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 2992 |
| }, |
| { |
| "epoch": 0.25, |
| "eval_validation_altalexprivacy_loss": 1.2100013494491577, |
| "eval_validation_altalexprivacy_runtime": 58.3051, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 2992 |
| }, |
| { |
| "epoch": 0.25, |
| "eval_validation_mc4_it_loss": 1.7749333381652832, |
| "eval_validation_mc4_it_runtime": 78.0968, |
| "eval_validation_mc4_it_samples_per_second": 1.818, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 2992 |
| }, |
| { |
| "epoch": 0.25, |
| "eval_validation_dolma_loss": 1.9426519870758057, |
| "eval_validation_dolma_runtime": 53.9195, |
| "eval_validation_dolma_samples_per_second": 1.818, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 2992 |
| }, |
| { |
| "epoch": 0.27, |
| "grad_norm": 3.265625, |
| "learning_rate": 1e-05, |
| "loss": 1.5527, |
| "step": 3179 |
| }, |
| { |
| "epoch": 0.27, |
| "eval_validation_privacy_sources_loss": 0.8318145871162415, |
| "eval_validation_privacy_sources_runtime": 210.7255, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 3179 |
| }, |
| { |
| "epoch": 0.27, |
| "eval_validation_agenda_digitale_loss": 1.378063440322876, |
| "eval_validation_agenda_digitale_runtime": 187.087, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 3179 |
| }, |
| { |
| "epoch": 0.27, |
| "eval_validation_leggepertutti_loss": 1.2370458841323853, |
| "eval_validation_leggepertutti_runtime": 35.7809, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 3179 |
| }, |
| { |
| "epoch": 0.27, |
| "eval_validation_altalexprivacy_loss": 1.2080256938934326, |
| "eval_validation_altalexprivacy_runtime": 58.3354, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 3179 |
| }, |
| { |
| "epoch": 0.27, |
| "eval_validation_mc4_it_loss": 1.7702537775039673, |
| "eval_validation_mc4_it_runtime": 78.1409, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 3179 |
| }, |
| { |
| "epoch": 0.27, |
| "eval_validation_dolma_loss": 1.950868844985962, |
| "eval_validation_dolma_runtime": 53.9369, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 3179 |
| }, |
| { |
| "epoch": 0.28, |
| "grad_norm": 3.265625, |
| "learning_rate": 1e-05, |
| "loss": 1.5476, |
| "step": 3366 |
| }, |
| { |
| "epoch": 0.28, |
| "eval_validation_privacy_sources_loss": 0.8264653086662292, |
| "eval_validation_privacy_sources_runtime": 210.7205, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 3366 |
| }, |
| { |
| "epoch": 0.28, |
| "eval_validation_agenda_digitale_loss": 1.3743617534637451, |
| "eval_validation_agenda_digitale_runtime": 187.1448, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 3366 |
| }, |
| { |
| "epoch": 0.28, |
| "eval_validation_leggepertutti_loss": 1.2376344203948975, |
| "eval_validation_leggepertutti_runtime": 35.7729, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 3366 |
| }, |
| { |
| "epoch": 0.28, |
| "eval_validation_altalexprivacy_loss": 1.2052847146987915, |
| "eval_validation_altalexprivacy_runtime": 58.3348, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 3366 |
| }, |
| { |
| "epoch": 0.28, |
| "eval_validation_mc4_it_loss": 1.7669274806976318, |
| "eval_validation_mc4_it_runtime": 78.1532, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 3366 |
| }, |
| { |
| "epoch": 0.28, |
| "eval_validation_dolma_loss": 1.9461361169815063, |
| "eval_validation_dolma_runtime": 53.9281, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 3366 |
| }, |
| { |
| "epoch": 0.3, |
| "grad_norm": 3.625, |
| "learning_rate": 1e-05, |
| "loss": 1.558, |
| "step": 3553 |
| }, |
| { |
| "epoch": 0.3, |
| "eval_validation_privacy_sources_loss": 0.822688102722168, |
| "eval_validation_privacy_sources_runtime": 210.9998, |
| "eval_validation_privacy_sources_samples_per_second": 1.815, |
| "eval_validation_privacy_sources_steps_per_second": 0.91, |
| "step": 3553 |
| }, |
| { |
| "epoch": 0.3, |
| "eval_validation_agenda_digitale_loss": 1.3728498220443726, |
| "eval_validation_agenda_digitale_runtime": 187.2711, |
| "eval_validation_agenda_digitale_samples_per_second": 1.816, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 3553 |
| }, |
| { |
| "epoch": 0.3, |
| "eval_validation_leggepertutti_loss": 1.2360832691192627, |
| "eval_validation_leggepertutti_runtime": 35.7958, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 3553 |
| }, |
| { |
| "epoch": 0.3, |
| "eval_validation_altalexprivacy_loss": 1.2027132511138916, |
| "eval_validation_altalexprivacy_runtime": 58.3972, |
| "eval_validation_altalexprivacy_samples_per_second": 1.815, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 3553 |
| }, |
| { |
| "epoch": 0.3, |
| "eval_validation_mc4_it_loss": 1.7643710374832153, |
| "eval_validation_mc4_it_runtime": 78.2118, |
| "eval_validation_mc4_it_samples_per_second": 1.816, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 3553 |
| }, |
| { |
| "epoch": 0.3, |
| "eval_validation_dolma_loss": 1.9442397356033325, |
| "eval_validation_dolma_runtime": 53.9609, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 3553 |
| }, |
| { |
| "epoch": 0.32, |
| "grad_norm": 4.65625, |
| "learning_rate": 1e-05, |
| "loss": 1.535, |
| "step": 3740 |
| }, |
| { |
| "epoch": 0.32, |
| "eval_validation_privacy_sources_loss": 0.8193829655647278, |
| "eval_validation_privacy_sources_runtime": 210.8214, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 3740 |
| }, |
| { |
| "epoch": 0.32, |
| "eval_validation_agenda_digitale_loss": 1.3690398931503296, |
| "eval_validation_agenda_digitale_runtime": 187.1433, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 3740 |
| }, |
| { |
| "epoch": 0.32, |
| "eval_validation_leggepertutti_loss": 1.2321481704711914, |
| "eval_validation_leggepertutti_runtime": 35.7856, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 3740 |
| }, |
| { |
| "epoch": 0.32, |
| "eval_validation_altalexprivacy_loss": 1.1964303255081177, |
| "eval_validation_altalexprivacy_runtime": 58.3552, |
| "eval_validation_altalexprivacy_samples_per_second": 1.816, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 3740 |
| }, |
| { |
| "epoch": 0.32, |
| "eval_validation_mc4_it_loss": 1.7612253427505493, |
| "eval_validation_mc4_it_runtime": 78.1715, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 3740 |
| }, |
| { |
| "epoch": 0.32, |
| "eval_validation_dolma_loss": 1.9415688514709473, |
| "eval_validation_dolma_runtime": 53.9531, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 3740 |
| }, |
| { |
| "epoch": 0.33, |
| "grad_norm": 3.203125, |
| "learning_rate": 1e-05, |
| "loss": 1.551, |
| "step": 3927 |
| }, |
| { |
| "epoch": 0.33, |
| "eval_validation_privacy_sources_loss": 0.8159863352775574, |
| "eval_validation_privacy_sources_runtime": 210.8294, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 3927 |
| }, |
| { |
| "epoch": 0.33, |
| "eval_validation_agenda_digitale_loss": 1.3660005331039429, |
| "eval_validation_agenda_digitale_runtime": 187.2084, |
| "eval_validation_agenda_digitale_samples_per_second": 1.816, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 3927 |
| }, |
| { |
| "epoch": 0.33, |
| "eval_validation_leggepertutti_loss": 1.2291594743728638, |
| "eval_validation_leggepertutti_runtime": 35.7917, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 3927 |
| }, |
| { |
| "epoch": 0.33, |
| "eval_validation_altalexprivacy_loss": 1.1953657865524292, |
| "eval_validation_altalexprivacy_runtime": 58.3486, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 3927 |
| }, |
| { |
| "epoch": 0.33, |
| "eval_validation_mc4_it_loss": 1.7568954229354858, |
| "eval_validation_mc4_it_runtime": 78.1754, |
| "eval_validation_mc4_it_samples_per_second": 1.816, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 3927 |
| }, |
| { |
| "epoch": 0.33, |
| "eval_validation_dolma_loss": 1.9388848543167114, |
| "eval_validation_dolma_runtime": 53.9683, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 3927 |
| }, |
| { |
| "epoch": 0.35, |
| "grad_norm": 3.578125, |
| "learning_rate": 1e-05, |
| "loss": 1.5452, |
| "step": 4114 |
| }, |
| { |
| "epoch": 0.35, |
| "eval_validation_privacy_sources_loss": 0.8137150406837463, |
| "eval_validation_privacy_sources_runtime": 210.7357, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 4114 |
| }, |
| { |
| "epoch": 0.35, |
| "eval_validation_agenda_digitale_loss": 1.3656136989593506, |
| "eval_validation_agenda_digitale_runtime": 187.146, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 4114 |
| }, |
| { |
| "epoch": 0.35, |
| "eval_validation_leggepertutti_loss": 1.2296239137649536, |
| "eval_validation_leggepertutti_runtime": 35.7766, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 4114 |
| }, |
| { |
| "epoch": 0.35, |
| "eval_validation_altalexprivacy_loss": 1.1915565729141235, |
| "eval_validation_altalexprivacy_runtime": 58.3322, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 4114 |
| }, |
| { |
| "epoch": 0.35, |
| "eval_validation_mc4_it_loss": 1.7542990446090698, |
| "eval_validation_mc4_it_runtime": 78.1622, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 4114 |
| }, |
| { |
| "epoch": 0.35, |
| "eval_validation_dolma_loss": 1.9385536909103394, |
| "eval_validation_dolma_runtime": 53.9474, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 4114 |
| }, |
| { |
| "epoch": 0.36, |
| "grad_norm": 3.421875, |
| "learning_rate": 1e-05, |
| "loss": 1.5371, |
| "step": 4301 |
| }, |
| { |
| "epoch": 0.36, |
| "eval_validation_privacy_sources_loss": 0.8114846348762512, |
| "eval_validation_privacy_sources_runtime": 210.7483, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 4301 |
| }, |
| { |
| "epoch": 0.36, |
| "eval_validation_agenda_digitale_loss": 1.36287522315979, |
| "eval_validation_agenda_digitale_runtime": 187.0978, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 4301 |
| }, |
| { |
| "epoch": 0.36, |
| "eval_validation_leggepertutti_loss": 1.225502371788025, |
| "eval_validation_leggepertutti_runtime": 35.7725, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 4301 |
| }, |
| { |
| "epoch": 0.36, |
| "eval_validation_altalexprivacy_loss": 1.1899324655532837, |
| "eval_validation_altalexprivacy_runtime": 58.3269, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 4301 |
| }, |
| { |
| "epoch": 0.36, |
| "eval_validation_mc4_it_loss": 1.7518540620803833, |
| "eval_validation_mc4_it_runtime": 78.1395, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 4301 |
| }, |
| { |
| "epoch": 0.36, |
| "eval_validation_dolma_loss": 1.9364405870437622, |
| "eval_validation_dolma_runtime": 53.9366, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 4301 |
| }, |
| { |
| "epoch": 0.38, |
| "grad_norm": 3.4375, |
| "learning_rate": 1e-05, |
| "loss": 1.5349, |
| "step": 4488 |
| }, |
| { |
| "epoch": 0.38, |
| "eval_validation_privacy_sources_loss": 0.8089282512664795, |
| "eval_validation_privacy_sources_runtime": 210.6735, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 4488 |
| }, |
| { |
| "epoch": 0.38, |
| "eval_validation_agenda_digitale_loss": 1.3604696989059448, |
| "eval_validation_agenda_digitale_runtime": 187.0247, |
| "eval_validation_agenda_digitale_samples_per_second": 1.818, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 4488 |
| }, |
| { |
| "epoch": 0.38, |
| "eval_validation_leggepertutti_loss": 1.2236857414245605, |
| "eval_validation_leggepertutti_runtime": 35.775, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 4488 |
| }, |
| { |
| "epoch": 0.38, |
| "eval_validation_altalexprivacy_loss": 1.1892808675765991, |
| "eval_validation_altalexprivacy_runtime": 58.2983, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 4488 |
| }, |
| { |
| "epoch": 0.38, |
| "eval_validation_mc4_it_loss": 1.7490640878677368, |
| "eval_validation_mc4_it_runtime": 78.1304, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 4488 |
| }, |
| { |
| "epoch": 0.38, |
| "eval_validation_dolma_loss": 1.9361358880996704, |
| "eval_validation_dolma_runtime": 53.9258, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 4488 |
| }, |
| { |
| "epoch": 0.39, |
| "grad_norm": 3.265625, |
| "learning_rate": 1e-05, |
| "loss": 1.538, |
| "step": 4675 |
| }, |
| { |
| "epoch": 0.39, |
| "eval_validation_privacy_sources_loss": 0.8068882822990417, |
| "eval_validation_privacy_sources_runtime": 210.6987, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 4675 |
| }, |
| { |
| "epoch": 0.39, |
| "eval_validation_agenda_digitale_loss": 1.357992172241211, |
| "eval_validation_agenda_digitale_runtime": 187.0601, |
| "eval_validation_agenda_digitale_samples_per_second": 1.818, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 4675 |
| }, |
| { |
| "epoch": 0.39, |
| "eval_validation_leggepertutti_loss": 1.2222189903259277, |
| "eval_validation_leggepertutti_runtime": 35.7685, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 4675 |
| }, |
| { |
| "epoch": 0.39, |
| "eval_validation_altalexprivacy_loss": 1.1868293285369873, |
| "eval_validation_altalexprivacy_runtime": 58.3028, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 4675 |
| }, |
| { |
| "epoch": 0.39, |
| "eval_validation_mc4_it_loss": 1.747467279434204, |
| "eval_validation_mc4_it_runtime": 78.0822, |
| "eval_validation_mc4_it_samples_per_second": 1.819, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 4675 |
| }, |
| { |
| "epoch": 0.39, |
| "eval_validation_dolma_loss": 1.9376739263534546, |
| "eval_validation_dolma_runtime": 53.9131, |
| "eval_validation_dolma_samples_per_second": 1.818, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 4675 |
| }, |
| { |
| "epoch": 0.41, |
| "grad_norm": 4.5625, |
| "learning_rate": 1e-05, |
| "loss": 1.5217, |
| "step": 4862 |
| }, |
| { |
| "epoch": 0.41, |
| "eval_validation_privacy_sources_loss": 0.8034628033638, |
| "eval_validation_privacy_sources_runtime": 210.664, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 4862 |
| }, |
| { |
| "epoch": 0.41, |
| "eval_validation_agenda_digitale_loss": 1.3556355237960815, |
| "eval_validation_agenda_digitale_runtime": 187.0481, |
| "eval_validation_agenda_digitale_samples_per_second": 1.818, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 4862 |
| }, |
| { |
| "epoch": 0.41, |
| "eval_validation_leggepertutti_loss": 1.2238881587982178, |
| "eval_validation_leggepertutti_runtime": 35.77, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 4862 |
| }, |
| { |
| "epoch": 0.41, |
| "eval_validation_altalexprivacy_loss": 1.1821054220199585, |
| "eval_validation_altalexprivacy_runtime": 58.3131, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 4862 |
| }, |
| { |
| "epoch": 0.41, |
| "eval_validation_mc4_it_loss": 1.7454167604446411, |
| "eval_validation_mc4_it_runtime": 78.136, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 4862 |
| }, |
| { |
| "epoch": 0.41, |
| "eval_validation_dolma_loss": 1.9336557388305664, |
| "eval_validation_dolma_runtime": 53.931, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 4862 |
| }, |
| { |
| "epoch": 0.43, |
| "grad_norm": 3.25, |
| "learning_rate": 1e-05, |
| "loss": 1.5231, |
| "step": 5049 |
| }, |
| { |
| "epoch": 0.43, |
| "eval_validation_privacy_sources_loss": 0.8018712997436523, |
| "eval_validation_privacy_sources_runtime": 210.6286, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.912, |
| "step": 5049 |
| }, |
| { |
| "epoch": 0.43, |
| "eval_validation_agenda_digitale_loss": 1.3536696434020996, |
| "eval_validation_agenda_digitale_runtime": 186.962, |
| "eval_validation_agenda_digitale_samples_per_second": 1.819, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 5049 |
| }, |
| { |
| "epoch": 0.43, |
| "eval_validation_leggepertutti_loss": 1.219115138053894, |
| "eval_validation_leggepertutti_runtime": 35.7552, |
| "eval_validation_leggepertutti_samples_per_second": 1.818, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 5049 |
| }, |
| { |
| "epoch": 0.43, |
| "eval_validation_altalexprivacy_loss": 1.1803195476531982, |
| "eval_validation_altalexprivacy_runtime": 58.254, |
| "eval_validation_altalexprivacy_samples_per_second": 1.82, |
| "eval_validation_altalexprivacy_steps_per_second": 0.91, |
| "step": 5049 |
| }, |
| { |
| "epoch": 0.43, |
| "eval_validation_mc4_it_loss": 1.7427842617034912, |
| "eval_validation_mc4_it_runtime": 78.0819, |
| "eval_validation_mc4_it_samples_per_second": 1.819, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 5049 |
| }, |
| { |
| "epoch": 0.43, |
| "eval_validation_dolma_loss": 1.932908058166504, |
| "eval_validation_dolma_runtime": 53.9066, |
| "eval_validation_dolma_samples_per_second": 1.818, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 5049 |
| }, |
| { |
| "epoch": 0.44, |
| "grad_norm": 3.34375, |
| "learning_rate": 1e-05, |
| "loss": 1.535, |
| "step": 5236 |
| }, |
| { |
| "epoch": 0.44, |
| "eval_validation_privacy_sources_loss": 0.7990080714225769, |
| "eval_validation_privacy_sources_runtime": 210.6936, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 5236 |
| }, |
| { |
| "epoch": 0.44, |
| "eval_validation_agenda_digitale_loss": 1.3512707948684692, |
| "eval_validation_agenda_digitale_runtime": 187.0661, |
| "eval_validation_agenda_digitale_samples_per_second": 1.818, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 5236 |
| }, |
| { |
| "epoch": 0.44, |
| "eval_validation_leggepertutti_loss": 1.2183226346969604, |
| "eval_validation_leggepertutti_runtime": 35.7756, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 5236 |
| }, |
| { |
| "epoch": 0.44, |
| "eval_validation_altalexprivacy_loss": 1.1762974262237549, |
| "eval_validation_altalexprivacy_runtime": 58.3182, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 5236 |
| }, |
| { |
| "epoch": 0.44, |
| "eval_validation_mc4_it_loss": 1.7408561706542969, |
| "eval_validation_mc4_it_runtime": 78.1139, |
| "eval_validation_mc4_it_samples_per_second": 1.818, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 5236 |
| }, |
| { |
| "epoch": 0.44, |
| "eval_validation_dolma_loss": 1.9324188232421875, |
| "eval_validation_dolma_runtime": 53.9296, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 5236 |
| }, |
| { |
| "epoch": 0.46, |
| "grad_norm": 3.40625, |
| "learning_rate": 1e-05, |
| "loss": 1.5195, |
| "step": 5423 |
| }, |
| { |
| "epoch": 0.46, |
| "eval_validation_privacy_sources_loss": 0.7970147728919983, |
| "eval_validation_privacy_sources_runtime": 210.7209, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 5423 |
| }, |
| { |
| "epoch": 0.46, |
| "eval_validation_agenda_digitale_loss": 1.350595235824585, |
| "eval_validation_agenda_digitale_runtime": 187.0929, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 5423 |
| }, |
| { |
| "epoch": 0.46, |
| "eval_validation_leggepertutti_loss": 1.2196227312088013, |
| "eval_validation_leggepertutti_runtime": 35.7764, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 5423 |
| }, |
| { |
| "epoch": 0.46, |
| "eval_validation_altalexprivacy_loss": 1.176468014717102, |
| "eval_validation_altalexprivacy_runtime": 58.3399, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 5423 |
| }, |
| { |
| "epoch": 0.46, |
| "eval_validation_mc4_it_loss": 1.7395856380462646, |
| "eval_validation_mc4_it_runtime": 78.1494, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 5423 |
| }, |
| { |
| "epoch": 0.46, |
| "eval_validation_dolma_loss": 1.9318716526031494, |
| "eval_validation_dolma_runtime": 53.9467, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 5423 |
| }, |
| { |
| "epoch": 0.47, |
| "grad_norm": 3.484375, |
| "learning_rate": 1e-05, |
| "loss": 1.5356, |
| "step": 5610 |
| }, |
| { |
| "epoch": 0.47, |
| "eval_validation_privacy_sources_loss": 0.7967193126678467, |
| "eval_validation_privacy_sources_runtime": 210.7692, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 5610 |
| }, |
| { |
| "epoch": 0.47, |
| "eval_validation_agenda_digitale_loss": 1.3498324155807495, |
| "eval_validation_agenda_digitale_runtime": 187.1217, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 5610 |
| }, |
| { |
| "epoch": 0.47, |
| "eval_validation_leggepertutti_loss": 1.2213656902313232, |
| "eval_validation_leggepertutti_runtime": 35.7931, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 5610 |
| }, |
| { |
| "epoch": 0.47, |
| "eval_validation_altalexprivacy_loss": 1.1725049018859863, |
| "eval_validation_altalexprivacy_runtime": 58.34, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 5610 |
| }, |
| { |
| "epoch": 0.47, |
| "eval_validation_mc4_it_loss": 1.7369210720062256, |
| "eval_validation_mc4_it_runtime": 78.1677, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 5610 |
| }, |
| { |
| "epoch": 0.47, |
| "eval_validation_dolma_loss": 1.931601643562317, |
| "eval_validation_dolma_runtime": 53.9523, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 5610 |
| }, |
| { |
| "epoch": 0.49, |
| "grad_norm": 3.25, |
| "learning_rate": 1e-05, |
| "loss": 1.5248, |
| "step": 5797 |
| }, |
| { |
| "epoch": 0.49, |
| "eval_validation_privacy_sources_loss": 0.7927350997924805, |
| "eval_validation_privacy_sources_runtime": 210.7499, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 5797 |
| }, |
| { |
| "epoch": 0.49, |
| "eval_validation_agenda_digitale_loss": 1.3474359512329102, |
| "eval_validation_agenda_digitale_runtime": 187.1385, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 5797 |
| }, |
| { |
| "epoch": 0.49, |
| "eval_validation_leggepertutti_loss": 1.2162562608718872, |
| "eval_validation_leggepertutti_runtime": 35.7966, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 5797 |
| }, |
| { |
| "epoch": 0.49, |
| "eval_validation_altalexprivacy_loss": 1.1715296506881714, |
| "eval_validation_altalexprivacy_runtime": 58.3612, |
| "eval_validation_altalexprivacy_samples_per_second": 1.816, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 5797 |
| }, |
| { |
| "epoch": 0.49, |
| "eval_validation_mc4_it_loss": 1.7344577312469482, |
| "eval_validation_mc4_it_runtime": 78.1843, |
| "eval_validation_mc4_it_samples_per_second": 1.816, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 5797 |
| }, |
| { |
| "epoch": 0.49, |
| "eval_validation_dolma_loss": 1.9310978651046753, |
| "eval_validation_dolma_runtime": 53.9513, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 5797 |
| }, |
| { |
| "epoch": 0.5, |
| "grad_norm": 3.390625, |
| "learning_rate": 1e-05, |
| "loss": 1.5147, |
| "step": 5984 |
| }, |
| { |
| "epoch": 0.5, |
| "eval_validation_privacy_sources_loss": 0.7904417514801025, |
| "eval_validation_privacy_sources_runtime": 210.6793, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 5984 |
| }, |
| { |
| "epoch": 0.5, |
| "eval_validation_agenda_digitale_loss": 1.3463512659072876, |
| "eval_validation_agenda_digitale_runtime": 187.0767, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 5984 |
| }, |
| { |
| "epoch": 0.5, |
| "eval_validation_leggepertutti_loss": 1.2104567289352417, |
| "eval_validation_leggepertutti_runtime": 35.7676, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 5984 |
| }, |
| { |
| "epoch": 0.5, |
| "eval_validation_altalexprivacy_loss": 1.1698046922683716, |
| "eval_validation_altalexprivacy_runtime": 58.3216, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 5984 |
| }, |
| { |
| "epoch": 0.5, |
| "eval_validation_mc4_it_loss": 1.733211874961853, |
| "eval_validation_mc4_it_runtime": 78.1157, |
| "eval_validation_mc4_it_samples_per_second": 1.818, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 5984 |
| }, |
| { |
| "epoch": 0.5, |
| "eval_validation_dolma_loss": 1.9291273355484009, |
| "eval_validation_dolma_runtime": 53.9368, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 5984 |
| }, |
| { |
| "epoch": 0.52, |
| "grad_norm": 3.15625, |
| "learning_rate": 1e-05, |
| "loss": 1.5307, |
| "step": 6171 |
| }, |
| { |
| "epoch": 0.52, |
| "eval_validation_privacy_sources_loss": 0.7893861532211304, |
| "eval_validation_privacy_sources_runtime": 210.7488, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 6171 |
| }, |
| { |
| "epoch": 0.52, |
| "eval_validation_agenda_digitale_loss": 1.3451480865478516, |
| "eval_validation_agenda_digitale_runtime": 187.0845, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 6171 |
| }, |
| { |
| "epoch": 0.52, |
| "eval_validation_leggepertutti_loss": 1.2113819122314453, |
| "eval_validation_leggepertutti_runtime": 35.7727, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 6171 |
| }, |
| { |
| "epoch": 0.52, |
| "eval_validation_altalexprivacy_loss": 1.1663610935211182, |
| "eval_validation_altalexprivacy_runtime": 58.3307, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 6171 |
| }, |
| { |
| "epoch": 0.52, |
| "eval_validation_mc4_it_loss": 1.7309118509292603, |
| "eval_validation_mc4_it_runtime": 78.1316, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 6171 |
| }, |
| { |
| "epoch": 0.52, |
| "eval_validation_dolma_loss": 1.9281673431396484, |
| "eval_validation_dolma_runtime": 53.9207, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 6171 |
| }, |
| { |
| "epoch": 0.54, |
| "grad_norm": 3.078125, |
| "learning_rate": 1e-05, |
| "loss": 1.5203, |
| "step": 6358 |
| }, |
| { |
| "epoch": 0.54, |
| "eval_validation_privacy_sources_loss": 0.7874845266342163, |
| "eval_validation_privacy_sources_runtime": 210.6148, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.912, |
| "step": 6358 |
| }, |
| { |
| "epoch": 0.54, |
| "eval_validation_agenda_digitale_loss": 1.3434906005859375, |
| "eval_validation_agenda_digitale_runtime": 186.9358, |
| "eval_validation_agenda_digitale_samples_per_second": 1.819, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 6358 |
| }, |
| { |
| "epoch": 0.54, |
| "eval_validation_leggepertutti_loss": 1.2103608846664429, |
| "eval_validation_leggepertutti_runtime": 35.7522, |
| "eval_validation_leggepertutti_samples_per_second": 1.818, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 6358 |
| }, |
| { |
| "epoch": 0.54, |
| "eval_validation_altalexprivacy_loss": 1.164802074432373, |
| "eval_validation_altalexprivacy_runtime": 58.2954, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 6358 |
| }, |
| { |
| "epoch": 0.54, |
| "eval_validation_mc4_it_loss": 1.7286055088043213, |
| "eval_validation_mc4_it_runtime": 78.0929, |
| "eval_validation_mc4_it_samples_per_second": 1.818, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 6358 |
| }, |
| { |
| "epoch": 0.54, |
| "eval_validation_dolma_loss": 1.927778720855713, |
| "eval_validation_dolma_runtime": 53.9081, |
| "eval_validation_dolma_samples_per_second": 1.818, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 6358 |
| }, |
| { |
| "epoch": 0.55, |
| "grad_norm": 3.59375, |
| "learning_rate": 1e-05, |
| "loss": 1.5257, |
| "step": 6545 |
| }, |
| { |
| "epoch": 0.55, |
| "eval_validation_privacy_sources_loss": 0.785801887512207, |
| "eval_validation_privacy_sources_runtime": 210.655, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 6545 |
| }, |
| { |
| "epoch": 0.55, |
| "eval_validation_agenda_digitale_loss": 1.341984510421753, |
| "eval_validation_agenda_digitale_runtime": 186.9769, |
| "eval_validation_agenda_digitale_samples_per_second": 1.818, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 6545 |
| }, |
| { |
| "epoch": 0.55, |
| "eval_validation_leggepertutti_loss": 1.208351492881775, |
| "eval_validation_leggepertutti_runtime": 35.7494, |
| "eval_validation_leggepertutti_samples_per_second": 1.818, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 6545 |
| }, |
| { |
| "epoch": 0.55, |
| "eval_validation_altalexprivacy_loss": 1.1633599996566772, |
| "eval_validation_altalexprivacy_runtime": 58.2944, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 6545 |
| }, |
| { |
| "epoch": 0.55, |
| "eval_validation_mc4_it_loss": 1.726757526397705, |
| "eval_validation_mc4_it_runtime": 78.0983, |
| "eval_validation_mc4_it_samples_per_second": 1.818, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 6545 |
| }, |
| { |
| "epoch": 0.55, |
| "eval_validation_dolma_loss": 1.9275562763214111, |
| "eval_validation_dolma_runtime": 53.8914, |
| "eval_validation_dolma_samples_per_second": 1.818, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 6545 |
| }, |
| { |
| "epoch": 0.57, |
| "grad_norm": 3.234375, |
| "learning_rate": 1e-05, |
| "loss": 1.5019, |
| "step": 6732 |
| }, |
| { |
| "epoch": 0.57, |
| "eval_validation_privacy_sources_loss": 0.7848771214485168, |
| "eval_validation_privacy_sources_runtime": 210.6636, |
| "eval_validation_privacy_sources_samples_per_second": 1.818, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 6732 |
| }, |
| { |
| "epoch": 0.57, |
| "eval_validation_agenda_digitale_loss": 1.3411486148834229, |
| "eval_validation_agenda_digitale_runtime": 186.9976, |
| "eval_validation_agenda_digitale_samples_per_second": 1.818, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 6732 |
| }, |
| { |
| "epoch": 0.57, |
| "eval_validation_leggepertutti_loss": 1.2077082395553589, |
| "eval_validation_leggepertutti_runtime": 35.7665, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 6732 |
| }, |
| { |
| "epoch": 0.57, |
| "eval_validation_altalexprivacy_loss": 1.1618914604187012, |
| "eval_validation_altalexprivacy_runtime": 58.33, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 6732 |
| }, |
| { |
| "epoch": 0.57, |
| "eval_validation_mc4_it_loss": 1.725679874420166, |
| "eval_validation_mc4_it_runtime": 78.1276, |
| "eval_validation_mc4_it_samples_per_second": 1.818, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 6732 |
| }, |
| { |
| "epoch": 0.57, |
| "eval_validation_dolma_loss": 1.9271798133850098, |
| "eval_validation_dolma_runtime": 53.9117, |
| "eval_validation_dolma_samples_per_second": 1.818, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 6732 |
| }, |
| { |
| "epoch": 0.58, |
| "grad_norm": 3.15625, |
| "learning_rate": 1e-05, |
| "loss": 1.5152, |
| "step": 6919 |
| }, |
| { |
| "epoch": 0.58, |
| "eval_validation_privacy_sources_loss": 0.782995879650116, |
| "eval_validation_privacy_sources_runtime": 210.7422, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 6919 |
| }, |
| { |
| "epoch": 0.58, |
| "eval_validation_agenda_digitale_loss": 1.3396461009979248, |
| "eval_validation_agenda_digitale_runtime": 187.0789, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 6919 |
| }, |
| { |
| "epoch": 0.58, |
| "eval_validation_leggepertutti_loss": 1.2054615020751953, |
| "eval_validation_leggepertutti_runtime": 35.7709, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.923, |
| "step": 6919 |
| }, |
| { |
| "epoch": 0.58, |
| "eval_validation_altalexprivacy_loss": 1.1602697372436523, |
| "eval_validation_altalexprivacy_runtime": 58.3175, |
| "eval_validation_altalexprivacy_samples_per_second": 1.818, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 6919 |
| }, |
| { |
| "epoch": 0.58, |
| "eval_validation_mc4_it_loss": 1.724775791168213, |
| "eval_validation_mc4_it_runtime": 78.0214, |
| "eval_validation_mc4_it_samples_per_second": 1.82, |
| "eval_validation_mc4_it_steps_per_second": 0.91, |
| "step": 6919 |
| }, |
| { |
| "epoch": 0.58, |
| "eval_validation_dolma_loss": 1.9262704849243164, |
| "eval_validation_dolma_runtime": 53.8374, |
| "eval_validation_dolma_samples_per_second": 1.82, |
| "eval_validation_dolma_steps_per_second": 0.91, |
| "step": 6919 |
| }, |
| { |
| "epoch": 0.6, |
| "grad_norm": 3.28125, |
| "learning_rate": 1e-05, |
| "loss": 1.5167, |
| "step": 7106 |
| }, |
| { |
| "epoch": 0.6, |
| "eval_validation_privacy_sources_loss": 0.7818235158920288, |
| "eval_validation_privacy_sources_runtime": 210.7745, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 7106 |
| }, |
| { |
| "epoch": 0.6, |
| "eval_validation_agenda_digitale_loss": 1.3387728929519653, |
| "eval_validation_agenda_digitale_runtime": 187.1722, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 7106 |
| }, |
| { |
| "epoch": 0.6, |
| "eval_validation_leggepertutti_loss": 1.2060880661010742, |
| "eval_validation_leggepertutti_runtime": 35.7758, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 7106 |
| }, |
| { |
| "epoch": 0.6, |
| "eval_validation_altalexprivacy_loss": 1.158158302307129, |
| "eval_validation_altalexprivacy_runtime": 58.3272, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 7106 |
| }, |
| { |
| "epoch": 0.6, |
| "eval_validation_mc4_it_loss": 1.7227188348770142, |
| "eval_validation_mc4_it_runtime": 78.0893, |
| "eval_validation_mc4_it_samples_per_second": 1.818, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 7106 |
| }, |
| { |
| "epoch": 0.6, |
| "eval_validation_dolma_loss": 1.925492763519287, |
| "eval_validation_dolma_runtime": 53.8538, |
| "eval_validation_dolma_samples_per_second": 1.82, |
| "eval_validation_dolma_steps_per_second": 0.91, |
| "step": 7106 |
| }, |
| { |
| "epoch": 0.61, |
| "grad_norm": 3.390625, |
| "learning_rate": 1e-05, |
| "loss": 1.4819, |
| "step": 7293 |
| }, |
| { |
| "epoch": 0.61, |
| "eval_validation_privacy_sources_loss": 0.7804288268089294, |
| "eval_validation_privacy_sources_runtime": 210.7884, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 7293 |
| }, |
| { |
| "epoch": 0.61, |
| "eval_validation_agenda_digitale_loss": 1.337357521057129, |
| "eval_validation_agenda_digitale_runtime": 187.1395, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 7293 |
| }, |
| { |
| "epoch": 0.61, |
| "eval_validation_leggepertutti_loss": 1.205103874206543, |
| "eval_validation_leggepertutti_runtime": 35.7974, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 7293 |
| }, |
| { |
| "epoch": 0.61, |
| "eval_validation_altalexprivacy_loss": 1.155694603919983, |
| "eval_validation_altalexprivacy_runtime": 58.3571, |
| "eval_validation_altalexprivacy_samples_per_second": 1.816, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 7293 |
| }, |
| { |
| "epoch": 0.61, |
| "eval_validation_mc4_it_loss": 1.7214677333831787, |
| "eval_validation_mc4_it_runtime": 78.1458, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 7293 |
| }, |
| { |
| "epoch": 0.61, |
| "eval_validation_dolma_loss": 1.926133155822754, |
| "eval_validation_dolma_runtime": 53.9449, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 7293 |
| }, |
| { |
| "epoch": 0.63, |
| "grad_norm": 3.34375, |
| "learning_rate": 1e-05, |
| "loss": 1.5164, |
| "step": 7480 |
| }, |
| { |
| "epoch": 0.63, |
| "eval_validation_privacy_sources_loss": 0.7794305682182312, |
| "eval_validation_privacy_sources_runtime": 210.7859, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 7480 |
| }, |
| { |
| "epoch": 0.63, |
| "eval_validation_agenda_digitale_loss": 1.3364444971084595, |
| "eval_validation_agenda_digitale_runtime": 187.1772, |
| "eval_validation_agenda_digitale_samples_per_second": 1.816, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 7480 |
| }, |
| { |
| "epoch": 0.63, |
| "eval_validation_leggepertutti_loss": 1.2025309801101685, |
| "eval_validation_leggepertutti_runtime": 35.7941, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 7480 |
| }, |
| { |
| "epoch": 0.63, |
| "eval_validation_altalexprivacy_loss": 1.1547417640686035, |
| "eval_validation_altalexprivacy_runtime": 58.3512, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 7480 |
| }, |
| { |
| "epoch": 0.63, |
| "eval_validation_mc4_it_loss": 1.7210993766784668, |
| "eval_validation_mc4_it_runtime": 78.1723, |
| "eval_validation_mc4_it_samples_per_second": 1.816, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 7480 |
| }, |
| { |
| "epoch": 0.63, |
| "eval_validation_dolma_loss": 1.925874948501587, |
| "eval_validation_dolma_runtime": 53.9674, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 7480 |
| }, |
| { |
| "epoch": 0.65, |
| "grad_norm": 3.140625, |
| "learning_rate": 1e-05, |
| "loss": 1.5167, |
| "step": 7667 |
| }, |
| { |
| "epoch": 0.65, |
| "eval_validation_privacy_sources_loss": 0.7769683599472046, |
| "eval_validation_privacy_sources_runtime": 210.8943, |
| "eval_validation_privacy_sources_samples_per_second": 1.816, |
| "eval_validation_privacy_sources_steps_per_second": 0.91, |
| "step": 7667 |
| }, |
| { |
| "epoch": 0.65, |
| "eval_validation_agenda_digitale_loss": 1.3346428871154785, |
| "eval_validation_agenda_digitale_runtime": 187.2224, |
| "eval_validation_agenda_digitale_samples_per_second": 1.816, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 7667 |
| }, |
| { |
| "epoch": 0.65, |
| "eval_validation_leggepertutti_loss": 1.2033891677856445, |
| "eval_validation_leggepertutti_runtime": 35.8133, |
| "eval_validation_leggepertutti_samples_per_second": 1.815, |
| "eval_validation_leggepertutti_steps_per_second": 0.921, |
| "step": 7667 |
| }, |
| { |
| "epoch": 0.65, |
| "eval_validation_altalexprivacy_loss": 1.1526622772216797, |
| "eval_validation_altalexprivacy_runtime": 58.3616, |
| "eval_validation_altalexprivacy_samples_per_second": 1.816, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 7667 |
| }, |
| { |
| "epoch": 0.65, |
| "eval_validation_mc4_it_loss": 1.7187703847885132, |
| "eval_validation_mc4_it_runtime": 78.1967, |
| "eval_validation_mc4_it_samples_per_second": 1.816, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 7667 |
| }, |
| { |
| "epoch": 0.65, |
| "eval_validation_dolma_loss": 1.9250844717025757, |
| "eval_validation_dolma_runtime": 53.9678, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 7667 |
| }, |
| { |
| "epoch": 0.66, |
| "grad_norm": 3.3125, |
| "learning_rate": 1e-05, |
| "loss": 1.5074, |
| "step": 7854 |
| }, |
| { |
| "epoch": 0.66, |
| "eval_validation_privacy_sources_loss": 0.7756584286689758, |
| "eval_validation_privacy_sources_runtime": 210.8848, |
| "eval_validation_privacy_sources_samples_per_second": 1.816, |
| "eval_validation_privacy_sources_steps_per_second": 0.91, |
| "step": 7854 |
| }, |
| { |
| "epoch": 0.66, |
| "eval_validation_agenda_digitale_loss": 1.333917260169983, |
| "eval_validation_agenda_digitale_runtime": 187.2267, |
| "eval_validation_agenda_digitale_samples_per_second": 1.816, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 7854 |
| }, |
| { |
| "epoch": 0.66, |
| "eval_validation_leggepertutti_loss": 1.2030140161514282, |
| "eval_validation_leggepertutti_runtime": 35.8032, |
| "eval_validation_leggepertutti_samples_per_second": 1.815, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 7854 |
| }, |
| { |
| "epoch": 0.66, |
| "eval_validation_altalexprivacy_loss": 1.153552770614624, |
| "eval_validation_altalexprivacy_runtime": 58.3793, |
| "eval_validation_altalexprivacy_samples_per_second": 1.816, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 7854 |
| }, |
| { |
| "epoch": 0.66, |
| "eval_validation_mc4_it_loss": 1.717726230621338, |
| "eval_validation_mc4_it_runtime": 78.2107, |
| "eval_validation_mc4_it_samples_per_second": 1.816, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 7854 |
| }, |
| { |
| "epoch": 0.66, |
| "eval_validation_dolma_loss": 1.9249721765518188, |
| "eval_validation_dolma_runtime": 53.9763, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 7854 |
| }, |
| { |
| "epoch": 0.68, |
| "grad_norm": 3.171875, |
| "learning_rate": 1e-05, |
| "loss": 1.5122, |
| "step": 8041 |
| }, |
| { |
| "epoch": 0.68, |
| "eval_validation_privacy_sources_loss": 0.7745267152786255, |
| "eval_validation_privacy_sources_runtime": 210.8448, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 8041 |
| }, |
| { |
| "epoch": 0.68, |
| "eval_validation_agenda_digitale_loss": 1.3330841064453125, |
| "eval_validation_agenda_digitale_runtime": 187.1352, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 8041 |
| }, |
| { |
| "epoch": 0.68, |
| "eval_validation_leggepertutti_loss": 1.2008785009384155, |
| "eval_validation_leggepertutti_runtime": 35.7832, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 8041 |
| }, |
| { |
| "epoch": 0.68, |
| "eval_validation_altalexprivacy_loss": 1.151678442955017, |
| "eval_validation_altalexprivacy_runtime": 58.3429, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 8041 |
| }, |
| { |
| "epoch": 0.68, |
| "eval_validation_mc4_it_loss": 1.7152659893035889, |
| "eval_validation_mc4_it_runtime": 78.2034, |
| "eval_validation_mc4_it_samples_per_second": 1.816, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 8041 |
| }, |
| { |
| "epoch": 0.68, |
| "eval_validation_dolma_loss": 1.9242494106292725, |
| "eval_validation_dolma_runtime": 53.9675, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 8041 |
| }, |
| { |
| "epoch": 0.69, |
| "grad_norm": 3.25, |
| "learning_rate": 1e-05, |
| "loss": 1.5049, |
| "step": 8228 |
| }, |
| { |
| "epoch": 0.69, |
| "eval_validation_privacy_sources_loss": 0.7725993394851685, |
| "eval_validation_privacy_sources_runtime": 210.8542, |
| "eval_validation_privacy_sources_samples_per_second": 1.816, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 8228 |
| }, |
| { |
| "epoch": 0.69, |
| "eval_validation_agenda_digitale_loss": 1.3322275876998901, |
| "eval_validation_agenda_digitale_runtime": 187.1476, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 8228 |
| }, |
| { |
| "epoch": 0.69, |
| "eval_validation_leggepertutti_loss": 1.2016466856002808, |
| "eval_validation_leggepertutti_runtime": 35.7933, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 8228 |
| }, |
| { |
| "epoch": 0.69, |
| "eval_validation_altalexprivacy_loss": 1.1518696546554565, |
| "eval_validation_altalexprivacy_runtime": 58.3473, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 8228 |
| }, |
| { |
| "epoch": 0.69, |
| "eval_validation_mc4_it_loss": 1.7144805192947388, |
| "eval_validation_mc4_it_runtime": 78.23, |
| "eval_validation_mc4_it_samples_per_second": 1.815, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 8228 |
| }, |
| { |
| "epoch": 0.69, |
| "eval_validation_dolma_loss": 1.9236359596252441, |
| "eval_validation_dolma_runtime": 53.9611, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 8228 |
| }, |
| { |
| "epoch": 0.71, |
| "grad_norm": 3.5625, |
| "learning_rate": 1e-05, |
| "loss": 1.5078, |
| "step": 8415 |
| }, |
| { |
| "epoch": 0.71, |
| "eval_validation_privacy_sources_loss": 0.7713748216629028, |
| "eval_validation_privacy_sources_runtime": 210.7439, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 8415 |
| }, |
| { |
| "epoch": 0.71, |
| "eval_validation_agenda_digitale_loss": 1.3305851221084595, |
| "eval_validation_agenda_digitale_runtime": 187.0756, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 8415 |
| }, |
| { |
| "epoch": 0.71, |
| "eval_validation_leggepertutti_loss": 1.201823115348816, |
| "eval_validation_leggepertutti_runtime": 35.7743, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 8415 |
| }, |
| { |
| "epoch": 0.71, |
| "eval_validation_altalexprivacy_loss": 1.1515058279037476, |
| "eval_validation_altalexprivacy_runtime": 58.3222, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 8415 |
| }, |
| { |
| "epoch": 0.71, |
| "eval_validation_mc4_it_loss": 1.7134541273117065, |
| "eval_validation_mc4_it_runtime": 78.1435, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 8415 |
| }, |
| { |
| "epoch": 0.71, |
| "eval_validation_dolma_loss": 1.9214420318603516, |
| "eval_validation_dolma_runtime": 53.9466, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 8415 |
| }, |
| { |
| "epoch": 0.73, |
| "grad_norm": 3.703125, |
| "learning_rate": 1e-05, |
| "loss": 1.5202, |
| "step": 8602 |
| }, |
| { |
| "epoch": 0.73, |
| "eval_validation_privacy_sources_loss": 0.7698016166687012, |
| "eval_validation_privacy_sources_runtime": 210.796, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 8602 |
| }, |
| { |
| "epoch": 0.73, |
| "eval_validation_agenda_digitale_loss": 1.32979416847229, |
| "eval_validation_agenda_digitale_runtime": 187.115, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 8602 |
| }, |
| { |
| "epoch": 0.73, |
| "eval_validation_leggepertutti_loss": 1.199041724205017, |
| "eval_validation_leggepertutti_runtime": 35.7819, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 8602 |
| }, |
| { |
| "epoch": 0.73, |
| "eval_validation_altalexprivacy_loss": 1.1484341621398926, |
| "eval_validation_altalexprivacy_runtime": 58.3475, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 8602 |
| }, |
| { |
| "epoch": 0.73, |
| "eval_validation_mc4_it_loss": 1.712436556816101, |
| "eval_validation_mc4_it_runtime": 78.1412, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 8602 |
| }, |
| { |
| "epoch": 0.73, |
| "eval_validation_dolma_loss": 1.920310139656067, |
| "eval_validation_dolma_runtime": 53.9275, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 8602 |
| }, |
| { |
| "epoch": 0.74, |
| "grad_norm": 3.34375, |
| "learning_rate": 1e-05, |
| "loss": 1.5081, |
| "step": 8789 |
| }, |
| { |
| "epoch": 0.74, |
| "eval_validation_privacy_sources_loss": 0.7663451433181763, |
| "eval_validation_privacy_sources_runtime": 210.7295, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 8789 |
| }, |
| { |
| "epoch": 0.74, |
| "eval_validation_agenda_digitale_loss": 1.3283993005752563, |
| "eval_validation_agenda_digitale_runtime": 187.0536, |
| "eval_validation_agenda_digitale_samples_per_second": 1.818, |
| "eval_validation_agenda_digitale_steps_per_second": 0.909, |
| "step": 8789 |
| }, |
| { |
| "epoch": 0.74, |
| "eval_validation_leggepertutti_loss": 1.1974841356277466, |
| "eval_validation_leggepertutti_runtime": 35.7753, |
| "eval_validation_leggepertutti_samples_per_second": 1.817, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 8789 |
| }, |
| { |
| "epoch": 0.74, |
| "eval_validation_altalexprivacy_loss": 1.1478264331817627, |
| "eval_validation_altalexprivacy_runtime": 58.3304, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.909, |
| "step": 8789 |
| }, |
| { |
| "epoch": 0.74, |
| "eval_validation_mc4_it_loss": 1.7111691236495972, |
| "eval_validation_mc4_it_runtime": 78.1361, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.909, |
| "step": 8789 |
| }, |
| { |
| "epoch": 0.74, |
| "eval_validation_dolma_loss": 1.9195369482040405, |
| "eval_validation_dolma_runtime": 53.9301, |
| "eval_validation_dolma_samples_per_second": 1.817, |
| "eval_validation_dolma_steps_per_second": 0.909, |
| "step": 8789 |
| }, |
| { |
| "epoch": 0.76, |
| "grad_norm": 3.1875, |
| "learning_rate": 1e-05, |
| "loss": 1.4961, |
| "step": 8976 |
| }, |
| { |
| "epoch": 0.76, |
| "eval_validation_privacy_sources_loss": 0.7659348845481873, |
| "eval_validation_privacy_sources_runtime": 210.8114, |
| "eval_validation_privacy_sources_samples_per_second": 1.817, |
| "eval_validation_privacy_sources_steps_per_second": 0.911, |
| "step": 8976 |
| }, |
| { |
| "epoch": 0.76, |
| "eval_validation_agenda_digitale_loss": 1.327588438987732, |
| "eval_validation_agenda_digitale_runtime": 187.1637, |
| "eval_validation_agenda_digitale_samples_per_second": 1.817, |
| "eval_validation_agenda_digitale_steps_per_second": 0.908, |
| "step": 8976 |
| }, |
| { |
| "epoch": 0.76, |
| "eval_validation_leggepertutti_loss": 1.19636070728302, |
| "eval_validation_leggepertutti_runtime": 35.7916, |
| "eval_validation_leggepertutti_samples_per_second": 1.816, |
| "eval_validation_leggepertutti_steps_per_second": 0.922, |
| "step": 8976 |
| }, |
| { |
| "epoch": 0.76, |
| "eval_validation_altalexprivacy_loss": 1.1442352533340454, |
| "eval_validation_altalexprivacy_runtime": 58.3506, |
| "eval_validation_altalexprivacy_samples_per_second": 1.817, |
| "eval_validation_altalexprivacy_steps_per_second": 0.908, |
| "step": 8976 |
| }, |
| { |
| "epoch": 0.76, |
| "eval_validation_mc4_it_loss": 1.7103118896484375, |
| "eval_validation_mc4_it_runtime": 78.1585, |
| "eval_validation_mc4_it_samples_per_second": 1.817, |
| "eval_validation_mc4_it_steps_per_second": 0.908, |
| "step": 8976 |
| }, |
| { |
| "epoch": 0.76, |
| "eval_validation_dolma_loss": 1.919664978981018, |
| "eval_validation_dolma_runtime": 53.9545, |
| "eval_validation_dolma_samples_per_second": 1.816, |
| "eval_validation_dolma_steps_per_second": 0.908, |
| "step": 8976 |
| } |
| ], |
| "logging_steps": 187, |
| "max_steps": 23720, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 2, |
| "save_steps": 187, |
| "total_flos": 3.764568491263682e+19, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|