diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round10.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..eaa53bf46f36c8c2d497f87c6c2f03b401ac3c8a --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28ef8239d82162ec0cd709c417e174890fa11c1a4d3bb24871eb9c35db756c95 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round12.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..a7c1f10450f49141b913c65f045b44dc56f18cb3 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a91dbfbd03b0eda5eea78822e04cc2b1e3b5890093975eea94cc34f926140df +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round15.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..55d5af0df8e9e094450eeb7f19736a0d5de2c8d6 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f2a82b2beb0af43f3895ebcf348c413e0ecd5ed806c5831de2d4b891e4f46e1 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round17.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..b8d9f0eb5eca2fb48b6fa483d00c08ebb57a3675 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19a985f1833e783d4938f0a9ce7528e24a1d41ae07972a5bf344eb39d15eb2a0 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round2.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a5c448b264c2fdd7631c33bc82d30b3bdc0b672 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f7af35ffe4dc0fba5de51bfd5ad8b4fb9fe896b1b6c84c1e61b575b0c704b1a +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round20.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..4d216743f74fa4c4d7cebee847ec692e18279ea9 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73b3d0a1d38c13e810a623753d551af1a679f168805592f2407c3b4171bee819 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round5.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..7d6998bacc99abefbcef0b714ac4db17bf286ad5 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73bff6b90d411e41eb15f92cbe7e80d64cc0c652de9e204bbdcab4facc759ccb +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round7.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..179e2651f72470a23f59e644bdd4708ede6e1d01 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a78ae0540308ef5b38f30f678f176dc07b31ac92282a3f1061b27960904527b6 +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_trainer_state.json b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..cf546a65862ec77c78ea64bd55e9717051cf6c80 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 1.1101641654968262, + "learning_rate": 2e-05, + "loss": 0.8945, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 1.6314992904663086, + "learning_rate": 2e-05, + "loss": 1.4103, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 2.4410200119018555, + "learning_rate": 2e-05, + "loss": 1.3191, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 3.6628243923187256, + "learning_rate": 2e-05, + "loss": 1.968, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 6.844225883483887, + "learning_rate": 2e-05, + "loss": 1.5729, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 0.7698001265525818, + "learning_rate": 2e-05, + "loss": 0.5719, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 0.5793606042861938, + "learning_rate": 2e-05, + "loss": 1.5151, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 1.8425798416137695, + "learning_rate": 2e-05, + "loss": 1.0999, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 1.134320855140686, + "learning_rate": 2e-05, + "loss": 0.9422, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.168424367904663, + "learning_rate": 2e-05, + "loss": 0.7192, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 3.056905746459961, + "learning_rate": 2e-05, + "loss": 0.6074, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 0.6598642468452454, + "learning_rate": 2e-05, + "loss": 0.346, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 1.0676809549331665, + "learning_rate": 2e-05, + "loss": 1.1766, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 1.2854700088500977, + "learning_rate": 2e-05, + "loss": 1.3399, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 2.3572678565979004, + "learning_rate": 2e-05, + "loss": 1.1957, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 1.2973973751068115, + "learning_rate": 2e-05, + "loss": 1.8289, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 0.6981891989707947, + "learning_rate": 2e-05, + "loss": 0.7445, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 0.41950735449790955, + "learning_rate": 2e-05, + "loss": 0.8945, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 2.4804954528808594, + "learning_rate": 2e-05, + "loss": 0.8976, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 0.989696741104126, + "learning_rate": 2e-05, + "loss": 0.8965, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 0.7618101239204407, + "learning_rate": 2e-05, + "loss": 1.5496, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 3.34183406829834, + "learning_rate": 2e-05, + "loss": 0.5556, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 1.5414451360702515, + "learning_rate": 2e-05, + "loss": 0.9727, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 3.042322874069214, + "learning_rate": 2e-05, + "loss": 0.8753, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 2.1184558868408203, + "learning_rate": 2e-05, + "loss": 1.381, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 0.3003075420856476, + "learning_rate": 2e-05, + "loss": 0.2195, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 0.7136024236679077, + "learning_rate": 2e-05, + "loss": 1.4137, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 2.5711076259613037, + "learning_rate": 2e-05, + "loss": 1.3358, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 3.2242660522460938, + "learning_rate": 2e-05, + "loss": 0.6124, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 1.4743932485580444, + "learning_rate": 2e-05, + "loss": 0.8501, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 1.8894503116607666, + "learning_rate": 2e-05, + "loss": 0.7892, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 4.588108539581299, + "learning_rate": 2e-05, + "loss": 1.0005, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 0.5758951306343079, + "learning_rate": 2e-05, + "loss": 0.1539, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 3.7251107692718506, + "learning_rate": 2e-05, + "loss": 0.3073, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 2.5955007076263428, + "learning_rate": 2e-05, + "loss": 0.7984, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 2.8188343048095703, + "learning_rate": 2e-05, + "loss": 0.8585, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 4.2932634353637695, + "learning_rate": 2e-05, + "loss": 0.7, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 2.4785430431365967, + "learning_rate": 2e-05, + "loss": 1.4911, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 3.244961977005005, + "learning_rate": 2e-05, + "loss": 0.9058, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 3.3959240913391113, + "learning_rate": 2e-05, + "loss": 1.928, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 0.36406227946281433, + "learning_rate": 2e-05, + "loss": 1.2079, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 1.649201512336731, + "learning_rate": 2e-05, + "loss": 1.3682, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 1.951743721961975, + "learning_rate": 2e-05, + "loss": 0.9706, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 1.6012216806411743, + "learning_rate": 2e-05, + "loss": 0.956, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 1.059224247932434, + "learning_rate": 2e-05, + "loss": 0.7971, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 1.2695350646972656, + "learning_rate": 2e-05, + "loss": 1.2903, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 0.9126003980636597, + "learning_rate": 2e-05, + "loss": 0.486, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 0.9548375606536865, + "learning_rate": 2e-05, + "loss": 0.4924, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 5653713448337408.0, + "train_loss": 1.0004102569265463, + "train_runtime": 222.4287, + "train_samples_per_second": 1.744, + "train_steps_per_second": 0.436 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 5653713448337408.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round10.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..ce159db736548a09d43ed42dcefd6677bcb030e3 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac50ab133a7a5aa9dfea61e6d8ed7653bb6f285eb13975c45759804e1c5a0113 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round12.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..9e9758828e9d9f292debe3f0870d39b64327e0b2 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66dd8680ac517ba6ca8d2ff3c8a3cbad6fe0cccec680ad711d030f9dd2c6554f +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round15.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..54c4ea59ca080630180eb7c31f23cc75b8cd2593 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268c8d523348ff94235dca656d4225fe4d7311eda06f2dd672cb2995a74cf1ad +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round17.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ac72445d7cc123b2218762a03aac1930c39de7b --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ee153c72366a156c658c58c08fb31ae4d89aaf7cf231b1a3fc2cf80098a182 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round2.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..b84a635971e6c799504d60e08e8b7227bcf95490 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a9d2ff90a509ed280525e7783832b83f0e780f8cc85032615ccff649e9190e +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round20.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..859da5b7d6a017804f9bfa2e5214abd103a53941 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c82a6b29ae63539e855ee08429abf75f2eb504c822f65b9cd7a456e87d8af94 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round5.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..3219f789c46f8ed6438d680aae66be5e5f93ee33 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ecbe4f845d20983d9fa3c345743a695c773b6f8352ba9e0b9e3fd4efcd378d +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round7.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..1312fc9440c1107be2d2d5ff99c5dbe1e9c2e39d --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21522413a5083211437c3a7d2e7d2f40176b80d21234179e98a978a40f816dac +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_trainer_state.json b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..6ac1bafb526c7106ca21d267ce8a8636ad2f5e3c --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 5.094399929046631, + "learning_rate": 2e-05, + "loss": 1.5978, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 2.2240917682647705, + "learning_rate": 2e-05, + "loss": 2.3088, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 1.5078622102737427, + "learning_rate": 2e-05, + "loss": 0.9092, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 0.8912699818611145, + "learning_rate": 2e-05, + "loss": 0.6373, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 0.416252076625824, + "learning_rate": 2e-05, + "loss": 0.8186, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 0.8248510360717773, + "learning_rate": 2e-05, + "loss": 1.0876, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 0.9105907082557678, + "learning_rate": 2e-05, + "loss": 0.9326, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 0.7425227761268616, + "learning_rate": 2e-05, + "loss": 1.1207, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 1.2341773509979248, + "learning_rate": 2e-05, + "loss": 1.0813, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.2988817691802979, + "learning_rate": 2e-05, + "loss": 1.5784, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 1.1802982091903687, + "learning_rate": 2e-05, + "loss": 1.1858, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 0.40825000405311584, + "learning_rate": 2e-05, + "loss": 1.0679, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 1.1907871961593628, + "learning_rate": 2e-05, + "loss": 0.9465, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 2.7417049407958984, + "learning_rate": 2e-05, + "loss": 1.6913, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 1.4188278913497925, + "learning_rate": 2e-05, + "loss": 1.126, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 1.1148083209991455, + "learning_rate": 2e-05, + "loss": 0.5853, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 1.284436821937561, + "learning_rate": 2e-05, + "loss": 0.6709, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 1.7680528163909912, + "learning_rate": 2e-05, + "loss": 0.6444, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 1.0730924606323242, + "learning_rate": 2e-05, + "loss": 0.6197, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 0.9840460419654846, + "learning_rate": 2e-05, + "loss": 0.9225, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 2.7215404510498047, + "learning_rate": 2e-05, + "loss": 1.1065, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 1.0859086513519287, + "learning_rate": 2e-05, + "loss": 1.6448, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 0.6916680335998535, + "learning_rate": 2e-05, + "loss": 0.5747, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 0.5634881854057312, + "learning_rate": 2e-05, + "loss": 0.8072, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 1.403308629989624, + "learning_rate": 2e-05, + "loss": 0.757, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 1.0651711225509644, + "learning_rate": 2e-05, + "loss": 1.2329, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 3.2769243717193604, + "learning_rate": 2e-05, + "loss": 0.9653, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 1.2478959560394287, + "learning_rate": 2e-05, + "loss": 0.8591, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 3.3655834197998047, + "learning_rate": 2e-05, + "loss": 1.6742, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 1.0023908615112305, + "learning_rate": 2e-05, + "loss": 1.0587, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 4.638378620147705, + "learning_rate": 2e-05, + "loss": 1.052, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 1.3997457027435303, + "learning_rate": 2e-05, + "loss": 0.7772, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 2.229414224624634, + "learning_rate": 2e-05, + "loss": 1.2991, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 0.4760843515396118, + "learning_rate": 2e-05, + "loss": 0.9409, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 1.4938956499099731, + "learning_rate": 2e-05, + "loss": 1.0356, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 1.7016663551330566, + "learning_rate": 2e-05, + "loss": 0.9062, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 1.5440024137496948, + "learning_rate": 2e-05, + "loss": 1.5393, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 0.718760073184967, + "learning_rate": 2e-05, + "loss": 0.5889, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 1.5525449514389038, + "learning_rate": 2e-05, + "loss": 1.275, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 0.4799572229385376, + "learning_rate": 2e-05, + "loss": 0.7098, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 1.6241955757141113, + "learning_rate": 2e-05, + "loss": 1.1278, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 1.5434255599975586, + "learning_rate": 2e-05, + "loss": 0.8865, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 4.1449079513549805, + "learning_rate": 2e-05, + "loss": 1.3477, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 1.316735029220581, + "learning_rate": 2e-05, + "loss": 0.5452, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 1.4440531730651855, + "learning_rate": 2e-05, + "loss": 0.7568, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 0.6465669870376587, + "learning_rate": 2e-05, + "loss": 0.5148, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 3.1840262413024902, + "learning_rate": 2e-05, + "loss": 0.8276, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 2.191006898880005, + "learning_rate": 2e-05, + "loss": 1.0671, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 1.3522822525616128e+16, + "train_loss": 1.024123240991966, + "train_runtime": 329.2802, + "train_samples_per_second": 1.178, + "train_steps_per_second": 0.295 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 1.3522822525616128e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round10.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..572d755c9a95183f67caa3ab081a379fd2e6ae1b --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1953a5d682996bf7f4974e09538f0db4357535a914fdb147d514c228417d8158 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round12.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..e544180afe9fd10ee7030e76850704aef2900c10 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed6b8398417dec05d433da0925ff0676355f83e22912bb2f246305243882495 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round15.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..f3dd0ddd9175b7ccbeae00396cb5cc8ed74deec7 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c86152694df067a9e575791bae4a78d113d1c1f3913acddace1c81189a40bf60 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round17.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..37dc60d58e9d74027211d6f82722deab7980ed72 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:007fd7465945f737972fd09d5a5bfac976291174c2cc1f3e6c0abd42fb1e15cd +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round2.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..62b74d233775b7768e610eb22af3c93cee27d4a2 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be898f74488af89b95d07167565247944b62909ca7fb60878c1b9188e44ae294 +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round20.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa752942ec68071d1370c20347d8ecff3c70fdfc --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:660fb4b5ab21dd5fa6cd373a6b44bf7bd6aa27bb38b6ba9ee00958c570110ae9 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round5.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..d0b8a9e22276c2b6cf1e6d7f871d0f9583add585 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:072d545c26b4cc2a1e2ac58d2d97e7ee52ea4b8b2e6598e811dc3ab58507587d +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round7.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..7de41ba03849e4bb08e58fff7f9682added742d0 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c36cedd65d7a1994dcd41a9ed47d891dcca4dba251524fa7d3877c98a16075 +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_trainer_state.json b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..cdbfb531f247be640c139742b54e76186f918bc9 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 2.715688943862915, + "learning_rate": 2e-05, + "loss": 0.7903, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 1.7270240783691406, + "learning_rate": 2e-05, + "loss": 0.8497, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 2.6262009143829346, + "learning_rate": 2e-05, + "loss": 2.5311, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 2.0781748294830322, + "learning_rate": 2e-05, + "loss": 0.6511, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 3.878676176071167, + "learning_rate": 2e-05, + "loss": 1.6893, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 0.30152788758277893, + "learning_rate": 2e-05, + "loss": 0.2982, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 2.4543538093566895, + "learning_rate": 2e-05, + "loss": 1.4963, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 1.1550655364990234, + "learning_rate": 2e-05, + "loss": 0.5657, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 1.4158210754394531, + "learning_rate": 2e-05, + "loss": 0.6207, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.8720401525497437, + "learning_rate": 2e-05, + "loss": 0.9528, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 1.3980697393417358, + "learning_rate": 2e-05, + "loss": 0.7742, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 0.7552713751792908, + "learning_rate": 2e-05, + "loss": 0.56, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 2.9224400520324707, + "learning_rate": 2e-05, + "loss": 0.761, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 2.1200363636016846, + "learning_rate": 2e-05, + "loss": 1.8194, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 1.0131165981292725, + "learning_rate": 2e-05, + "loss": 0.5858, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 1.1930532455444336, + "learning_rate": 2e-05, + "loss": 0.3527, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 0.8298959136009216, + "learning_rate": 2e-05, + "loss": 0.7283, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 0.21372075378894806, + "learning_rate": 2e-05, + "loss": 0.679, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 0.6620970368385315, + "learning_rate": 2e-05, + "loss": 0.308, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 1.3406527042388916, + "learning_rate": 2e-05, + "loss": 1.0992, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 8.218306541442871, + "learning_rate": 2e-05, + "loss": 2.0959, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 1.171020269393921, + "learning_rate": 2e-05, + "loss": 0.6386, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 2.1302266120910645, + "learning_rate": 2e-05, + "loss": 1.7207, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 1.39640474319458, + "learning_rate": 2e-05, + "loss": 1.7815, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 1.7075337171554565, + "learning_rate": 2e-05, + "loss": 1.1565, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 0.19492167234420776, + "learning_rate": 2e-05, + "loss": 0.3214, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 2.8099043369293213, + "learning_rate": 2e-05, + "loss": 1.2814, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 3.1069672107696533, + "learning_rate": 2e-05, + "loss": 1.6989, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 1.5938727855682373, + "learning_rate": 2e-05, + "loss": 1.0741, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 2.409372329711914, + "learning_rate": 2e-05, + "loss": 0.712, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 1.280025839805603, + "learning_rate": 2e-05, + "loss": 0.6074, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 1.893931269645691, + "learning_rate": 2e-05, + "loss": 0.9652, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 1.0092408657073975, + "learning_rate": 2e-05, + "loss": 0.5104, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 1.1251095533370972, + "learning_rate": 2e-05, + "loss": 0.5629, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 3.200808048248291, + "learning_rate": 2e-05, + "loss": 1.9959, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 2.1445953845977783, + "learning_rate": 2e-05, + "loss": 0.8926, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 0.7390415072441101, + "learning_rate": 2e-05, + "loss": 0.3945, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 3.7797181606292725, + "learning_rate": 2e-05, + "loss": 1.2296, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 1.9498169422149658, + "learning_rate": 2e-05, + "loss": 0.9621, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 2.3580148220062256, + "learning_rate": 2e-05, + "loss": 1.074, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 3.7689895629882812, + "learning_rate": 2e-05, + "loss": 0.8532, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 1.0212076902389526, + "learning_rate": 2e-05, + "loss": 0.3944, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 1.0816051959991455, + "learning_rate": 2e-05, + "loss": 0.7249, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 0.7434933185577393, + "learning_rate": 2e-05, + "loss": 0.4865, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 1.409759521484375, + "learning_rate": 2e-05, + "loss": 0.5403, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 2.005401849746704, + "learning_rate": 2e-05, + "loss": 1.0927, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 3.6402158737182617, + "learning_rate": 2e-05, + "loss": 0.7249, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 2.5542266368865967, + "learning_rate": 2e-05, + "loss": 1.3884, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 1.5329114357497856e+16, + "train_loss": 0.9519824686738634, + "train_runtime": 357.0654, + "train_samples_per_second": 1.087, + "train_steps_per_second": 0.272 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 1.5329114357497856e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round10.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..78e004f232f20ba97fd4ed737d4ce6e824d02cc3 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4803816dd8fe4467fa5f43227533a56f083b8ad0f6ddd457d12f761c554043f4 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round12.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..044792e7ee7b2d16c9cf8b89019f40253ef894ca --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17a6865b4d478bbb296c1066419695af40fc07ad1147c3fbff13658f9808bc29 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round15.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..df0567844df9f6a952b3d562334d5b244c3e2f45 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b66cc40edb9397433df9178db225f73eafa6ea65334a7650e8930a9fbbb8b4a4 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round17.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..8cedea4d69dc23538ff9b00ac4635e165b7163b9 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68112bcb7c765592e71c2a4308eb7fc02b16edd1004be3c05f8ea3fb426f24c7 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round2.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..d1aee57bc95bba8a4ab437825bab0176c8db3cc8 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:821b9803cea659a4bee96d4875ddcf797492fe28233d4eb5c9f67c7c429d5d60 +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round20.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..f84583b979e3371274da0cb8bf02a3461f580009 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2bf168da76f1338f80db83394c6a07d9359185723fa8e27c2aee29c881c64f1 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round5.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..6d44a506a826d0917f0ce4507502e82726d3b203 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ceb89ff4f0927002a37fbf5b1b3961045b663c7ab2467c070fde86fc9f14a14 +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round7.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..15239ac86212427817a2b6bcfa2178a533290e91 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fffbadb068adde75a38be22546d8dfa6c08ffaa70b7f23aa68aeb6eff62809f +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_trainer_state.json b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..e858c839c208552a282ba057edca2809bdffc8bd --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 0.5930002927780151, + "learning_rate": 2e-05, + "loss": 1.7236, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 0.7709837555885315, + "learning_rate": 2e-05, + "loss": 2.0088, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 0.4815305769443512, + "learning_rate": 2e-05, + "loss": 1.4131, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 0.48609688878059387, + "learning_rate": 2e-05, + "loss": 1.1724, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 0.4869016706943512, + "learning_rate": 2e-05, + "loss": 1.7295, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 0.37476807832717896, + "learning_rate": 2e-05, + "loss": 1.6475, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 0.6886877417564392, + "learning_rate": 2e-05, + "loss": 1.4917, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 0.5024330615997314, + "learning_rate": 2e-05, + "loss": 1.4277, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 0.6298432946205139, + "learning_rate": 2e-05, + "loss": 1.5801, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 0.46709224581718445, + "learning_rate": 2e-05, + "loss": 1.625, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 0.4031917154788971, + "learning_rate": 2e-05, + "loss": 1.5425, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 0.5809447169303894, + "learning_rate": 2e-05, + "loss": 1.8184, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 0.43344253301620483, + "learning_rate": 2e-05, + "loss": 1.6924, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 0.5011717081069946, + "learning_rate": 2e-05, + "loss": 1.3584, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 0.4586883783340454, + "learning_rate": 2e-05, + "loss": 1.501, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 0.6749467253684998, + "learning_rate": 2e-05, + "loss": 1.6797, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 0.38988545536994934, + "learning_rate": 2e-05, + "loss": 1.3579, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 0.48226863145828247, + "learning_rate": 2e-05, + "loss": 1.707, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 0.48712313175201416, + "learning_rate": 2e-05, + "loss": 1.4121, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 0.44966915249824524, + "learning_rate": 2e-05, + "loss": 1.6276, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 0.5168526768684387, + "learning_rate": 2e-05, + "loss": 1.6426, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 0.5030601620674133, + "learning_rate": 2e-05, + "loss": 1.5693, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 0.7527281045913696, + "learning_rate": 2e-05, + "loss": 1.5518, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 1.2194421291351318, + "learning_rate": 2e-05, + "loss": 1.5342, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 0.5955514907836914, + "learning_rate": 2e-05, + "loss": 1.5137, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 0.7728529572486877, + "learning_rate": 2e-05, + "loss": 1.6963, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 0.73228919506073, + "learning_rate": 2e-05, + "loss": 1.4502, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 0.4163931906223297, + "learning_rate": 2e-05, + "loss": 1.4219, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 0.5588869452476501, + "learning_rate": 2e-05, + "loss": 1.1425, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 0.6062840223312378, + "learning_rate": 2e-05, + "loss": 1.4331, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 1.0351043939590454, + "learning_rate": 2e-05, + "loss": 1.4609, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 0.6619802713394165, + "learning_rate": 2e-05, + "loss": 1.4189, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 0.37535732984542847, + "learning_rate": 2e-05, + "loss": 1.3813, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 0.9288793802261353, + "learning_rate": 2e-05, + "loss": 1.397, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 1.1058944463729858, + "learning_rate": 2e-05, + "loss": 1.4009, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 0.7440882921218872, + "learning_rate": 2e-05, + "loss": 1.007, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 1.2134323120117188, + "learning_rate": 2e-05, + "loss": 1.3503, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 0.4168848693370819, + "learning_rate": 2e-05, + "loss": 1.0313, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 1.7301552295684814, + "learning_rate": 2e-05, + "loss": 1.4034, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 0.9088520407676697, + "learning_rate": 2e-05, + "loss": 1.8931, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 1.6952238082885742, + "learning_rate": 2e-05, + "loss": 1.0514, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 1.3661904335021973, + "learning_rate": 2e-05, + "loss": 1.5254, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 1.5365053415298462, + "learning_rate": 2e-05, + "loss": 1.5001, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 0.4049004018306732, + "learning_rate": 2e-05, + "loss": 1.4141, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 2.052964448928833, + "learning_rate": 2e-05, + "loss": 1.0455, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 0.5465191602706909, + "learning_rate": 2e-05, + "loss": 0.741, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 1.1672446727752686, + "learning_rate": 2e-05, + "loss": 1.199, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 5.172623634338379, + "learning_rate": 2e-05, + "loss": 1.6101, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 2.080121124238131e+16, + "train_loss": 1.4608057553006202, + "train_runtime": 363.6952, + "train_samples_per_second": 1.067, + "train_steps_per_second": 0.267 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2.080121124238131e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round10.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..6c46b8b16c831cd2785e179c6f877ed9a45370f8 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:628f3ab6268a995e5a6e695182629e912860d336c361110825fb7b14d330bdfc +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round12.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..a833bee1613efd60c9c53f54f55fd81c8ea94b7a --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f1eee78bdc9cbaaa5ace24962d539c619df8286a9a8c422289db2d7ab9cf5b0 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round15.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..8434cbb05ae17df8d89d97a6df374797e98fbcfe --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e796e13255d7cee709ff69e3726f6fce731a851ab6157426a862a721e87d3cb +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round17.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..8bcd83bfa93daa6d243b9f3f379be30ccd569421 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdf354f93337dea3a94a04a869e06347f6ddcdb402a620069706c8a3c277b8e4 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round2.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..b6985b53eea0b7b126b939c652f10a7767c21c26 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54df4904f4d80d2309f8e2f522b18507c5d402c766e60b504ee27c785f98c7f6 +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round20.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..9218cb9e6b1588e815727d922cbdebe18a5275ad --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc7b2d7613df2e86e28c49ee82f08d88d80e81163985534d20ec6f6315e4088 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round5.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..7966b53427a4c873f20bfcd091c59b3550253c7f --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68b90ac9fa152488ded4afc57fe26add9bcab9bea5454ffa4ab484f45ff280c6 +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round7.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..3669f1611fa2f38be59b563c626e242f7d352f51 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517901987a25dbccbe2e3c55929dd9f1d58b55e2c4ba4e450b7b6a6115e9ba8f +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_trainer_state.json b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..352f0a557a66545e265a06223d7ffaba0cc4faaf --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 1.857858657836914, + "learning_rate": 2e-05, + "loss": 1.0093, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 1.128074049949646, + "learning_rate": 2e-05, + "loss": 0.9811, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 1.1853967905044556, + "learning_rate": 2e-05, + "loss": 0.6298, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 2.01977276802063, + "learning_rate": 2e-05, + "loss": 0.7973, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 3.552171468734741, + "learning_rate": 2e-05, + "loss": 3.2413, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 2.4959380626678467, + "learning_rate": 2e-05, + "loss": 0.8036, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 0.18528757989406586, + "learning_rate": 2e-05, + "loss": 0.8049, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 0.3887205421924591, + "learning_rate": 2e-05, + "loss": 1.034, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 1.167763352394104, + "learning_rate": 2e-05, + "loss": 1.0904, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.1180120706558228, + "learning_rate": 2e-05, + "loss": 1.1927, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 0.34743738174438477, + "learning_rate": 2e-05, + "loss": 0.9405, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 0.5589756965637207, + "learning_rate": 2e-05, + "loss": 1.2665, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 1.364461898803711, + "learning_rate": 2e-05, + "loss": 0.9861, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 1.4796721935272217, + "learning_rate": 2e-05, + "loss": 1.282, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 1.5695762634277344, + "learning_rate": 2e-05, + "loss": 2.2431, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 1.308424949645996, + "learning_rate": 2e-05, + "loss": 1.0269, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 0.9424493908882141, + "learning_rate": 2e-05, + "loss": 0.8531, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 1.148472547531128, + "learning_rate": 2e-05, + "loss": 0.954, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 2.9015464782714844, + "learning_rate": 2e-05, + "loss": 1.3365, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 2.0090081691741943, + "learning_rate": 2e-05, + "loss": 1.3861, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 1.2990866899490356, + "learning_rate": 2e-05, + "loss": 0.435, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 1.2898091077804565, + "learning_rate": 2e-05, + "loss": 1.7354, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 1.301903486251831, + "learning_rate": 2e-05, + "loss": 0.923, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 1.1289761066436768, + "learning_rate": 2e-05, + "loss": 0.4642, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 3.627347707748413, + "learning_rate": 2e-05, + "loss": 1.187, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 0.9005461931228638, + "learning_rate": 2e-05, + "loss": 0.7929, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 1.4061144590377808, + "learning_rate": 2e-05, + "loss": 1.3737, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 1.6655174493789673, + "learning_rate": 2e-05, + "loss": 1.4762, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 2.249619483947754, + "learning_rate": 2e-05, + "loss": 1.3758, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 3.719571113586426, + "learning_rate": 2e-05, + "loss": 1.0628, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 2.0385303497314453, + "learning_rate": 2e-05, + "loss": 0.8212, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 1.5352033376693726, + "learning_rate": 2e-05, + "loss": 0.5521, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 1.1133532524108887, + "learning_rate": 2e-05, + "loss": 1.0727, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 0.3139188289642334, + "learning_rate": 2e-05, + "loss": 0.6619, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 0.13998755812644958, + "learning_rate": 2e-05, + "loss": 1.2334, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 0.7787773013114929, + "learning_rate": 2e-05, + "loss": 1.425, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 2.650651693344116, + "learning_rate": 2e-05, + "loss": 1.5593, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 2.5681259632110596, + "learning_rate": 2e-05, + "loss": 0.8564, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 1.672986626625061, + "learning_rate": 2e-05, + "loss": 0.3764, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 1.4562022686004639, + "learning_rate": 2e-05, + "loss": 1.0597, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 1.849575161933899, + "learning_rate": 2e-05, + "loss": 0.6571, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 1.7122550010681152, + "learning_rate": 2e-05, + "loss": 0.7316, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 0.9788981080055237, + "learning_rate": 2e-05, + "loss": 1.8302, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 4.261756896972656, + "learning_rate": 2e-05, + "loss": 1.748, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 0.5180452466011047, + "learning_rate": 2e-05, + "loss": 0.6574, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 3.8009090423583984, + "learning_rate": 2e-05, + "loss": 1.222, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 2.206448793411255, + "learning_rate": 2e-05, + "loss": 2.1999, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 1.8258347511291504, + "learning_rate": 2e-05, + "loss": 1.6342, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 1.975033480085504e+16, + "train_loss": 1.1381244143259894, + "train_runtime": 347.3529, + "train_samples_per_second": 1.117, + "train_steps_per_second": 0.279 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 1.975033480085504e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round10.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..a57dac23a2b911a899f5df6631e36694bd82794f --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d75b434f434ac58ee7ff79a1192526027663a462f31003c61af666ca2c8197b +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round12.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..92e8ed501048fe1260ba65e664c7eae64422a318 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e40c641acfb84bd93aec680098654d6533f26cea5a9317dba50857689945e350 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round15.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..791bae7dc57216d40bd4febe4b5f344aa74a9b5f --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bea02c21b18787ce374ede742d2698c2221d15bd03cac84c80e8f25d54d2f3a3 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round17.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..189172f34788c21a1e37da4489ec049d8c6758f4 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7534dde78b8b023855befc1292d21473ab56079172d82bf4f570b1cf7959e012 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round2.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..d5ef9e8a9c7cf1448ab8bb5cacfbfe7d636ba154 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bccb9abfe6b71dff526a503d33d640fb761439901f9e58e425b441518d29bb8d +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round20.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..4670a11f279222654ef2597fc700392f1a4a5ce4 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f87425298b15457fea29807819c31436245a6de280a7fc903521e6e2f831179d +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round5.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd425f5c92b7a1ac49d27e11d7e3243323b97b06 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f95be3295ca83cf90ef80aaf5fc6ff54eee9d129d79c3cc1ebb13d9d59085d2 +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round7.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..761414fa457ccce047562c592e58d3314fffc9f8 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9b2dac41ada33dc1ed38d15ae5a8fadaec0d13690d5431ef8251f8c4a84ece +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_trainer_state.json b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..1156c6c059ee6cfc619ede99f2599fe46fc02e12 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 2.161454200744629, + "learning_rate": 2e-05, + "loss": 1.683, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 0.40093937516212463, + "learning_rate": 2e-05, + "loss": 1.2557, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 1.618806004524231, + "learning_rate": 2e-05, + "loss": 1.2597, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 0.4591558873653412, + "learning_rate": 2e-05, + "loss": 0.6036, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 2.3515193462371826, + "learning_rate": 2e-05, + "loss": 1.2634, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 1.4352556467056274, + "learning_rate": 2e-05, + "loss": 0.6866, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 0.4916004538536072, + "learning_rate": 2e-05, + "loss": 0.9618, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 0.9008558988571167, + "learning_rate": 2e-05, + "loss": 0.8086, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 0.5180691480636597, + "learning_rate": 2e-05, + "loss": 0.7023, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 0.21598584949970245, + "learning_rate": 2e-05, + "loss": 0.5936, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 1.9789445400238037, + "learning_rate": 2e-05, + "loss": 0.7507, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 0.4040895402431488, + "learning_rate": 2e-05, + "loss": 0.926, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 3.917529582977295, + "learning_rate": 2e-05, + "loss": 1.3788, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 0.5209499001502991, + "learning_rate": 2e-05, + "loss": 0.3468, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 0.863224446773529, + "learning_rate": 2e-05, + "loss": 0.1496, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 0.8937453031539917, + "learning_rate": 2e-05, + "loss": 0.7099, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 0.851498007774353, + "learning_rate": 2e-05, + "loss": 0.8454, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 0.452116459608078, + "learning_rate": 2e-05, + "loss": 0.5287, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 3.0233278274536133, + "learning_rate": 2e-05, + "loss": 0.4608, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 0.29843541979789734, + "learning_rate": 2e-05, + "loss": 0.451, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 0.8193789124488831, + "learning_rate": 2e-05, + "loss": 0.6379, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 0.36019280552864075, + "learning_rate": 2e-05, + "loss": 1.0601, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 0.10708494484424591, + "learning_rate": 2e-05, + "loss": 0.2343, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 0.9287037253379822, + "learning_rate": 2e-05, + "loss": 0.6898, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 0.7059003710746765, + "learning_rate": 2e-05, + "loss": 0.2889, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 1.177734375, + "learning_rate": 2e-05, + "loss": 1.5371, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 0.35798653960227966, + "learning_rate": 2e-05, + "loss": 0.4085, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 0.297166109085083, + "learning_rate": 2e-05, + "loss": 0.4282, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 0.6196297407150269, + "learning_rate": 2e-05, + "loss": 0.7998, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 0.2350747138261795, + "learning_rate": 2e-05, + "loss": 0.8402, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 5.289220809936523, + "learning_rate": 2e-05, + "loss": 1.6843, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 0.5821011662483215, + "learning_rate": 2e-05, + "loss": 0.3986, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 0.057488661259412766, + "learning_rate": 2e-05, + "loss": 0.3316, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 0.9951735734939575, + "learning_rate": 2e-05, + "loss": 0.9058, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 0.22314199805259705, + "learning_rate": 2e-05, + "loss": 0.6105, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 0.26854678988456726, + "learning_rate": 2e-05, + "loss": 0.2872, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 0.6667194366455078, + "learning_rate": 2e-05, + "loss": 1.655, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 0.7721454501152039, + "learning_rate": 2e-05, + "loss": 0.5862, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 0.5301076173782349, + "learning_rate": 2e-05, + "loss": 0.639, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 1.1420249938964844, + "learning_rate": 2e-05, + "loss": 1.0943, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 0.5552510619163513, + "learning_rate": 2e-05, + "loss": 0.5427, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 0.5132323503494263, + "learning_rate": 2e-05, + "loss": 0.4128, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 0.163641095161438, + "learning_rate": 2e-05, + "loss": 0.3905, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 0.007550459820777178, + "learning_rate": 2e-05, + "loss": 0.1858, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 0.6305935978889465, + "learning_rate": 2e-05, + "loss": 0.483, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 0.3425631523132324, + "learning_rate": 2e-05, + "loss": 0.7733, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 0.52589350938797, + "learning_rate": 2e-05, + "loss": 0.5945, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 0.5986707210540771, + "learning_rate": 2e-05, + "loss": 0.3793, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 2.534672827416576e+16, + "train_loss": 0.7350392489089179, + "train_runtime": 388.042, + "train_samples_per_second": 1.0, + "train_steps_per_second": 0.25 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2.534672827416576e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round10.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..1e367ced36ebbd430c024fdf4208bc849423f8b2 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef8939484067f4bc8879f571c1a1fc48151b6b9685e5e12cecf0402b4e591c4 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round12.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..7dd8ef9b8ab5487e4cddb4e0aa57d915f5aaa933 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e1803daa06682cf5d6ae532ccae9f2cc50f0e42d3d32007fb186b987ee898e5 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round15.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..b8a9971495907a5908bf8223e7c74aa1346f116c --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75385ebaaf1878d4722692eec4c0a1d9c401b5451200470c32a3a4e3a08e1791 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round17.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..8947c3d46524a55e24493ecf525d51cf421a5994 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2de5b917fdfcbacc0ae61f8ffa2b82c320f8a51c29e14bd449654f8c116432f +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round2.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..d9c9b595387e18405245f9ea5c8854a37ecbcc84 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e2e5c9fd240020769cf8d127457b49e83fcc9a26313f69f43e44824d1a16da9 +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round20.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..9ba3cdb875535f490271c0a04555a9f57db98c90 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a14a6904ebad4cf5ecf0143d91ecc0132bd0e8293308329ee99b460f9f9c5e68 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round5.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..bee78b901177f6a940ae00adb05d2b588bf00ec1 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0346deaa8309e3ea825573fc36b9887b008dd5ad3973ec64229cddb69d02d375 +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round7.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..5245bba62bb2d975470a2b858f0dffdbb2bed0fe --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12ebfbb2e16f90238a430ed917f40c6846b927f214635511fefbb17336a94b51 +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_trainer_state.json b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..513eba4e2941e5b50fb8422385d920f9ebee1542 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/6_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 5.989874362945557, + "learning_rate": 2e-05, + "loss": 1.7851, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 4.076360702514648, + "learning_rate": 2e-05, + "loss": 1.874, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 4.228509902954102, + "learning_rate": 2e-05, + "loss": 1.5111, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 6.215860843658447, + "learning_rate": 2e-05, + "loss": 2.4282, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 3.0416128635406494, + "learning_rate": 2e-05, + "loss": 1.5563, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 2.27561616897583, + "learning_rate": 2e-05, + "loss": 1.5056, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 7.760651111602783, + "learning_rate": 2e-05, + "loss": 3.1666, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 4.179313659667969, + "learning_rate": 2e-05, + "loss": 1.3918, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 3.2306151390075684, + "learning_rate": 2e-05, + "loss": 1.2013, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.477596402168274, + "learning_rate": 2e-05, + "loss": 1.3969, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 2.773430109024048, + "learning_rate": 2e-05, + "loss": 1.5245, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 2.277453660964966, + "learning_rate": 2e-05, + "loss": 1.2809, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 3.175544500350952, + "learning_rate": 2e-05, + "loss": 3.1848, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 3.4732186794281006, + "learning_rate": 2e-05, + "loss": 2.0386, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 4.694352149963379, + "learning_rate": 2e-05, + "loss": 1.2363, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 1.2425066232681274, + "learning_rate": 2e-05, + "loss": 1.0511, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 7.343347549438477, + "learning_rate": 2e-05, + "loss": 1.8386, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 4.983409881591797, + "learning_rate": 2e-05, + "loss": 2.2939, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 7.051117897033691, + "learning_rate": 2e-05, + "loss": 1.2765, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 1.1056318283081055, + "learning_rate": 2e-05, + "loss": 0.4736, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 3.936626434326172, + "learning_rate": 2e-05, + "loss": 1.4005, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 2.9739370346069336, + "learning_rate": 2e-05, + "loss": 1.4822, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 0.9875234961509705, + "learning_rate": 2e-05, + "loss": 1.503, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 3.566375255584717, + "learning_rate": 2e-05, + "loss": 1.6282, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 7.616732120513916, + "learning_rate": 2e-05, + "loss": 0.8635, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 3.3316683769226074, + "learning_rate": 2e-05, + "loss": 0.8341, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 5.425723552703857, + "learning_rate": 2e-05, + "loss": 2.3478, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 8.32201862335205, + "learning_rate": 2e-05, + "loss": 2.4061, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 2.7938919067382812, + "learning_rate": 2e-05, + "loss": 1.7115, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 4.2429094314575195, + "learning_rate": 2e-05, + "loss": 1.8993, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 2.2217226028442383, + "learning_rate": 2e-05, + "loss": 1.0326, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 2.5544967651367188, + "learning_rate": 2e-05, + "loss": 1.6711, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 1.2873215675354004, + "learning_rate": 2e-05, + "loss": 1.1774, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 3.2555296421051025, + "learning_rate": 2e-05, + "loss": 2.1101, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 5.723442554473877, + "learning_rate": 2e-05, + "loss": 3.1733, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 5.4055705070495605, + "learning_rate": 2e-05, + "loss": 2.6068, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 3.087639570236206, + "learning_rate": 2e-05, + "loss": 1.0038, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 2.971449136734009, + "learning_rate": 2e-05, + "loss": 2.2932, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 3.008423328399658, + "learning_rate": 2e-05, + "loss": 2.293, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 2.3813021183013916, + "learning_rate": 2e-05, + "loss": 1.3383, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 5.059912204742432, + "learning_rate": 2e-05, + "loss": 2.241, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 1.1393848657608032, + "learning_rate": 2e-05, + "loss": 0.6499, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 4.186708450317383, + "learning_rate": 2e-05, + "loss": 2.1174, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 2.524853229522705, + "learning_rate": 2e-05, + "loss": 1.543, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 4.4834394454956055, + "learning_rate": 2e-05, + "loss": 3.0569, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 3.088503837585449, + "learning_rate": 2e-05, + "loss": 1.4262, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 1.3521441221237183, + "learning_rate": 2e-05, + "loss": 0.9903, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 1.630694031715393, + "learning_rate": 2e-05, + "loss": 0.9553, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 2798582845407232.0, + "train_loss": 1.7047151781849026, + "train_runtime": 216.3851, + "train_samples_per_second": 1.793, + "train_steps_per_second": 0.448 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2798582845407232.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round10.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..e11483465ca11d0268fbfe19ed4c8407966066e3 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:102a8a676c743fb2541a757071f86d126194dc3e48b6148034430e1afc2806a3 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round12.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..eb48f50723d8ff126c9bf5bca3886eb575e966ff --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9e31e478762562625ef7f53ff0742dcf297a24848572dd20e1b9c923180221e +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round15.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6c401249b330c0c061b1d620d29f3bbabe4b61b --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e6dc21aa78f4cb6386c8caafd037ad08e62dc36ae9aa89ab2a0021e288f9722 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round17.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..ed8cfa93de2370a2116031bbe865000b49607461 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e064c532757366ff66bf2571c23585077241bf0c66039311b9a76fa6ffe5bdfa +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round2.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..4afe3c77c55b80e37f9ebba2d0162c044cd918f7 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9480f77ded5faa15eb82f2d85448a0020e5b2012cc5bfc2440a8764bae41674e +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round20.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..54f774434c7ac6c9fc263fa94d9b2e58ceee6d4d --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4e765c16b7ac5f31953885c520aba91e8423932195ee3138a8515c9c80e8b11 +size 791578182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round5.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..d89afaf731d13bd6d9e8a25471e5b7d125cf033e --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dc5ed128b2f6a279f880773ae7309110ff9f546d122323d336ff098128b8253 +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round7.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..c80de5b34028c99b693affa75149199dabdd02c8 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:045370aee174a8602a3966b9e41fd8250c5a789188fd8378a0aa54a42100cffb +size 791576546 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_trainer_state.json b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..1853282e22fb36dedbcafa156da9cbd6238dfada --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/7_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 2.901174783706665, + "learning_rate": 2e-05, + "loss": 1.8211, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 4.28139591217041, + "learning_rate": 2e-05, + "loss": 2.6092, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 2.6621718406677246, + "learning_rate": 2e-05, + "loss": 3.0119, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 1.2815380096435547, + "learning_rate": 2e-05, + "loss": 1.3101, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 1.2982583045959473, + "learning_rate": 2e-05, + "loss": 2.3135, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 1.2952641248703003, + "learning_rate": 2e-05, + "loss": 1.2919, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 2.034066677093506, + "learning_rate": 2e-05, + "loss": 1.2764, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 1.7979387044906616, + "learning_rate": 2e-05, + "loss": 1.5599, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 0.4818597137928009, + "learning_rate": 2e-05, + "loss": 1.0318, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 0.956670343875885, + "learning_rate": 2e-05, + "loss": 0.8527, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 1.3955525159835815, + "learning_rate": 2e-05, + "loss": 1.9185, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 2.304298162460327, + "learning_rate": 2e-05, + "loss": 1.5558, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 2.356865406036377, + "learning_rate": 2e-05, + "loss": 1.1995, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 0.9977859258651733, + "learning_rate": 2e-05, + "loss": 1.0864, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 0.48920851945877075, + "learning_rate": 2e-05, + "loss": 0.9896, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 0.44538769125938416, + "learning_rate": 2e-05, + "loss": 0.9376, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 1.5177651643753052, + "learning_rate": 2e-05, + "loss": 1.6681, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 2.8961708545684814, + "learning_rate": 2e-05, + "loss": 1.6897, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 1.008218765258789, + "learning_rate": 2e-05, + "loss": 1.5509, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 1.176531434059143, + "learning_rate": 2e-05, + "loss": 1.4157, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 3.618342876434326, + "learning_rate": 2e-05, + "loss": 0.9961, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 1.0844309329986572, + "learning_rate": 2e-05, + "loss": 0.7571, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 4.102534294128418, + "learning_rate": 2e-05, + "loss": 1.736, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 2.684903383255005, + "learning_rate": 2e-05, + "loss": 1.8809, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 3.7344889640808105, + "learning_rate": 2e-05, + "loss": 1.8809, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 3.2938125133514404, + "learning_rate": 2e-05, + "loss": 1.4522, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 2.4378066062927246, + "learning_rate": 2e-05, + "loss": 0.9021, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 2.406059741973877, + "learning_rate": 2e-05, + "loss": 1.3394, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 0.6210973262786865, + "learning_rate": 2e-05, + "loss": 1.4056, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 1.2318004369735718, + "learning_rate": 2e-05, + "loss": 0.8238, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 3.7087228298187256, + "learning_rate": 2e-05, + "loss": 2.1121, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 0.9222784042358398, + "learning_rate": 2e-05, + "loss": 1.2021, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 2.96535587310791, + "learning_rate": 2e-05, + "loss": 1.9595, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 4.624764919281006, + "learning_rate": 2e-05, + "loss": 1.5927, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 1.6748323440551758, + "learning_rate": 2e-05, + "loss": 1.6721, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 1.2604132890701294, + "learning_rate": 2e-05, + "loss": 1.5449, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 1.4816038608551025, + "learning_rate": 2e-05, + "loss": 0.9394, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 0.45386260747909546, + "learning_rate": 2e-05, + "loss": 1.3483, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 1.9374059438705444, + "learning_rate": 2e-05, + "loss": 1.7654, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 1.082322120666504, + "learning_rate": 2e-05, + "loss": 1.7977, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 3.948037624359131, + "learning_rate": 2e-05, + "loss": 2.132, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 1.350508213043213, + "learning_rate": 2e-05, + "loss": 0.8769, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 1.0008695125579834, + "learning_rate": 2e-05, + "loss": 2.2793, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 1.0887056589126587, + "learning_rate": 2e-05, + "loss": 2.5544, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 1.0882996320724487, + "learning_rate": 2e-05, + "loss": 1.8521, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 1.3740499019622803, + "learning_rate": 2e-05, + "loss": 1.8152, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 0.6833955645561218, + "learning_rate": 2e-05, + "loss": 0.3912, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 1.1932474374771118, + "learning_rate": 2e-05, + "loss": 1.1816, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 8905552822272000.0, + "train_loss": 1.51465443483333, + "train_runtime": 320.9706, + "train_samples_per_second": 1.209, + "train_steps_per_second": 0.302 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 8905552822272000.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round10.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..db6207fd9c2fbbe212bd20f5fa5d85ee4e94550b --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:885e34076c658f5b5d30d6de80a85f0fc509d1142032b85af73d7d4c8e857599 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round12.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..224a49824a85fc29a2f242801b77934134c0c50d --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f4176f4e6332160e6abdc3796e2dbc7b1c7d52b2eceb33862503d83b4f7e36 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round15.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..06c54622b44f55eaff1d3955dacec25a10d12729 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a234c8e8420948f3c42cf52e2cca39e1e6d89051fdcee387747013d4f72e40d +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round17.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..e51f6593781d8787e20a203ea458a2311557cfc8 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aee29c2ae9e6ebf8ec1e736e5270d471088b9fa1e32cee8b1322690e4faa8da +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round2.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..67aa9cbedf030da1924f12a110630564d338cbbe --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b58c3dc28a1e6d24407169f360d28117772a5dd65d932a50dbc9f38990bfa1f +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round20.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..1067e28a1a2e36bbe52f31915bad8aaed52c2c20 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c27eb0e271e973ceb3ea7b9b89cb4308458aea30470c768363c50435d4df714c +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round5.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..033f6b7f6da53789ee38ccf5b19f4c32759d55c5 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1be7e5ecd0877436873344d91618c3840a981582c30d8dfb78bca0620de553 +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round7.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..02cce28d2e75963f6f39f4becdf7d6185b710e6e --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3925455a9272fd1a68d27938bd90a26b5c14aa934895a1a6edc67c85f39d0c1 +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_trainer_state.json b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..623765dcb7703018325e83d44cc1adfccc2ecc01 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/8_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 4.544999599456787, + "learning_rate": 2e-05, + "loss": 2.0825, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 2.283771276473999, + "learning_rate": 2e-05, + "loss": 1.7153, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 2.6339378356933594, + "learning_rate": 2e-05, + "loss": 3.1062, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 0.7697868347167969, + "learning_rate": 2e-05, + "loss": 3.1442, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 2.3016302585601807, + "learning_rate": 2e-05, + "loss": 1.8375, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 4.884305477142334, + "learning_rate": 2e-05, + "loss": 4.0098, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 0.7743316292762756, + "learning_rate": 2e-05, + "loss": 1.0983, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 6.767885208129883, + "learning_rate": 2e-05, + "loss": 2.5188, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 1.7237461805343628, + "learning_rate": 2e-05, + "loss": 3.2709, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.6093686819076538, + "learning_rate": 2e-05, + "loss": 1.3118, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 3.587228536605835, + "learning_rate": 2e-05, + "loss": 3.9541, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 5.8059515953063965, + "learning_rate": 2e-05, + "loss": 2.6989, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 2.2526609897613525, + "learning_rate": 2e-05, + "loss": 3.3164, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 2.765078067779541, + "learning_rate": 2e-05, + "loss": 4.3907, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 2.16410756111145, + "learning_rate": 2e-05, + "loss": 2.8488, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 1.8812283277511597, + "learning_rate": 2e-05, + "loss": 2.627, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 3.4154915809631348, + "learning_rate": 2e-05, + "loss": 3.0798, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 1.8584576845169067, + "learning_rate": 2e-05, + "loss": 2.183, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 5.281542778015137, + "learning_rate": 2e-05, + "loss": 1.817, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 1.8128688335418701, + "learning_rate": 2e-05, + "loss": 2.8046, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 3.983124256134033, + "learning_rate": 2e-05, + "loss": 2.5806, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 2.141648054122925, + "learning_rate": 2e-05, + "loss": 1.4187, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 1.7750370502471924, + "learning_rate": 2e-05, + "loss": 1.6869, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 1.856276512145996, + "learning_rate": 2e-05, + "loss": 2.2729, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 1.578888177871704, + "learning_rate": 2e-05, + "loss": 1.7366, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 3.416520595550537, + "learning_rate": 2e-05, + "loss": 2.073, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 4.930846214294434, + "learning_rate": 2e-05, + "loss": 2.3818, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 0.823712170124054, + "learning_rate": 2e-05, + "loss": 2.488, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 3.023837089538574, + "learning_rate": 2e-05, + "loss": 2.874, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 1.1760919094085693, + "learning_rate": 2e-05, + "loss": 2.1292, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 1.4508178234100342, + "learning_rate": 2e-05, + "loss": 1.9028, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 1.8921033143997192, + "learning_rate": 2e-05, + "loss": 3.084, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 2.687537431716919, + "learning_rate": 2e-05, + "loss": 3.833, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 1.8764926195144653, + "learning_rate": 2e-05, + "loss": 0.9186, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 2.439419746398926, + "learning_rate": 2e-05, + "loss": 2.4868, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 1.2766458988189697, + "learning_rate": 2e-05, + "loss": 3.0605, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 1.5604605674743652, + "learning_rate": 2e-05, + "loss": 1.1429, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 1.5391968488693237, + "learning_rate": 2e-05, + "loss": 1.6607, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 1.798148512840271, + "learning_rate": 2e-05, + "loss": 2.376, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 2.6645777225494385, + "learning_rate": 2e-05, + "loss": 2.0349, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 2.3767917156219482, + "learning_rate": 2e-05, + "loss": 1.2481, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 1.534809947013855, + "learning_rate": 2e-05, + "loss": 0.7783, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 2.8910951614379883, + "learning_rate": 2e-05, + "loss": 3.0625, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 1.5640689134597778, + "learning_rate": 2e-05, + "loss": 1.2363, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 4.772906303405762, + "learning_rate": 2e-05, + "loss": 4.1424, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 2.4793708324432373, + "learning_rate": 2e-05, + "loss": 3.0203, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 1.2466847896575928, + "learning_rate": 2e-05, + "loss": 0.752, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 5.899107933044434, + "learning_rate": 2e-05, + "loss": 0.9921, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 2136321831206912.0, + "train_loss": 2.3528099060058594, + "train_runtime": 203.1052, + "train_samples_per_second": 1.91, + "train_steps_per_second": 0.478 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2136321831206912.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round10.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..5ad0b185bf4cce222b25c96636536188bd28d0a5 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5f96bfbcd42c94975391a65b2e15f8e71951da6ea9ed9eda7db72348935930 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round12.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..f41d0ded73c86ebad42d5e427a05ddd9424adbef --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4203c7d3b76724925650774b286c69752fd21962c00e4d455790d57caf43d3c6 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round15.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..2893ac324f17aba639ef53242d7ec2fc4a3e3142 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7038bc3a1807d7acfe479bf4c62f68c2df4a87f80d9428640426b1d12452c86a +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round17.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..23ee54f1c3720d73a04105c6287c0b440bd3aa53 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c315c1ee5e93d6fba4cb04ef8ffb05cbf1d0e88508767c690ccc68dfb39626e +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round2.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..eb4c00e8c090cb9254a87e9e817592fb20be1a42 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a49a7ae9634e66bc845abd923b7a98922df3843072ce9068043722caaef048ac +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round20.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..3a959f9e9c49bce972663620c36a341fd1d322cf --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8355ab15c8c7cc169658a4d85172d13ee3c80ba2eff9f28315915b99d1cedfd7 +size 368443438 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round5.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..072a3d619bfc1807e9b06064ff902c1ca2576170 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12d9d15d1c23c598a8e8fd2af4fcf094551842f5169e95017522cf6a4efd68b9 +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round7.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..d37130d1d7467e1be00e7a89b0cf850f9fe18bb5 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12ca033b5852b2c5b319e961cf1631b3f7972282a89042d76349825027dfe1bb +size 368442474 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_trainer_state.json b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..f31403d9ae58135e5dfdd50d769546cf177afe3a --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/9_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 3.8100907802581787, + "learning_rate": 2e-05, + "loss": 2.2904, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 2.87021803855896, + "learning_rate": 2e-05, + "loss": 2.1719, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 3.069092273712158, + "learning_rate": 2e-05, + "loss": 1.7753, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 1.0851856470108032, + "learning_rate": 2e-05, + "loss": 2.011, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 3.774862051010132, + "learning_rate": 2e-05, + "loss": 2.4611, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 2.1158974170684814, + "learning_rate": 2e-05, + "loss": 2.5591, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 0.7925451397895813, + "learning_rate": 2e-05, + "loss": 0.8296, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 1.1956062316894531, + "learning_rate": 2e-05, + "loss": 2.0254, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 4.662135601043701, + "learning_rate": 2e-05, + "loss": 2.0844, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 3.827667713165283, + "learning_rate": 2e-05, + "loss": 2.2532, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 3.2033684253692627, + "learning_rate": 2e-05, + "loss": 2.5698, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 1.5866730213165283, + "learning_rate": 2e-05, + "loss": 1.4423, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 2.4296913146972656, + "learning_rate": 2e-05, + "loss": 1.4113, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 1.9395915269851685, + "learning_rate": 2e-05, + "loss": 1.6703, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 4.924380302429199, + "learning_rate": 2e-05, + "loss": 2.4546, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 4.495025634765625, + "learning_rate": 2e-05, + "loss": 2.2471, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 5.273983001708984, + "learning_rate": 2e-05, + "loss": 1.8329, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 1.2212046384811401, + "learning_rate": 2e-05, + "loss": 1.169, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 6.125927448272705, + "learning_rate": 2e-05, + "loss": 1.7271, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 2.8754186630249023, + "learning_rate": 2e-05, + "loss": 1.407, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 1.3894823789596558, + "learning_rate": 2e-05, + "loss": 1.1003, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 9.833595275878906, + "learning_rate": 2e-05, + "loss": 2.3855, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 2.241000175476074, + "learning_rate": 2e-05, + "loss": 0.8884, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 2.6601366996765137, + "learning_rate": 2e-05, + "loss": 1.3076, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 3.584256410598755, + "learning_rate": 2e-05, + "loss": 3.0178, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 5.417187213897705, + "learning_rate": 2e-05, + "loss": 2.2358, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 3.2286760807037354, + "learning_rate": 2e-05, + "loss": 2.0264, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 1.42276930809021, + "learning_rate": 2e-05, + "loss": 1.2761, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 7.244561672210693, + "learning_rate": 2e-05, + "loss": 2.6213, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 5.565174102783203, + "learning_rate": 2e-05, + "loss": 2.7817, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 2.2620787620544434, + "learning_rate": 2e-05, + "loss": 1.6047, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 2.922333002090454, + "learning_rate": 2e-05, + "loss": 1.8253, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 3.4184505939483643, + "learning_rate": 2e-05, + "loss": 1.5283, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 1.6338927745819092, + "learning_rate": 2e-05, + "loss": 1.5409, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 2.8306140899658203, + "learning_rate": 2e-05, + "loss": 2.3647, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 3.6244277954101562, + "learning_rate": 2e-05, + "loss": 1.6259, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 2.8590328693389893, + "learning_rate": 2e-05, + "loss": 2.1455, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 3.510274887084961, + "learning_rate": 2e-05, + "loss": 1.6719, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 2.605745792388916, + "learning_rate": 2e-05, + "loss": 1.8196, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 2.831752300262451, + "learning_rate": 2e-05, + "loss": 1.4585, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 1.2819002866744995, + "learning_rate": 2e-05, + "loss": 0.957, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 2.0344178676605225, + "learning_rate": 2e-05, + "loss": 1.6396, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 17.95958709716797, + "learning_rate": 2e-05, + "loss": 2.0942, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 5.369532585144043, + "learning_rate": 2e-05, + "loss": 2.6653, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 6.44849157333374, + "learning_rate": 2e-05, + "loss": 1.5656, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 5.2986955642700195, + "learning_rate": 2e-05, + "loss": 1.8278, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 2.556934356689453, + "learning_rate": 2e-05, + "loss": 1.6021, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 3.002997875213623, + "learning_rate": 2e-05, + "loss": 1.783, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 2750129647910912.0, + "train_loss": 1.865082396674402, + "train_runtime": 203.1837, + "train_samples_per_second": 1.91, + "train_steps_per_second": 0.477 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2750129647910912.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round10_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round10_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..8fc4605927fe873e0f32f215e35a056e68e7b6a7 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round10_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ac86a19878cd9fce2d0ded14f23b840aeeb8c45901930520fbb1ea7e3c23720 +size 335548196 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round11_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round11_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..5eb3c90fe2daf01ac78020903b01ab35fad60d3b --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round11_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32ff9bc7b19e289277f3379ac0b39f2101f18e25e9eb2e1b93b2535c9326ff88 +size 335548196 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round12_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round12_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..af13c3dec80d87b0afd71b144f132c509139c6a2 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round12_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efbd1afac72c7a51335303bfeca89cabe5d94764785ccc52c62708fe7c18222c +size 335548196 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round13_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round13_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..52c051f3a412b3cf30d3b06be3d3c30aceab1aa6 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round13_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03885632d520a5dfb01a343a588e8edcc826409477cbe3e52ffe2af3307e9137 +size 335548196 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round14_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round14_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..7f2ea49e7fcbc501db3e7f951b328634161f4411 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round14_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6298566720de7135ae076d5049f67f0933c934628a6c2972d98a3ca4855c8d90 +size 335548196 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round15_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round15_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..6db92bf59060838a0f00b4d71e5af8140da2ef0e --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round15_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92bc861c060d16eb9f2afdc6ca61ed3a242cf90b25eb3d959632a7089db12123 +size 335548196 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round16_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round16_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..80407854bb965ab25873dbe7c3ad90ea5807f509 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round16_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87fea7e7249fe30ed74259567885d917df6473caea993f41a380bf58c30f9c75 +size 335548196 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round17_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round17_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..52282b539cf8570fcd0ba64bbf1e01fd26606f23 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round17_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4c8c6457c01472cc3a24df6c6ac6eb56497b4fe48869341792560892bf36667 +size 335548196 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round18_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round18_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..fcf05f80a30b8b919e9020d0f1af9b7c2c3020b7 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round18_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ede54a0e0fca8a3864c3b581821e88d7fe0dd94d5436d0dfb392cfd6d97d637 +size 335548196 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round19_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round19_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..483bae93634036822e9e78a84b5f849c3550bac2 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round19_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e99db36eb2720278ab95fdf051b564c7d61c601bb44eedfb22329bc737c22d7 +size 335548196 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round1_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round1_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..5540d6d02635b6bdbd5d17a49855034f91462b2f --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round1_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48a8a5b5d52e1fd2a325a93b354d40b71be87c4bcc346aae909be3141c6232a0 +size 335548182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round20_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round20_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..202d8194955de3b77076a705d78dcf36ea5a95cd --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round20_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08d7ad19361222024f6ecbd484522742ef2ac7afd6febb3f0094e47a5d7eb24c +size 335548196 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round2_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round2_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..b472647d0f9a58143abaa7e95f98e1fbb0693433 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round2_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa70c8fe6577a6840dd8f6bb649cda65f5f0c216724ab369bf2604aca7bc84ef +size 335548182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round3_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round3_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..2c035a52b0bb5a3bdc5ab8ab911c288f2e48f0e4 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round3_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:300a12f2b3a8cccc2e18e00aba5b7718860f952caee9a94f7ae5c544b822ed3e +size 335548182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round4_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round4_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..967e84301dc2a698feffc5c09290e930e6267117 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round4_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9884dbe1010210f66d494824740541064662f4b457bba8c9c8c4fb968ed3e1e4 +size 335548182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round5_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round5_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..203259d8595d81dea3f953752dadff01cb05791b --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round5_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c186fe784d140ab7fd29efc7e11b45acfb58c03028205657abb1f88393e4e833 +size 335548182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round6_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round6_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..fe0e8b3fc02a434a6c70c7758fa3a4064a082bb8 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round6_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15eb87fd1e825687b1a8619a219ec44b00a7d12475df06d1c57080ce8ff3c29 +size 335548182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round7_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round7_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..ca5a4cd61cf61c8f4e23188eb73c034742d09543 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round7_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513767d8344cf4cb8cf0e791170439fddaf5a2bc3ff43a3c704fcbd14d4e13ed +size 335548182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round8_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round8_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..44f25c57d7840e904c0945b2cd92f74cb7b46c99 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round8_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1839f28aa31e043da0fcdb5f7f90e6e53d8d847b0e6fcf48ae918abca7d0889 +size 335548182 diff --git a/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round9_task_vector_local_weights.pth b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round9_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..dad965819472456b44e2d50c696a2f99dd0834f3 --- /dev/null +++ b/client_states_feddualMultipqfull2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/round9_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79efa8fe8e441248bd98e124ba49ac7410e2b3bbe5c414885900ca88660f0e35 +size 335548182