diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round10.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..2d164ce90300ed49dfdba6f14b5fd026861edced --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b16768f7dc2eae664e5fd275f1c0e4a05c9147bb79c0c4b402a18aeaaf8375d +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round12.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..cd5bb423ac1daebcd2786e5ab7a77a46deb39fdb --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebe47cb1aefad62c1fd613c76140e6267ba060f1c514591486cf4468523c5b41 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round15.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..e49f76e05a6c7c72335c5c69b176b3d3b8fda0c1 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f4e565288b1dd9e16440afea7c377fea6e8c2b86a937030cd568bd120fd038f +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round17.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..7119d544f1a6f5e24009e8e4d51c20c9b939cbb1 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1d356437d08bccdd3ce361ad9057428bcf4cae911a507b8332d938f41f5dc74 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round2.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..d920ef217e8281e5e4ea36f6ce112d4be317a20a --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e98f5737926eedec558b34d9e5d045c45ea50e7ff4c68699fa210aaaf5120a9 +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round20.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..b972faf0114d53ecba00b833d1d427b5c37f90c9 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15aa028b6cced7cfa1cde28f6be8395d18b370d33f5961c4652916168c869da9 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round5.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..f568194fcbec68cfdff281f396654658a6f9239c --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:421f88eb88ff09a6f10c9c0caf03a8665de01d152db170828eca4be38fb91eac +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round7.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..708cfc4d0dbe9472a98aac470e57b064dc589775 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:525f0f37c26b21e07d6e9178e77c0ef29b869daafb690f58a885a4a1402ea584 +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_trainer_state.json b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..dfcbef6be536863d656a19535475ae4ab3e2de21 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 4.400585174560547, + "learning_rate": 2e-05, + "loss": 2.1084, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 0.24108143150806427, + "learning_rate": 2e-05, + "loss": 0.5575, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 2.3387579917907715, + "learning_rate": 2e-05, + "loss": 1.3726, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 3.3745932579040527, + "learning_rate": 2e-05, + "loss": 1.0676, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 0.499793142080307, + "learning_rate": 2e-05, + "loss": 1.5278, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 1.0053821802139282, + "learning_rate": 2e-05, + "loss": 0.4909, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 1.3840383291244507, + "learning_rate": 2e-05, + "loss": 0.9338, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 2.917617082595825, + "learning_rate": 2e-05, + "loss": 0.3054, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 1.6473109722137451, + "learning_rate": 2e-05, + "loss": 0.8086, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.5606623888015747, + "learning_rate": 2e-05, + "loss": 1.9234, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 0.5007361173629761, + "learning_rate": 2e-05, + "loss": 0.7782, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 1.6239376068115234, + "learning_rate": 2e-05, + "loss": 1.1194, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 2.372718572616577, + "learning_rate": 2e-05, + "loss": 0.4856, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 1.8457813262939453, + "learning_rate": 2e-05, + "loss": 1.3728, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 0.855133593082428, + "learning_rate": 2e-05, + "loss": 2.0313, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 1.2432137727737427, + "learning_rate": 2e-05, + "loss": 0.4426, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 1.4432425498962402, + "learning_rate": 2e-05, + "loss": 0.7053, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 1.024395227432251, + "learning_rate": 2e-05, + "loss": 0.6134, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 1.194606900215149, + "learning_rate": 2e-05, + "loss": 0.8373, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 3.11031174659729, + "learning_rate": 2e-05, + "loss": 2.5497, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 1.2926805019378662, + "learning_rate": 2e-05, + "loss": 0.9482, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 0.5149866938591003, + "learning_rate": 2e-05, + "loss": 0.4165, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 1.190213680267334, + "learning_rate": 2e-05, + "loss": 0.9618, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 0.6894278526306152, + "learning_rate": 2e-05, + "loss": 1.0249, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 2.4215104579925537, + "learning_rate": 2e-05, + "loss": 2.0148, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 0.714414119720459, + "learning_rate": 2e-05, + "loss": 1.3428, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 1.1892106533050537, + "learning_rate": 2e-05, + "loss": 1.1607, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 1.21503484249115, + "learning_rate": 2e-05, + "loss": 1.836, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 0.6278855800628662, + "learning_rate": 2e-05, + "loss": 0.844, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 2.5338757038116455, + "learning_rate": 2e-05, + "loss": 0.7447, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 1.6841797828674316, + "learning_rate": 2e-05, + "loss": 0.8774, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 0.9872264862060547, + "learning_rate": 2e-05, + "loss": 0.9218, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 1.0775535106658936, + "learning_rate": 2e-05, + "loss": 0.9773, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 1.7016096115112305, + "learning_rate": 2e-05, + "loss": 1.3366, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 9.161294937133789, + "learning_rate": 2e-05, + "loss": 2.0726, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 1.1249581575393677, + "learning_rate": 2e-05, + "loss": 0.8084, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 1.4263134002685547, + "learning_rate": 2e-05, + "loss": 0.9452, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 3.8015453815460205, + "learning_rate": 2e-05, + "loss": 1.3966, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 1.51714026927948, + "learning_rate": 2e-05, + "loss": 1.3366, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 1.001514196395874, + "learning_rate": 2e-05, + "loss": 1.2534, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 0.437701553106308, + "learning_rate": 2e-05, + "loss": 0.6374, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 0.8562130928039551, + "learning_rate": 2e-05, + "loss": 0.8362, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 1.1629040241241455, + "learning_rate": 2e-05, + "loss": 0.6705, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 0.7516007423400879, + "learning_rate": 2e-05, + "loss": 0.9896, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 1.4195737838745117, + "learning_rate": 2e-05, + "loss": 0.8637, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 2.6594505310058594, + "learning_rate": 2e-05, + "loss": 1.1106, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 0.5046249628067017, + "learning_rate": 2e-05, + "loss": 0.7569, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 2.1814091205596924, + "learning_rate": 2e-05, + "loss": 1.1165, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 5716895332302848.0, + "train_loss": 1.0793670944331848, + "train_runtime": 222.0474, + "train_samples_per_second": 1.747, + "train_steps_per_second": 0.437 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 5716895332302848.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round10.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..9cc3728c6439ae1e7c945a6b6884fbf5bf3c7b99 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b4cf563ddeb6cec914fa98a3339483e303ee40bcfbc8177f2de90ec07fd9f32 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round12.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..45b18d6aeafabb58bd2e748691154a05640621f9 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d4e731a0acc1c910df1a066b29fbc699083b9afcfd305403782197d842e12ad +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round15.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..09de20201b08377fe97cd384fbbfe2fbf185268f --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72086853e3f2e6d801b2bbabd64045d8df56a4e1a9d90762650e9def4016026b +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round17.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..cff075e33fb4bcc0be1a05d1e55d777cfc0ace35 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca8e1391c42f7045fc6ae4257810e9ec6fa9b85ad051a083f1b3a6cc1c13b9e7 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round2.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..b03e1ead0492a5552de07dcab7f2eee900ac1db8 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ad99be95eca9ecc8be94e2334e2786ea50b2df0bc5a440a7200405c66c551aa +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round20.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6f775390d02e5aa425d7fa7adb4dbac5fd2d9a8 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e370b2d3fe5711152b28b41a8df70a261223af0d600ff997c0beee58add2f883 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round5.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..9b3cce0fe4465e8020eb48053fe1ee0f5c9ee456 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03b2c620112acbddbfdcaa58a0bcc02827da8b0c3062d0bbb0aacdbfce067764 +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round7.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..70a23ee0e7fa8e76f70af47ca55e1a5fb1ad143e --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9ad4a35f17fa2fa92dbf9df9678d3ab4ba7f3b43367db0b87142e429f809cd1 +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_trainer_state.json b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..1299ec0b47620325bd96795a8de5ce7d4b71b813 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 1.0367224216461182, + "learning_rate": 2e-05, + "loss": 2.1122, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 1.5293935537338257, + "learning_rate": 2e-05, + "loss": 2.3105, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 1.200186848640442, + "learning_rate": 2e-05, + "loss": 1.2933, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 0.551851749420166, + "learning_rate": 2e-05, + "loss": 1.01, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 1.2025572061538696, + "learning_rate": 2e-05, + "loss": 1.6588, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 0.773492693901062, + "learning_rate": 2e-05, + "loss": 1.269, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 1.1679770946502686, + "learning_rate": 2e-05, + "loss": 0.9164, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 0.5977709293365479, + "learning_rate": 2e-05, + "loss": 1.4414, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 1.0373786687850952, + "learning_rate": 2e-05, + "loss": 2.1323, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.6528465747833252, + "learning_rate": 2e-05, + "loss": 1.0931, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 1.2186673879623413, + "learning_rate": 2e-05, + "loss": 0.9268, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 0.9843794107437134, + "learning_rate": 2e-05, + "loss": 1.4834, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 1.1736723184585571, + "learning_rate": 2e-05, + "loss": 0.973, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 0.9919485449790955, + "learning_rate": 2e-05, + "loss": 1.426, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 0.3353116512298584, + "learning_rate": 2e-05, + "loss": 0.3913, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 0.7836465835571289, + "learning_rate": 2e-05, + "loss": 0.9893, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 0.6000968813896179, + "learning_rate": 2e-05, + "loss": 1.1023, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 1.1263123750686646, + "learning_rate": 2e-05, + "loss": 1.2717, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 1.4765498638153076, + "learning_rate": 2e-05, + "loss": 1.2275, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 0.7918884754180908, + "learning_rate": 2e-05, + "loss": 1.124, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 0.881719708442688, + "learning_rate": 2e-05, + "loss": 1.1614, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 0.5077035427093506, + "learning_rate": 2e-05, + "loss": 0.7703, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 1.0335602760314941, + "learning_rate": 2e-05, + "loss": 1.0186, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 2.6902318000793457, + "learning_rate": 2e-05, + "loss": 1.4702, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 0.48346254229545593, + "learning_rate": 2e-05, + "loss": 0.7069, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 0.43713346123695374, + "learning_rate": 2e-05, + "loss": 0.9541, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 0.7219210863113403, + "learning_rate": 2e-05, + "loss": 1.0328, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 0.6687954068183899, + "learning_rate": 2e-05, + "loss": 0.9612, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 0.4545569121837616, + "learning_rate": 2e-05, + "loss": 0.7134, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 1.4642369747161865, + "learning_rate": 2e-05, + "loss": 1.0691, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 0.866256058216095, + "learning_rate": 2e-05, + "loss": 0.9705, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 0.6883927583694458, + "learning_rate": 2e-05, + "loss": 1.0837, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 0.8896063566207886, + "learning_rate": 2e-05, + "loss": 1.2245, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 1.008226990699768, + "learning_rate": 2e-05, + "loss": 0.8514, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 0.5231401324272156, + "learning_rate": 2e-05, + "loss": 0.8315, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 1.1414425373077393, + "learning_rate": 2e-05, + "loss": 1.0161, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 0.8160688281059265, + "learning_rate": 2e-05, + "loss": 0.9522, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 4.522146224975586, + "learning_rate": 2e-05, + "loss": 1.3154, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 0.8005837798118591, + "learning_rate": 2e-05, + "loss": 1.38, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 0.8043385744094849, + "learning_rate": 2e-05, + "loss": 0.7023, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 0.4813634753227234, + "learning_rate": 2e-05, + "loss": 1.2706, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 2.6377651691436768, + "learning_rate": 2e-05, + "loss": 0.7818, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 0.9884634017944336, + "learning_rate": 2e-05, + "loss": 0.8094, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 1.7997894287109375, + "learning_rate": 2e-05, + "loss": 0.4816, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 1.9168503284454346, + "learning_rate": 2e-05, + "loss": 0.8998, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 0.4715125858783722, + "learning_rate": 2e-05, + "loss": 1.7297, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 0.7565422058105469, + "learning_rate": 2e-05, + "loss": 1.1934, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 1.6956796646118164, + "learning_rate": 2e-05, + "loss": 1.0388, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 1.3756887170285568e+16, + "train_loss": 1.1302465065238403, + "train_runtime": 315.5064, + "train_samples_per_second": 1.23, + "train_steps_per_second": 0.307 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 1.3756887170285568e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round10.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..4826b691271b9953251e18fb741bce723b01a147 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:623c27c6e16e61754cf9f9bde6b0a2f00c89549eada108fd4d3385eeaa29b8a5 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round12.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..571deb570f6dd57ada8524633ee23b0409680b4a --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9394ca5cba51cc4d5f9a628c5235add0cc79e6cefcbf73aab79088eaf9958ec2 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round15.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..46dfa65f60b440baf551d175925f94d19f14ba21 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1698991ce97c58e41af99e8d6b1461337859fc7938ede7e57f36eebb9dccf5f7 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round17.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd744708440211b81ba77031e4b4568b43354905 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de7badf37bc6814c02941952260ab1c4ea0434cdd296a402f91bb67747e52c24 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round2.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a372debdc96ae4d0b7eae761b9fee465f18fc3c0 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c6e3bfc5a8aab513e9fe3473e92e3048bfbc4d19bd4c4176ce0141a9c69225d +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round20.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f4ac85ea80c00d462bcbbcce1d87e5f7ca77cde --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e86a679b1183d5d4cc5c15a3054fd2b160fe0443325d5f0d091c265c5eb060f +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round5.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..d714bd2513ab7eef46efaaf5e9c20044f396c472 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc8dc7440211f75b47738e72ddd3bf0a982d45c096e63747b2ba17635f45434a +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round7.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..20caf812267fe1f3c5c34f7a2595abb880f80d31 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:206787c858348d28620a2bc4ffbc2c93037006a7963eff3316cb95bd1e6bc540 +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_trainer_state.json b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..23415eef208586eb2713bea970607263d118169f --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 2.538358211517334, + "learning_rate": 2e-05, + "loss": 0.6608, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 1.2682268619537354, + "learning_rate": 2e-05, + "loss": 0.9785, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 1.937935709953308, + "learning_rate": 2e-05, + "loss": 2.3516, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 1.4392732381820679, + "learning_rate": 2e-05, + "loss": 1.6785, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 1.5007473230361938, + "learning_rate": 2e-05, + "loss": 1.5229, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 0.6477186679840088, + "learning_rate": 2e-05, + "loss": 1.3816, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 2.7069621086120605, + "learning_rate": 2e-05, + "loss": 1.319, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 0.5525019764900208, + "learning_rate": 2e-05, + "loss": 0.9359, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 0.7979759573936462, + "learning_rate": 2e-05, + "loss": 1.6191, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 2.443120241165161, + "learning_rate": 2e-05, + "loss": 1.0461, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 0.8416927456855774, + "learning_rate": 2e-05, + "loss": 1.217, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 0.7521089315414429, + "learning_rate": 2e-05, + "loss": 1.0924, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 1.4497734308242798, + "learning_rate": 2e-05, + "loss": 1.1838, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 0.6999666690826416, + "learning_rate": 2e-05, + "loss": 1.1143, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 1.1742311716079712, + "learning_rate": 2e-05, + "loss": 0.9922, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 0.5971889495849609, + "learning_rate": 2e-05, + "loss": 1.6466, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 1.034390926361084, + "learning_rate": 2e-05, + "loss": 0.8025, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 2.665285110473633, + "learning_rate": 2e-05, + "loss": 0.9528, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 0.8578566312789917, + "learning_rate": 2e-05, + "loss": 0.9949, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 1.1724331378936768, + "learning_rate": 2e-05, + "loss": 0.903, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 1.1174654960632324, + "learning_rate": 2e-05, + "loss": 1.1925, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 1.1770066022872925, + "learning_rate": 2e-05, + "loss": 0.8522, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 0.9446500539779663, + "learning_rate": 2e-05, + "loss": 1.9395, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 0.4612779915332794, + "learning_rate": 2e-05, + "loss": 0.4162, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 0.7479944229125977, + "learning_rate": 2e-05, + "loss": 0.953, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 0.7862464189529419, + "learning_rate": 2e-05, + "loss": 0.3849, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 0.7938858270645142, + "learning_rate": 2e-05, + "loss": 0.6369, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 2.231029987335205, + "learning_rate": 2e-05, + "loss": 0.9901, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 0.3764982223510742, + "learning_rate": 2e-05, + "loss": 0.9056, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 0.9940462708473206, + "learning_rate": 2e-05, + "loss": 0.5912, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 0.9223126173019409, + "learning_rate": 2e-05, + "loss": 0.6726, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 0.7324680685997009, + "learning_rate": 2e-05, + "loss": 0.4076, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 0.8635823130607605, + "learning_rate": 2e-05, + "loss": 0.5997, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 1.428286075592041, + "learning_rate": 2e-05, + "loss": 0.9463, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 0.5211204290390015, + "learning_rate": 2e-05, + "loss": 0.7596, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 1.464924931526184, + "learning_rate": 2e-05, + "loss": 0.7913, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 2.8257651329040527, + "learning_rate": 2e-05, + "loss": 1.2766, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 2.5703413486480713, + "learning_rate": 2e-05, + "loss": 0.8435, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 1.486395239830017, + "learning_rate": 2e-05, + "loss": 0.9819, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 0.4546787738800049, + "learning_rate": 2e-05, + "loss": 0.2796, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 0.7543643116950989, + "learning_rate": 2e-05, + "loss": 0.2902, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 0.8718597292900085, + "learning_rate": 2e-05, + "loss": 0.5479, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 2.138429880142212, + "learning_rate": 2e-05, + "loss": 1.1224, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 0.581947922706604, + "learning_rate": 2e-05, + "loss": 0.9022, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 1.3591723442077637, + "learning_rate": 2e-05, + "loss": 0.9803, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 1.1390422582626343, + "learning_rate": 2e-05, + "loss": 1.1259, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 1.318390130996704, + "learning_rate": 2e-05, + "loss": 0.9855, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 1.238763451576233, + "learning_rate": 2e-05, + "loss": 0.4494, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 1.5309291128881152e+16, + "train_loss": 0.9762444643630195, + "train_runtime": 351.1873, + "train_samples_per_second": 1.105, + "train_steps_per_second": 0.276 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 1.5309291128881152e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round10.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..a1b57662b3a7cf015b91f5ee9fe44ac0beca846e --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fc77f4acfc80e842f0c49ca07c0518a93812788236835cee6b47f88c1ce363a +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round12.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..94215e27f3a9f50bf7c6694ce84e5aa981052c11 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40d3dc701382da26808567ded7104ae77026cab4a5a03ca85a9b7408b648375f +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round15.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..fdf5098474d5d0305caea9ac02bbd9fda15d621d --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6fbb24e8df10767d6e48cd3bbe7abb171912af63f525f6830f724827e262f42 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round17.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..5797e4fc935d04ed0c43a3e8a31a365f50acd70c --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc952fe4c8ad4ef2ce347a0fec31859d5ea7286b61fbdbd33f62cc59fc6a1db8 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round2.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..692d714530be55bd62357c24ee0d3e2705d14e91 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b91e5497d58df5e6c88cfd96c80538d3b0489625e9c1844bc7134fc1819c132 +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round20.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..ddababe00b778c754f15cb4fe71ce598461f0598 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41b1e011c681191accbfee628a5d5367b45a57bb25b21cc0fb2dcc706842da26 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round5.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..21c277b0c4680d7b722b1a2d66a979b78293f69c --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909ae260c1b95d5769bb16ca3cc0ea471dd2f0a32764d5950ed946519bbdfa90 +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round7.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..6639b852e17339f453e4236dedc364f49a24f58f --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb5bbcfb7d060129e306207445c42c34099a7c3d3df2de2dd80ec00e2a81b15 +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_trainer_state.json b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..104caa1c68c321fc3b66958cae30fb4f4565a7e3 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 1.7036350965499878, + "learning_rate": 2e-05, + "loss": 1.1502, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 0.733051061630249, + "learning_rate": 2e-05, + "loss": 0.3144, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 3.021022081375122, + "learning_rate": 2e-05, + "loss": 1.523, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 0.6244669556617737, + "learning_rate": 2e-05, + "loss": 0.9215, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 1.675452470779419, + "learning_rate": 2e-05, + "loss": 1.2749, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 0.2071010321378708, + "learning_rate": 2e-05, + "loss": 0.2043, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 0.45165616273880005, + "learning_rate": 2e-05, + "loss": 0.2592, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 0.9154694080352783, + "learning_rate": 2e-05, + "loss": 1.0788, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 0.44769397377967834, + "learning_rate": 2e-05, + "loss": 0.672, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.001409649848938, + "learning_rate": 2e-05, + "loss": 0.7424, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 0.2860804498195648, + "learning_rate": 2e-05, + "loss": 0.7084, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 0.4580197036266327, + "learning_rate": 2e-05, + "loss": 1.1849, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 0.4905541241168976, + "learning_rate": 2e-05, + "loss": 0.7166, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 1.433603048324585, + "learning_rate": 2e-05, + "loss": 1.5247, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 2.386955738067627, + "learning_rate": 2e-05, + "loss": 0.8547, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 2.032757043838501, + "learning_rate": 2e-05, + "loss": 0.5488, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 1.0941940546035767, + "learning_rate": 2e-05, + "loss": 0.9551, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 1.461041808128357, + "learning_rate": 2e-05, + "loss": 1.1186, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 0.46292173862457275, + "learning_rate": 2e-05, + "loss": 0.9941, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 0.46523961424827576, + "learning_rate": 2e-05, + "loss": 0.99, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 0.5094814896583557, + "learning_rate": 2e-05, + "loss": 1.0255, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 3.24894642829895, + "learning_rate": 2e-05, + "loss": 1.3442, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 3.7670817375183105, + "learning_rate": 2e-05, + "loss": 1.279, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 2.1132254600524902, + "learning_rate": 2e-05, + "loss": 1.7001, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 0.593248724937439, + "learning_rate": 2e-05, + "loss": 0.8884, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 1.4078608751296997, + "learning_rate": 2e-05, + "loss": 0.8091, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 0.3955836892127991, + "learning_rate": 2e-05, + "loss": 0.3546, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 0.9244691729545593, + "learning_rate": 2e-05, + "loss": 1.437, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 0.4643814265727997, + "learning_rate": 2e-05, + "loss": 0.881, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 0.41819217801094055, + "learning_rate": 2e-05, + "loss": 0.6405, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 0.7221791744232178, + "learning_rate": 2e-05, + "loss": 0.7172, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 0.44450488686561584, + "learning_rate": 2e-05, + "loss": 0.7196, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 1.463599443435669, + "learning_rate": 2e-05, + "loss": 1.4753, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 0.2606247365474701, + "learning_rate": 2e-05, + "loss": 0.8865, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 0.3822779655456543, + "learning_rate": 2e-05, + "loss": 0.7243, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 0.314899206161499, + "learning_rate": 2e-05, + "loss": 0.9963, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 0.47478482127189636, + "learning_rate": 2e-05, + "loss": 0.7358, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 3.180941581726074, + "learning_rate": 2e-05, + "loss": 1.546, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 0.392020046710968, + "learning_rate": 2e-05, + "loss": 0.4863, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 0.4663325548171997, + "learning_rate": 2e-05, + "loss": 0.3802, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 0.5237138867378235, + "learning_rate": 2e-05, + "loss": 0.5043, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 0.8400606513023376, + "learning_rate": 2e-05, + "loss": 0.8792, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 0.3281240463256836, + "learning_rate": 2e-05, + "loss": 0.735, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 1.076886773109436, + "learning_rate": 2e-05, + "loss": 0.9669, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 0.6442875266075134, + "learning_rate": 2e-05, + "loss": 0.6857, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 1.3491824865341187, + "learning_rate": 2e-05, + "loss": 0.7857, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 0.4119647443294525, + "learning_rate": 2e-05, + "loss": 0.5265, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 0.9270315766334534, + "learning_rate": 2e-05, + "loss": 1.2191, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 2.081554905117491e+16, + "train_loss": 0.8912827993176647, + "train_runtime": 342.0553, + "train_samples_per_second": 1.134, + "train_steps_per_second": 0.284 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2.081554905117491e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round10.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..6d251c9c14ea651018a48f1e1be254651c9735eb --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76222740e5b1eb701df8242a79fa98659c625a40a9d557ff4ee9ab9793e6a2de +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round12.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea9033974a1004ac95117874e260642b7b4f79c8 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af4abb1969b8895e24009b3474b99f4b40c4a44b2056fb6935f1f5c9fbd2b7de +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round15.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..04783e29e7d8d445f2135a725146e6ca38fa21b6 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aed5d456627b3b084bed1c6c4f40781201a9314e9ab4c7fcd0045aa87653ad93 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round17.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..d9b7fdf5e48f8c01ed52bfc9bf43600664eb4e87 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974c3d90766732a37f45318d13fa049f577025980b07e7b331d04ffe0c7db571 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round2.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..4969e35b86cdf97674737cda7d4a82ef46f8b2e5 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:369ee76d02588c766be21d8792a4eb5096425d0505d617ed47d36b31ab2a7489 +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round20.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..88dbf6232ea449dde8b5ec452689126e3f24604d --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:724a4cb19d6636ec4851b473dc93dfec177f1eb18c9610b52336f58fe4ac864e +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round5.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..df5249c55e84b4b270de60c76f61a252f8c70745 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:296b10e3bc3a9fa0d2250f938b2eecca029ba36b1dced5a077b832d32301cc42 +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round7.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..15d2c98fc7a9739d1eb39c74d7b01836e25edab7 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2799db2855c1d10a215ade45151d9ac24e0793f29bfafc62c45ef363f459e35e +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_trainer_state.json b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..3e140fca24b6952d351b949c9061e042198c23b2 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 1.3807806968688965, + "learning_rate": 2e-05, + "loss": 1.2215, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 5.47310209274292, + "learning_rate": 2e-05, + "loss": 1.7948, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 4.091208457946777, + "learning_rate": 2e-05, + "loss": 1.4245, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 2.522712230682373, + "learning_rate": 2e-05, + "loss": 1.2455, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 2.400545835494995, + "learning_rate": 2e-05, + "loss": 1.4473, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 2.147249937057495, + "learning_rate": 2e-05, + "loss": 0.648, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 0.6440826654434204, + "learning_rate": 2e-05, + "loss": 0.1022, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 1.4986751079559326, + "learning_rate": 2e-05, + "loss": 1.5813, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 2.2775418758392334, + "learning_rate": 2e-05, + "loss": 0.7531, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 3.2079670429229736, + "learning_rate": 2e-05, + "loss": 1.6908, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 2.16922926902771, + "learning_rate": 2e-05, + "loss": 1.5928, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 2.276587724685669, + "learning_rate": 2e-05, + "loss": 1.4918, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 1.4131243228912354, + "learning_rate": 2e-05, + "loss": 1.7804, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 3.375476121902466, + "learning_rate": 2e-05, + "loss": 1.9648, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 2.6980457305908203, + "learning_rate": 2e-05, + "loss": 1.9027, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 1.1185120344161987, + "learning_rate": 2e-05, + "loss": 1.2945, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 1.5742499828338623, + "learning_rate": 2e-05, + "loss": 2.3652, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 1.6757092475891113, + "learning_rate": 2e-05, + "loss": 1.5789, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 1.5958377122879028, + "learning_rate": 2e-05, + "loss": 1.4983, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 1.3994206190109253, + "learning_rate": 2e-05, + "loss": 0.8934, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 0.8964346647262573, + "learning_rate": 2e-05, + "loss": 0.7392, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 1.5910592079162598, + "learning_rate": 2e-05, + "loss": 0.8057, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 0.8048728704452515, + "learning_rate": 2e-05, + "loss": 0.7514, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 3.0406651496887207, + "learning_rate": 2e-05, + "loss": 1.271, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 2.1475746631622314, + "learning_rate": 2e-05, + "loss": 1.3316, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 1.973347544670105, + "learning_rate": 2e-05, + "loss": 0.9409, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 0.5019800662994385, + "learning_rate": 2e-05, + "loss": 0.5754, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 2.1202926635742188, + "learning_rate": 2e-05, + "loss": 1.3977, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 1.2852915525436401, + "learning_rate": 2e-05, + "loss": 1.6778, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 1.093619465827942, + "learning_rate": 2e-05, + "loss": 0.8222, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 0.7490342259407043, + "learning_rate": 2e-05, + "loss": 0.6013, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 2.6893742084503174, + "learning_rate": 2e-05, + "loss": 1.2905, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 3.0177910327911377, + "learning_rate": 2e-05, + "loss": 1.7748, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 1.123380422592163, + "learning_rate": 2e-05, + "loss": 0.8262, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 1.6035982370376587, + "learning_rate": 2e-05, + "loss": 0.798, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 0.7902660965919495, + "learning_rate": 2e-05, + "loss": 1.0709, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 1.8285802602767944, + "learning_rate": 2e-05, + "loss": 1.0743, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 2.9130942821502686, + "learning_rate": 2e-05, + "loss": 2.0891, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 1.4661481380462646, + "learning_rate": 2e-05, + "loss": 1.1128, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 2.301260471343994, + "learning_rate": 2e-05, + "loss": 1.6207, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 1.637123465538025, + "learning_rate": 2e-05, + "loss": 1.3459, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 1.056007742881775, + "learning_rate": 2e-05, + "loss": 1.2215, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 1.2907710075378418, + "learning_rate": 2e-05, + "loss": 1.6295, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 1.3023312091827393, + "learning_rate": 2e-05, + "loss": 1.0457, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 0.39116430282592773, + "learning_rate": 2e-05, + "loss": 1.1983, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 0.9639070630073547, + "learning_rate": 2e-05, + "loss": 1.1595, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 1.6161588430404663, + "learning_rate": 2e-05, + "loss": 1.2601, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 2.380856513977051, + "learning_rate": 2e-05, + "loss": 0.6827, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 2.074250449204019e+16, + "train_loss": 1.2486689803526574, + "train_runtime": 347.5167, + "train_samples_per_second": 1.116, + "train_steps_per_second": 0.279 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2.074250449204019e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round10.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..c2fe516cc7af4b02665be3f26600bab78cc19f59 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09cd08a35ceaf65f8b4b8c2b3943b855c5e7348c334be564b82fa3d4dc95bad8 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round12.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ead1ef3e8b37b4658a64567bd6764b15e870cf7 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6ce216ab0402be87c84d6af509a84f0ce168cf22217ee6eb8263e51dd6142d6 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round15.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..686f977d566cce4ca7aa2c392e85c88a7cadf747 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0970a229f1f57205586ba91eed0371c4af2fe6fbfaa4a6ec8f6aa437d820ac8d +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round17.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..f80e9e37b9cf835e1bc15dbd3e94f73e8637b168 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b873fa30a8c5d382069a0c536ec17db452e64f48a4c4c7b3c9dafca48b601f1d +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round2.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..c42b9042ee5bd48d6a8055096f971a5b331e7eb7 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99c23eb08adf5a7a45e3b25bc3f6dd68703808836dcdddf7a33aa4d8121f930d +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round20.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..6218c20cede4e1bbe3986e7ea1039624d513dce0 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89e5cd78ffe0c1d359e335003dc27cd066c19e38a2b3a47878ed61c28f6f3bce +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round5.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..6b610a2a8da55f3c9e9faa844db2c7465354fdfd --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd267f04fa29a90135be9135767d57deae0b1589d28cfac8bac8f884c72925d9 +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round7.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..5a7c9be4152d5582d1a05b4de71f6755a93cc15e --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ad78d33c14d82ffae452f34515cbdfc32084de4c73a34a2724c39f4b27cb71e +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_trainer_state.json b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..122520ce04d7f523e4c9e69e1bbee2e6e8c1a78e --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 0.2117251455783844, + "learning_rate": 2e-05, + "loss": 0.18, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 3.18235445022583, + "learning_rate": 2e-05, + "loss": 1.0332, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 0.6543071269989014, + "learning_rate": 2e-05, + "loss": 0.1466, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 0.04175340011715889, + "learning_rate": 2e-05, + "loss": 0.0721, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 5.604257106781006, + "learning_rate": 2e-05, + "loss": 2.105, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 1.9834911823272705, + "learning_rate": 2e-05, + "loss": 1.3383, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 0.8079286217689514, + "learning_rate": 2e-05, + "loss": 0.3371, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 1.3316236734390259, + "learning_rate": 2e-05, + "loss": 0.1855, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 5.571617126464844, + "learning_rate": 2e-05, + "loss": 1.2537, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 0.20295646786689758, + "learning_rate": 2e-05, + "loss": 0.5626, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 1.204951286315918, + "learning_rate": 2e-05, + "loss": 0.4711, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 0.0033123709727078676, + "learning_rate": 2e-05, + "loss": 0.0308, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 0.5536037683486938, + "learning_rate": 2e-05, + "loss": 0.3015, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 0.8447141647338867, + "learning_rate": 2e-05, + "loss": 0.2536, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 0.2806701064109802, + "learning_rate": 2e-05, + "loss": 0.8265, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 2.9358584880828857, + "learning_rate": 2e-05, + "loss": 0.7986, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 1.8837885856628418, + "learning_rate": 2e-05, + "loss": 0.869, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 0.5349599719047546, + "learning_rate": 2e-05, + "loss": 0.6375, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 5.246908664703369, + "learning_rate": 2e-05, + "loss": 0.7918, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 0.749443769454956, + "learning_rate": 2e-05, + "loss": 0.1354, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 1.6047642230987549, + "learning_rate": 2e-05, + "loss": 0.5694, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 0.5995208024978638, + "learning_rate": 2e-05, + "loss": 0.3092, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 0.5239794850349426, + "learning_rate": 2e-05, + "loss": 0.3072, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 1.1799319982528687, + "learning_rate": 2e-05, + "loss": 0.2645, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 1.342455506324768, + "learning_rate": 2e-05, + "loss": 0.7667, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 1.0981117486953735, + "learning_rate": 2e-05, + "loss": 1.2677, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 0.14960458874702454, + "learning_rate": 2e-05, + "loss": 0.1341, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 0.7550680041313171, + "learning_rate": 2e-05, + "loss": 0.8213, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 1.3047091960906982, + "learning_rate": 2e-05, + "loss": 1.2189, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 2.0745363235473633, + "learning_rate": 2e-05, + "loss": 0.3516, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 0.29618772864341736, + "learning_rate": 2e-05, + "loss": 0.7966, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 0.525123655796051, + "learning_rate": 2e-05, + "loss": 0.3242, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 0.7060384154319763, + "learning_rate": 2e-05, + "loss": 0.8251, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 1.7675563097000122, + "learning_rate": 2e-05, + "loss": 1.0343, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 0.7637777924537659, + "learning_rate": 2e-05, + "loss": 0.6064, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 0.054561272263526917, + "learning_rate": 2e-05, + "loss": 0.0334, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 0.9899354577064514, + "learning_rate": 2e-05, + "loss": 0.5814, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 0.8481895923614502, + "learning_rate": 2e-05, + "loss": 0.4284, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 1.1497780084609985, + "learning_rate": 2e-05, + "loss": 0.8091, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 0.7620788216590881, + "learning_rate": 2e-05, + "loss": 0.5266, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 0.2328740805387497, + "learning_rate": 2e-05, + "loss": 0.5719, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 0.554115355014801, + "learning_rate": 2e-05, + "loss": 0.3597, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 0.5471949577331543, + "learning_rate": 2e-05, + "loss": 0.4508, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 0.12688428163528442, + "learning_rate": 2e-05, + "loss": 0.2716, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 0.4092620015144348, + "learning_rate": 2e-05, + "loss": 0.3383, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 0.5129708647727966, + "learning_rate": 2e-05, + "loss": 0.49, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 1.2216758728027344, + "learning_rate": 2e-05, + "loss": 0.6369, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 0.22560183703899384, + "learning_rate": 2e-05, + "loss": 0.1846, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 2.474919844852531e+16, + "train_loss": 0.5777954735706762, + "train_runtime": 383.7331, + "train_samples_per_second": 1.011, + "train_steps_per_second": 0.253 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2.474919844852531e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round10.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..7e9e9d2802de0a3f7ff234b2fe8468fbe06e9ee8 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6be4a24c206539e1eb76bd167a99237ad2079cd0c7f4d1d0d967c934c7a42f5a +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round12.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..b0b3e9b0369bb29cdc2c9509294ba987c7c69e49 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9496e73a5578309bf0cfe6644573804d2fbf7d9cb8cb4b232f1d18b4281067a2 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round15.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..e4e7825c3d01262af7740e6ddd93264025ee92d2 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8022741f42979460f25196487d1d52594533ee0137c39c7e2456636982cae1b7 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round17.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..057a5f6460ad76255da80ef3d66a9ddb86b3be23 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dbd2c2069712b9329314219db25406879f680659d2121794cccee5d386704d9 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round2.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..99b9b9e6edfbe6b6832fa05ad10b7a0a68ca0f8b --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:769b05b595432fbf5a675d50da02aba0d708072135a862a4205947bf9db8323f +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round20.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..06ae49a70a4de05aefad019d4fa82ba5834338a7 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ac1d59cf33c9fc936939fe540a8d331cb67026ec24b8b43f5b56e6bfd23b581 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round5.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..dd1905e2383ab5fd725865d11fadf07577fe9ad6 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d03bbb0e1ff44be16912be2669c565965c7ea7c7cba83c2fa5d6f4156a8021b +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round7.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..86cdb38eee3b26c71f96bbf8a0867a88e8446564 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11e3f2599e3937b2b81dcaf0981c0c01dd67fdea4cbc3a91082fe343cb45f178 +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_trainer_state.json b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..76941ef8e998e491c29bacc94a8fe69b855789b7 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/6_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 1.5049797296524048, + "learning_rate": 2e-05, + "loss": 2.6945, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 1.4321800470352173, + "learning_rate": 2e-05, + "loss": 1.6925, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 2.435985803604126, + "learning_rate": 2e-05, + "loss": 1.8773, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 4.95011568069458, + "learning_rate": 2e-05, + "loss": 2.0518, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 1.513716459274292, + "learning_rate": 2e-05, + "loss": 1.7783, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 1.7388437986373901, + "learning_rate": 2e-05, + "loss": 1.9481, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 5.991330146789551, + "learning_rate": 2e-05, + "loss": 3.0936, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 2.460019111633301, + "learning_rate": 2e-05, + "loss": 2.8943, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 3.995192050933838, + "learning_rate": 2e-05, + "loss": 2.8079, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.8898335695266724, + "learning_rate": 2e-05, + "loss": 1.2867, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 2.0615501403808594, + "learning_rate": 2e-05, + "loss": 0.8667, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 3.1899831295013428, + "learning_rate": 2e-05, + "loss": 2.2847, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 4.016243934631348, + "learning_rate": 2e-05, + "loss": 1.9658, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 2.5904541015625, + "learning_rate": 2e-05, + "loss": 1.9854, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 1.7917367219924927, + "learning_rate": 2e-05, + "loss": 2.0055, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 4.592316627502441, + "learning_rate": 2e-05, + "loss": 2.3751, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 5.915355205535889, + "learning_rate": 2e-05, + "loss": 0.9125, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 3.8353493213653564, + "learning_rate": 2e-05, + "loss": 2.0201, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 2.283921003341675, + "learning_rate": 2e-05, + "loss": 2.4454, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 3.881675958633423, + "learning_rate": 2e-05, + "loss": 2.3843, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 4.092883586883545, + "learning_rate": 2e-05, + "loss": 1.8022, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 3.820995569229126, + "learning_rate": 2e-05, + "loss": 2.5039, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 1.8063539266586304, + "learning_rate": 2e-05, + "loss": 1.9248, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 3.515434741973877, + "learning_rate": 2e-05, + "loss": 1.9624, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 2.6817257404327393, + "learning_rate": 2e-05, + "loss": 2.6696, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 6.879681587219238, + "learning_rate": 2e-05, + "loss": 2.4385, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 3.621436595916748, + "learning_rate": 2e-05, + "loss": 2.0796, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 5.467465877532959, + "learning_rate": 2e-05, + "loss": 2.2365, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 2.066556692123413, + "learning_rate": 2e-05, + "loss": 1.7823, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 5.411770820617676, + "learning_rate": 2e-05, + "loss": 2.8374, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 10.843588829040527, + "learning_rate": 2e-05, + "loss": 2.1689, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 2.4762089252471924, + "learning_rate": 2e-05, + "loss": 1.2102, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 1.8696882724761963, + "learning_rate": 2e-05, + "loss": 1.9268, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 3.962611675262451, + "learning_rate": 2e-05, + "loss": 2.3607, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 2.3166444301605225, + "learning_rate": 2e-05, + "loss": 2.4678, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 8.877740859985352, + "learning_rate": 2e-05, + "loss": 2.9136, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 4.233133792877197, + "learning_rate": 2e-05, + "loss": 1.366, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 9.046269416809082, + "learning_rate": 2e-05, + "loss": 1.5894, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 4.931369781494141, + "learning_rate": 2e-05, + "loss": 2.5403, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 12.060054779052734, + "learning_rate": 2e-05, + "loss": 2.4096, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 3.3465631008148193, + "learning_rate": 2e-05, + "loss": 1.9784, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 2.3073983192443848, + "learning_rate": 2e-05, + "loss": 1.3059, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 1.346895456314087, + "learning_rate": 2e-05, + "loss": 0.9115, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 4.645529747009277, + "learning_rate": 2e-05, + "loss": 0.8408, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 5.669789791107178, + "learning_rate": 2e-05, + "loss": 2.3668, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 1.2507057189941406, + "learning_rate": 2e-05, + "loss": 1.4261, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 4.535902976989746, + "learning_rate": 2e-05, + "loss": 1.9733, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 1.9077485799789429, + "learning_rate": 2e-05, + "loss": 1.6788, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 2784250118012928.0, + "train_loss": 2.036776041247181, + "train_runtime": 204.8699, + "train_samples_per_second": 1.894, + "train_steps_per_second": 0.473 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2784250118012928.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round10.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..1d6599b5e95bef3363a6f588a3b156b95ac6e989 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35985975a45380106d92a65460d92adabd18feaee6b4ea22b74fd0f3e9988143 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round12.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..554b236809d6f7613af62111ca3cab232ffd1c01 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25fb64114c5d2d09c63e2451880e2b806786ae0ddf3d341f98415790534f1cc +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round15.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad5f82617505629fe1f6e6845f59c673321c338d --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26680cced61f50d73f1f70fb9a72f4800878587d3007be6d5b80a9f8db56d07d +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round17.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..49dbc8fa7767dca24893015bc2d7901a871e3750 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:189f3021ef68e03332c7014953fcf1edb8205a3c1624de679e27840db873cee9 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round2.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..062ad256e24ce42de30842800e3b6483ae6eac35 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edb48b499f4762c82776ae05dbcb4eb99d7f7aa651dc43c4e30e1b5fe764e893 +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round20.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..d3f13f3e924a1291353bd97928478c9e34f36611 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54432ad49b6fc5cc76b28826e5a18205eb938a9e9817fb17aca09e7cf0a6bd05 +size 791578182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round5.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..89a80bbedf0953b525eb0be5d571e00f743bc4e6 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ba14cc257dca96cfb12dac212054fb530556ffac4246551a91805c6910cf83 +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round7.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..deb5290c73cac78ad42288a02a25725516d8bfc1 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8056d02556354224d5fbe381852a6ec60e4c64fcb5bb6c2a578cb352344362da +size 791576546 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_trainer_state.json b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..6f941512fbc638c80ae7dca5d373c8667b9568f7 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/7_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 3.3560197353363037, + "learning_rate": 2e-05, + "loss": 2.3487, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 3.160369634628296, + "learning_rate": 2e-05, + "loss": 1.7639, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 3.14260196685791, + "learning_rate": 2e-05, + "loss": 1.0903, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 3.696504592895508, + "learning_rate": 2e-05, + "loss": 1.1641, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 2.752567768096924, + "learning_rate": 2e-05, + "loss": 1.9624, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 1.2239468097686768, + "learning_rate": 2e-05, + "loss": 1.1094, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 1.6693317890167236, + "learning_rate": 2e-05, + "loss": 1.2449, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 2.7668395042419434, + "learning_rate": 2e-05, + "loss": 1.5616, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 2.974491596221924, + "learning_rate": 2e-05, + "loss": 1.2247, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.0505852699279785, + "learning_rate": 2e-05, + "loss": 0.3947, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 2.4126343727111816, + "learning_rate": 2e-05, + "loss": 1.2549, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 2.14699125289917, + "learning_rate": 2e-05, + "loss": 1.3632, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 2.0265958309173584, + "learning_rate": 2e-05, + "loss": 1.7524, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 1.7980031967163086, + "learning_rate": 2e-05, + "loss": 1.0669, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 2.1396403312683105, + "learning_rate": 2e-05, + "loss": 0.9769, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 1.1520572900772095, + "learning_rate": 2e-05, + "loss": 1.1672, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 1.7930545806884766, + "learning_rate": 2e-05, + "loss": 0.8409, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 3.9057226181030273, + "learning_rate": 2e-05, + "loss": 1.5628, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 2.967085123062134, + "learning_rate": 2e-05, + "loss": 3.0918, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 1.8915605545043945, + "learning_rate": 2e-05, + "loss": 0.8876, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 2.6781511306762695, + "learning_rate": 2e-05, + "loss": 1.3569, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 1.9666043519973755, + "learning_rate": 2e-05, + "loss": 1.0566, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 2.275099515914917, + "learning_rate": 2e-05, + "loss": 1.3208, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 2.330568313598633, + "learning_rate": 2e-05, + "loss": 0.8591, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 2.4660608768463135, + "learning_rate": 2e-05, + "loss": 1.0113, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 3.656764268875122, + "learning_rate": 2e-05, + "loss": 0.8203, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 3.277796745300293, + "learning_rate": 2e-05, + "loss": 0.8817, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 1.4417256116867065, + "learning_rate": 2e-05, + "loss": 1.6225, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 1.9861325025558472, + "learning_rate": 2e-05, + "loss": 0.9303, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 1.4174336194992065, + "learning_rate": 2e-05, + "loss": 0.8621, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 0.899995744228363, + "learning_rate": 2e-05, + "loss": 0.3048, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 1.2613917589187622, + "learning_rate": 2e-05, + "loss": 1.0401, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 1.7970860004425049, + "learning_rate": 2e-05, + "loss": 0.729, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 3.2513511180877686, + "learning_rate": 2e-05, + "loss": 1.1038, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 2.9402143955230713, + "learning_rate": 2e-05, + "loss": 0.946, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 1.1939585208892822, + "learning_rate": 2e-05, + "loss": 1.0559, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 8.383438110351562, + "learning_rate": 2e-05, + "loss": 2.4656, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 1.598691463470459, + "learning_rate": 2e-05, + "loss": 1.2479, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 5.320521831512451, + "learning_rate": 2e-05, + "loss": 2.1267, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 2.8301825523376465, + "learning_rate": 2e-05, + "loss": 1.7151, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 3.8781251907348633, + "learning_rate": 2e-05, + "loss": 1.9324, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 2.334101438522339, + "learning_rate": 2e-05, + "loss": 1.3911, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 2.8089377880096436, + "learning_rate": 2e-05, + "loss": 1.0724, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 2.9710512161254883, + "learning_rate": 2e-05, + "loss": 3.3245, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 3.564450740814209, + "learning_rate": 2e-05, + "loss": 3.2368, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 5.510385513305664, + "learning_rate": 2e-05, + "loss": 1.2651, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 0.7583741545677185, + "learning_rate": 2e-05, + "loss": 1.0073, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 1.4346013069152832, + "learning_rate": 2e-05, + "loss": 1.7416, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 8765330117623808.0, + "train_loss": 1.3811867753254998, + "train_runtime": 315.6495, + "train_samples_per_second": 1.229, + "train_steps_per_second": 0.307 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 8765330117623808.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round10.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..55e4fd741beff0c97356506334c427469622f3e4 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e0007a3c3086bbbf711fdee4f92d723ddd2cae6850f31241ae91691e317fb4 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round12.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..6b7d26e6609c5f55354ca3169e23ee665bfd0751 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83e8bf59fbd2d60a166578520e6bbcd8f3d60c3b946fffe87b44b52667529764 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round15.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..7d87994867a20b93f998d434132bbfc62fd44a5e --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8aa11c9236bcd2ffb075704715aac9d88b63ef2c5f26ffe48db781612f933d1 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round17.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..537095ddc5428f122a5304ccc3572f06513f5cc4 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f534d04ae3fafed57229ce89f45c37f3fceb9e9e4a506cc8f50a6190664ce0ec +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round2.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..f4c29dcc8c876662fed6ee053e1710673193a5ab --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167cf1a90e083386073d32bcb9318e305a97eae91580e8d8045a002dab02a3ce +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round20.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..b813978885f3de2d8cbae40d5fa4780f47276c76 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b4639bd702443fa9ad19a9351d7a1aa9f962daa5eb8d7bcaec4cdc37590e061 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round5.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..09ed0b16af50748804f793eab57b5fe12d53b709 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e3408e24980f5c2e450673273ce904772c9b74f92502187b4effbd414414c3a +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round7.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..8cf64d9efeeb33d8d103320e08c95dda650cb913 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff51260e05bd43da61e0ec4d2d8aa190db76d11183e7819285f34d566f94b979 +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_trainer_state.json b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..5387d42b75a90a605a49a5076ec0580afd1afc28 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/8_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 1.567240834236145, + "learning_rate": 2e-05, + "loss": 1.9056, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 2.8930792808532715, + "learning_rate": 2e-05, + "loss": 1.5888, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 5.412844657897949, + "learning_rate": 2e-05, + "loss": 2.1581, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 5.596451282501221, + "learning_rate": 2e-05, + "loss": 3.5834, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 10.479601860046387, + "learning_rate": 2e-05, + "loss": 4.2448, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 5.0345659255981445, + "learning_rate": 2e-05, + "loss": 1.8788, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 10.572972297668457, + "learning_rate": 2e-05, + "loss": 2.336, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 3.583897352218628, + "learning_rate": 2e-05, + "loss": 1.8594, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 4.205115795135498, + "learning_rate": 2e-05, + "loss": 2.176, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 1.4592698812484741, + "learning_rate": 2e-05, + "loss": 0.6842, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 6.050905704498291, + "learning_rate": 2e-05, + "loss": 4.5928, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 4.205760478973389, + "learning_rate": 2e-05, + "loss": 4.0139, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 1.8052587509155273, + "learning_rate": 2e-05, + "loss": 1.0971, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 4.417219638824463, + "learning_rate": 2e-05, + "loss": 3.3815, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 3.5604987144470215, + "learning_rate": 2e-05, + "loss": 1.4707, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 3.0618865489959717, + "learning_rate": 2e-05, + "loss": 1.4592, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 1.774032711982727, + "learning_rate": 2e-05, + "loss": 0.9858, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 5.8894453048706055, + "learning_rate": 2e-05, + "loss": 3.0427, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 6.161194801330566, + "learning_rate": 2e-05, + "loss": 2.1527, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 3.209322929382324, + "learning_rate": 2e-05, + "loss": 1.8922, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 3.414322853088379, + "learning_rate": 2e-05, + "loss": 1.6244, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 5.164395332336426, + "learning_rate": 2e-05, + "loss": 1.5021, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 4.776827335357666, + "learning_rate": 2e-05, + "loss": 2.2015, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 2.9819095134735107, + "learning_rate": 2e-05, + "loss": 1.8704, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 4.729798793792725, + "learning_rate": 2e-05, + "loss": 4.5408, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 1.5492188930511475, + "learning_rate": 2e-05, + "loss": 1.1445, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 1.8185083866119385, + "learning_rate": 2e-05, + "loss": 1.8232, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 2.1678011417388916, + "learning_rate": 2e-05, + "loss": 1.4547, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 4.822456359863281, + "learning_rate": 2e-05, + "loss": 1.7718, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 3.002695083618164, + "learning_rate": 2e-05, + "loss": 1.7484, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 1.6367547512054443, + "learning_rate": 2e-05, + "loss": 1.6428, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 3.8784584999084473, + "learning_rate": 2e-05, + "loss": 2.5032, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 6.652468681335449, + "learning_rate": 2e-05, + "loss": 2.1156, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 2.516002655029297, + "learning_rate": 2e-05, + "loss": 2.0728, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 2.723644971847534, + "learning_rate": 2e-05, + "loss": 1.4052, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 1.2017160654067993, + "learning_rate": 2e-05, + "loss": 2.3015, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 4.984076499938965, + "learning_rate": 2e-05, + "loss": 1.1909, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 2.584172010421753, + "learning_rate": 2e-05, + "loss": 2.2598, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 3.8633651733398438, + "learning_rate": 2e-05, + "loss": 2.1217, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 0.9916099309921265, + "learning_rate": 2e-05, + "loss": 0.4458, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 2.272331714630127, + "learning_rate": 2e-05, + "loss": 2.23, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 4.3678717613220215, + "learning_rate": 2e-05, + "loss": 2.9695, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 5.485471248626709, + "learning_rate": 2e-05, + "loss": 1.9276, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 2.6858837604522705, + "learning_rate": 2e-05, + "loss": 1.3158, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 2.9462811946868896, + "learning_rate": 2e-05, + "loss": 3.1361, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 3.1007044315338135, + "learning_rate": 2e-05, + "loss": 1.1987, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 3.097275733947754, + "learning_rate": 2e-05, + "loss": 1.3301, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 1.0503190755844116, + "learning_rate": 2e-05, + "loss": 1.5931, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 2138591853543424.0, + "train_loss": 2.0744568293856593, + "train_runtime": 201.1337, + "train_samples_per_second": 1.929, + "train_steps_per_second": 0.482 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2138591853543424.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round10.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..d2fe510cce0fac798ea9168580152f369e4e2cbe --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a4e78b349e1701aea56582a76b0c0d791241a0877a9572114bb04c2bd90bf0 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round12.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..934673b2035e7a7647b2f77e2dd3b42bd7dcc744 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceafa00e53b003e67f47fc8a6c86e221d29335cf9474cac7eb408444e4aac078 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round15.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..990fcba9e3135669f8d0454fddc0f0c60de7e3e6 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:202b1b9e3882dfe8e343a7a04eb60c7ca896b835401755ee2c368efb6878798e +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round17.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..82d35edb39986dc92bc7e025d0ff894c56b620d6 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b33618694c3b0de50f08415a3957eb0da794726eb5abc33a7ff5ebee09d37455 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round2.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..9633f3e0b8471c3523e0939982bb6d123356d4b9 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22ba344d499a42b554df7b8b2316f944a38fedc43cd43a9ebee239a218d12306 +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round20.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..fbf9a099e5f32326719fb523644a5437b2830b0b --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03cfa9d7eb3aee53168537064b6d4d0d2cf5a92a0759a881a140b58d4c65c448 +size 368443438 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round5.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..eef7fa13d9ac8642f8adb395b87dd10de6547b45 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b25afc767cb0e751bd7a7498a90ac1a8ea292021fcb04a823dcdd763e3d1ecfe +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round7.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c6402c361f5a070b72f51a72760f3f8044f99b0 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86845f17000d4fe49c926417e1c7cfe8e0b7e950449dfb0cbac9b5312eb59d26 +size 368442474 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_trainer_state.json b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..9d75239b6cb81791dca89d71ff108928ef8b62f1 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/9_trainer_state.json @@ -0,0 +1,378 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 97, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.020618556701030927, + "grad_norm": 4.343683242797852, + "learning_rate": 2e-05, + "loss": 2.585, + "step": 2 + }, + { + "epoch": 0.041237113402061855, + "grad_norm": 1.786333441734314, + "learning_rate": 2e-05, + "loss": 1.2904, + "step": 4 + }, + { + "epoch": 0.061855670103092786, + "grad_norm": 2.5530319213867188, + "learning_rate": 2e-05, + "loss": 1.9012, + "step": 6 + }, + { + "epoch": 0.08247422680412371, + "grad_norm": 3.4871766567230225, + "learning_rate": 2e-05, + "loss": 1.9292, + "step": 8 + }, + { + "epoch": 0.10309278350515463, + "grad_norm": 3.1063528060913086, + "learning_rate": 2e-05, + "loss": 2.1922, + "step": 10 + }, + { + "epoch": 0.12371134020618557, + "grad_norm": 2.8573386669158936, + "learning_rate": 2e-05, + "loss": 1.5091, + "step": 12 + }, + { + "epoch": 0.14432989690721648, + "grad_norm": 3.874681234359741, + "learning_rate": 2e-05, + "loss": 2.6199, + "step": 14 + }, + { + "epoch": 0.16494845360824742, + "grad_norm": 1.607343077659607, + "learning_rate": 2e-05, + "loss": 1.5671, + "step": 16 + }, + { + "epoch": 0.18556701030927836, + "grad_norm": 3.9228110313415527, + "learning_rate": 2e-05, + "loss": 2.1243, + "step": 18 + }, + { + "epoch": 0.20618556701030927, + "grad_norm": 2.8677752017974854, + "learning_rate": 2e-05, + "loss": 1.1915, + "step": 20 + }, + { + "epoch": 0.2268041237113402, + "grad_norm": 1.7636340856552124, + "learning_rate": 2e-05, + "loss": 1.1306, + "step": 22 + }, + { + "epoch": 0.24742268041237114, + "grad_norm": 7.917425155639648, + "learning_rate": 2e-05, + "loss": 2.2015, + "step": 24 + }, + { + "epoch": 0.26804123711340205, + "grad_norm": 8.771407127380371, + "learning_rate": 2e-05, + "loss": 1.8009, + "step": 26 + }, + { + "epoch": 0.28865979381443296, + "grad_norm": 3.2998952865600586, + "learning_rate": 2e-05, + "loss": 1.5343, + "step": 28 + }, + { + "epoch": 0.30927835051546393, + "grad_norm": 2.821490526199341, + "learning_rate": 2e-05, + "loss": 1.8823, + "step": 30 + }, + { + "epoch": 0.32989690721649484, + "grad_norm": 10.080333709716797, + "learning_rate": 2e-05, + "loss": 2.2163, + "step": 32 + }, + { + "epoch": 0.35051546391752575, + "grad_norm": 3.2131407260894775, + "learning_rate": 2e-05, + "loss": 0.8795, + "step": 34 + }, + { + "epoch": 0.3711340206185567, + "grad_norm": 4.264321804046631, + "learning_rate": 2e-05, + "loss": 1.9128, + "step": 36 + }, + { + "epoch": 0.3917525773195876, + "grad_norm": 2.857560396194458, + "learning_rate": 2e-05, + "loss": 2.3895, + "step": 38 + }, + { + "epoch": 0.41237113402061853, + "grad_norm": 1.894586443901062, + "learning_rate": 2e-05, + "loss": 1.7633, + "step": 40 + }, + { + "epoch": 0.4329896907216495, + "grad_norm": 5.137567520141602, + "learning_rate": 2e-05, + "loss": 2.115, + "step": 42 + }, + { + "epoch": 0.4536082474226804, + "grad_norm": 3.170315742492676, + "learning_rate": 2e-05, + "loss": 1.1037, + "step": 44 + }, + { + "epoch": 0.4742268041237113, + "grad_norm": 4.2760233879089355, + "learning_rate": 2e-05, + "loss": 2.5901, + "step": 46 + }, + { + "epoch": 0.4948453608247423, + "grad_norm": 3.841566801071167, + "learning_rate": 2e-05, + "loss": 1.9438, + "step": 48 + }, + { + "epoch": 0.5154639175257731, + "grad_norm": 2.682027578353882, + "learning_rate": 2e-05, + "loss": 2.8988, + "step": 50 + }, + { + "epoch": 0.5360824742268041, + "grad_norm": 3.4430131912231445, + "learning_rate": 2e-05, + "loss": 1.8573, + "step": 52 + }, + { + "epoch": 0.5567010309278351, + "grad_norm": 3.58681583404541, + "learning_rate": 2e-05, + "loss": 1.7103, + "step": 54 + }, + { + "epoch": 0.5773195876288659, + "grad_norm": 4.200504779815674, + "learning_rate": 2e-05, + "loss": 1.6962, + "step": 56 + }, + { + "epoch": 0.5979381443298969, + "grad_norm": 1.5903992652893066, + "learning_rate": 2e-05, + "loss": 0.7403, + "step": 58 + }, + { + "epoch": 0.6185567010309279, + "grad_norm": 3.099350690841675, + "learning_rate": 2e-05, + "loss": 1.2287, + "step": 60 + }, + { + "epoch": 0.6391752577319587, + "grad_norm": 2.2113735675811768, + "learning_rate": 2e-05, + "loss": 1.7151, + "step": 62 + }, + { + "epoch": 0.6597938144329897, + "grad_norm": 4.6003499031066895, + "learning_rate": 2e-05, + "loss": 1.4725, + "step": 64 + }, + { + "epoch": 0.6804123711340206, + "grad_norm": 2.043309450149536, + "learning_rate": 2e-05, + "loss": 1.0231, + "step": 66 + }, + { + "epoch": 0.7010309278350515, + "grad_norm": 10.309861183166504, + "learning_rate": 2e-05, + "loss": 2.2619, + "step": 68 + }, + { + "epoch": 0.7216494845360825, + "grad_norm": 8.821622848510742, + "learning_rate": 2e-05, + "loss": 2.2461, + "step": 70 + }, + { + "epoch": 0.7422680412371134, + "grad_norm": 6.0194597244262695, + "learning_rate": 2e-05, + "loss": 2.1463, + "step": 72 + }, + { + "epoch": 0.7628865979381443, + "grad_norm": 2.167174816131592, + "learning_rate": 2e-05, + "loss": 1.9554, + "step": 74 + }, + { + "epoch": 0.7835051546391752, + "grad_norm": 3.795011281967163, + "learning_rate": 2e-05, + "loss": 1.9177, + "step": 76 + }, + { + "epoch": 0.8041237113402062, + "grad_norm": 1.8492149114608765, + "learning_rate": 2e-05, + "loss": 1.136, + "step": 78 + }, + { + "epoch": 0.8247422680412371, + "grad_norm": 3.34080171585083, + "learning_rate": 2e-05, + "loss": 1.5231, + "step": 80 + }, + { + "epoch": 0.845360824742268, + "grad_norm": 6.054934501647949, + "learning_rate": 2e-05, + "loss": 2.0895, + "step": 82 + }, + { + "epoch": 0.865979381443299, + "grad_norm": 6.04076623916626, + "learning_rate": 2e-05, + "loss": 2.3188, + "step": 84 + }, + { + "epoch": 0.8865979381443299, + "grad_norm": 10.989570617675781, + "learning_rate": 2e-05, + "loss": 2.3267, + "step": 86 + }, + { + "epoch": 0.9072164948453608, + "grad_norm": 4.211029529571533, + "learning_rate": 2e-05, + "loss": 1.8569, + "step": 88 + }, + { + "epoch": 0.9278350515463918, + "grad_norm": 3.708380937576294, + "learning_rate": 2e-05, + "loss": 2.2, + "step": 90 + }, + { + "epoch": 0.9484536082474226, + "grad_norm": 1.677304744720459, + "learning_rate": 2e-05, + "loss": 1.3522, + "step": 92 + }, + { + "epoch": 0.9690721649484536, + "grad_norm": 1.7550894021987915, + "learning_rate": 2e-05, + "loss": 1.434, + "step": 94 + }, + { + "epoch": 0.9896907216494846, + "grad_norm": 3.6894521713256836, + "learning_rate": 2e-05, + "loss": 1.2783, + "step": 96 + }, + { + "epoch": 1.0, + "step": 97, + "total_flos": 2839363742334976.0, + "train_loss": 1.8154096701710494, + "train_runtime": 202.4644, + "train_samples_per_second": 1.916, + "train_steps_per_second": 0.479 + } + ], + "logging_steps": 2, + "max_steps": 97, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2839363742334976.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round10_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round10_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad6abb654de76d63e4af63a6d748b3e940d1b62d --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round10_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0230e2af913b9c015d63499c3ebe55174c5c7e0b44df3694e759d4ce0818b67b +size 335548196 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round11_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round11_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..483ee04ceefa58418e21cc3499c0fb8955ea2ef5 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round11_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892ef58fc4e16efe4245b555041191e5b0b2f8f6e2e422ad8677ebe37d76d844 +size 335548196 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round12_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round12_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..f722a70176f56c580e6fc0c3201950bab3146786 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round12_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63e5dce0428339ac97555e253fb9a7495d776a94d5ad129806f98d73bac6bc5b +size 335548196 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round13_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round13_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..ae4e07fb154d290451caaeb52301cd380da0358e --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round13_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eddefd157a150d94a64104c9de743a78f40c4fef417df4609169af5752ed0fc2 +size 335548196 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round14_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round14_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..75dc149fad127fcbda9ef27beeaac12e9bf110f9 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round14_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31fe92fd398aeab3ef5a56a3c2d78d570ea050120fe5a29fb5945f7177d111f0 +size 335548196 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round15_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round15_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..95805b1b224e82134a90f9a898cb756601753023 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round15_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c88bac08f7216332cd9c926ad69b85e1766ad109352d920c5549102184d33bf6 +size 335548196 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round16_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round16_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..a6b1bd1268dfb331256171d5bde6955686298bdd --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round16_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517b60ce0cc260ec25afcc32b229e482c682663387a7938c9fb62b64d9731398 +size 335548196 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round17_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round17_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..bcc53932c72c8c5c680426762e2b68ad72d556d8 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round17_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dff61f699064cc003243923ba30dff1d68ca7434573984bffb8c077bf1873799 +size 335548196 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round18_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round18_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..5513f9d01688c25eea66fe9203e031e22c19ad4f --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round18_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ff056819e7dff24190e196b9ffcf3a52c504f7dcd88cbb6a44658b38daa15e0 +size 335548196 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round19_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round19_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..03ffdaa69e60b882ebcac971a48f69ffc9b4559e --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round19_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb2baa737c00d6b910796e4beb3ed48b177acb60f448342c71e84e41abac7748 +size 335548196 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round1_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round1_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5067fdab4fe9cbf1c5db65cc22d35968bca41e6 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round1_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a27fea31b683a7b952fb17d1b989dea83ee7957c5ce80228390e2f26f6a9d15 +size 335548182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round20_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round20_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..345984ae96acd1c92ff0f225bb6cba19110c533f --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round20_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e14b1e41a85540e6145351e25f12488d6c60a1724560e657c830b9e4205d4b7 +size 335548196 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round2_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round2_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..4dfc088e51e17bfa8cd9a121333d3eb765e4f8f3 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round2_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30b1b9ef6adffa905ad4203c943d28778f16e6dc945403a47d9cfdfbf2f748b5 +size 335548182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round3_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round3_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..d10c7855a630b9a9a6e70a0015ce7de8d9ab882b --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round3_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58250ff52983ca7108767329c966cb45db747a0ca465b354f3504fbf86dfdae3 +size 335548182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round4_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round4_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..6621aebef3bb46c5374945e3d954ca86cc37e2a8 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round4_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58d8132d9b8a4032c9437e15395b650ec3b13a4b3d20ff40abc366a5d80d235d +size 335548182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round5_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round5_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..3897cfe3719159ef839b826c9158bd82a27d56f5 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round5_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59df212594d739afa8703f8dd971877421aa360fc572120325356b82c606b4b1 +size 335548182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round6_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round6_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..8f0ba9c3f748ad9a94033868516f9695b5566658 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round6_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d68cb109ec7dcc7bf23ab3404b84f4746c56e21470990a4f7d0065032084d0c +size 335548182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round7_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round7_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..39235cc67ad42773b2945114b0afebf456a5d033 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round7_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18b55464f0de0de0a808549ff4a835e6f0365c483cd0445b35303ca7256ac1c4 +size 335548182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round8_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round8_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf47e5e32648ab09581fd4c60a54b7fcc0dba496 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round8_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f001ac91db334607d9aa677145db2302cc5bcf5bfd831be1c367d170a73ac64f +size 335548182 diff --git a/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round9_task_vector_local_weights.pth b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round9_task_vector_local_weights.pth new file mode 100644 index 0000000000000000000000000000000000000000..444983e7727dbaff2b13ba0e29e36d2dfef66425 --- /dev/null +++ b/client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/round9_task_vector_local_weights.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0edd46a5ddad6eca7eb31a44a2ed4ddf94a456fd6565f36676d6f5bbd051f63 +size 335548182