thkim0305 commited on May 6, 2025

Commit

8df2c01

verified ·

1 Parent(s): f1cc9e0

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_trainer_state.json +378 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_trainer_state.json +378 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_trainer_state.json +378 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_trainer_state.json +378 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_trainer_state.json +378 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round2.pth +3 -0

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6b16768f7dc2eae664e5fd275f1c0e4a05c9147bb79c0c4b402a18aeaaf8375d
+size 368443438

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ebe47cb1aefad62c1fd613c76140e6267ba060f1c514591486cf4468523c5b41
+size 368443438

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7f4e565288b1dd9e16440afea7c377fea6e8c2b86a937030cd568bd120fd038f
+size 368443438

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c1d356437d08bccdd3ce361ad9057428bcf4cae911a507b8332d938f41f5dc74
+size 368443438

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e98f5737926eedec558b34d9e5d045c45ea50e7ff4c68699fa210aaaf5120a9
+size 368442474

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:15aa028b6cced7cfa1cde28f6be8395d18b370d33f5961c4652916168c869da9
+size 368443438

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:421f88eb88ff09a6f10c9c0caf03a8665de01d152db170828eca4be38fb91eac
+size 368442474

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:525f0f37c26b21e07d6e9178e77c0ef29b869daafb690f58a885a4a1402ea584
+size 368442474

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/0_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 4.400585174560547,
+      "learning_rate": 2e-05,
+      "loss": 2.1084,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 0.24108143150806427,
+      "learning_rate": 2e-05,
+      "loss": 0.5575,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 2.3387579917907715,
+      "learning_rate": 2e-05,
+      "loss": 1.3726,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 3.3745932579040527,
+      "learning_rate": 2e-05,
+      "loss": 1.0676,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 0.499793142080307,
+      "learning_rate": 2e-05,
+      "loss": 1.5278,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 1.0053821802139282,
+      "learning_rate": 2e-05,
+      "loss": 0.4909,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 1.3840383291244507,
+      "learning_rate": 2e-05,
+      "loss": 0.9338,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 2.917617082595825,
+      "learning_rate": 2e-05,
+      "loss": 0.3054,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 1.6473109722137451,
+      "learning_rate": 2e-05,
+      "loss": 0.8086,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 1.5606623888015747,
+      "learning_rate": 2e-05,
+      "loss": 1.9234,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 0.5007361173629761,
+      "learning_rate": 2e-05,
+      "loss": 0.7782,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 1.6239376068115234,
+      "learning_rate": 2e-05,
+      "loss": 1.1194,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 2.372718572616577,
+      "learning_rate": 2e-05,
+      "loss": 0.4856,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 1.8457813262939453,
+      "learning_rate": 2e-05,
+      "loss": 1.3728,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 0.855133593082428,
+      "learning_rate": 2e-05,
+      "loss": 2.0313,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 1.2432137727737427,
+      "learning_rate": 2e-05,
+      "loss": 0.4426,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 1.4432425498962402,
+      "learning_rate": 2e-05,
+      "loss": 0.7053,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 1.024395227432251,
+      "learning_rate": 2e-05,
+      "loss": 0.6134,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 1.194606900215149,
+      "learning_rate": 2e-05,
+      "loss": 0.8373,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 3.11031174659729,
+      "learning_rate": 2e-05,
+      "loss": 2.5497,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 1.2926805019378662,
+      "learning_rate": 2e-05,
+      "loss": 0.9482,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 0.5149866938591003,
+      "learning_rate": 2e-05,
+      "loss": 0.4165,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 1.190213680267334,
+      "learning_rate": 2e-05,
+      "loss": 0.9618,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 0.6894278526306152,
+      "learning_rate": 2e-05,
+      "loss": 1.0249,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 2.4215104579925537,
+      "learning_rate": 2e-05,
+      "loss": 2.0148,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.714414119720459,
+      "learning_rate": 2e-05,
+      "loss": 1.3428,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 1.1892106533050537,
+      "learning_rate": 2e-05,
+      "loss": 1.1607,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 1.21503484249115,
+      "learning_rate": 2e-05,
+      "loss": 1.836,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 0.6278855800628662,
+      "learning_rate": 2e-05,
+      "loss": 0.844,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 2.5338757038116455,
+      "learning_rate": 2e-05,
+      "loss": 0.7447,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 1.6841797828674316,
+      "learning_rate": 2e-05,
+      "loss": 0.8774,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 0.9872264862060547,
+      "learning_rate": 2e-05,
+      "loss": 0.9218,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.0775535106658936,
+      "learning_rate": 2e-05,
+      "loss": 0.9773,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 1.7016096115112305,
+      "learning_rate": 2e-05,
+      "loss": 1.3366,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 9.161294937133789,
+      "learning_rate": 2e-05,
+      "loss": 2.0726,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 1.1249581575393677,
+      "learning_rate": 2e-05,
+      "loss": 0.8084,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 1.4263134002685547,
+      "learning_rate": 2e-05,
+      "loss": 0.9452,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 3.8015453815460205,
+      "learning_rate": 2e-05,
+      "loss": 1.3966,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 1.51714026927948,
+      "learning_rate": 2e-05,
+      "loss": 1.3366,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 1.001514196395874,
+      "learning_rate": 2e-05,
+      "loss": 1.2534,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 0.437701553106308,
+      "learning_rate": 2e-05,
+      "loss": 0.6374,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 0.8562130928039551,
+      "learning_rate": 2e-05,
+      "loss": 0.8362,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 1.1629040241241455,
+      "learning_rate": 2e-05,
+      "loss": 0.6705,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 0.7516007423400879,
+      "learning_rate": 2e-05,
+      "loss": 0.9896,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.4195737838745117,
+      "learning_rate": 2e-05,
+      "loss": 0.8637,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 2.6594505310058594,
+      "learning_rate": 2e-05,
+      "loss": 1.1106,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 0.5046249628067017,
+      "learning_rate": 2e-05,
+      "loss": 0.7569,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 2.1814091205596924,
+      "learning_rate": 2e-05,
+      "loss": 1.1165,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 5716895332302848.0,
+      "train_loss": 1.0793670944331848,
+      "train_runtime": 222.0474,
+      "train_samples_per_second": 1.747,
+      "train_steps_per_second": 0.437
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5716895332302848.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1b4cf563ddeb6cec914fa98a3339483e303ee40bcfbc8177f2de90ec07fd9f32
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8d4e731a0acc1c910df1a066b29fbc699083b9afcfd305403782197d842e12ad
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:72086853e3f2e6d801b2bbabd64045d8df56a4e1a9d90762650e9def4016026b
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ca8e1391c42f7045fc6ae4257810e9ec6fa9b85ad051a083f1b3a6cc1c13b9e7
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ad99be95eca9ecc8be94e2334e2786ea50b2df0bc5a440a7200405c66c551aa
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e370b2d3fe5711152b28b41a8df70a261223af0d600ff997c0beee58add2f883
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:03b2c620112acbddbfdcaa58a0bcc02827da8b0c3062d0bbb0aacdbfce067764
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d9ad4a35f17fa2fa92dbf9df9678d3ab4ba7f3b43367db0b87142e429f809cd1
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/1_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 1.0367224216461182,
+      "learning_rate": 2e-05,
+      "loss": 2.1122,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 1.5293935537338257,
+      "learning_rate": 2e-05,
+      "loss": 2.3105,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 1.200186848640442,
+      "learning_rate": 2e-05,
+      "loss": 1.2933,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 0.551851749420166,
+      "learning_rate": 2e-05,
+      "loss": 1.01,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 1.2025572061538696,
+      "learning_rate": 2e-05,
+      "loss": 1.6588,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 0.773492693901062,
+      "learning_rate": 2e-05,
+      "loss": 1.269,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 1.1679770946502686,
+      "learning_rate": 2e-05,
+      "loss": 0.9164,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 0.5977709293365479,
+      "learning_rate": 2e-05,
+      "loss": 1.4414,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 1.0373786687850952,
+      "learning_rate": 2e-05,
+      "loss": 2.1323,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 1.6528465747833252,
+      "learning_rate": 2e-05,
+      "loss": 1.0931,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 1.2186673879623413,
+      "learning_rate": 2e-05,
+      "loss": 0.9268,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 0.9843794107437134,
+      "learning_rate": 2e-05,
+      "loss": 1.4834,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 1.1736723184585571,
+      "learning_rate": 2e-05,
+      "loss": 0.973,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 0.9919485449790955,
+      "learning_rate": 2e-05,
+      "loss": 1.426,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 0.3353116512298584,
+      "learning_rate": 2e-05,
+      "loss": 0.3913,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 0.7836465835571289,
+      "learning_rate": 2e-05,
+      "loss": 0.9893,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 0.6000968813896179,
+      "learning_rate": 2e-05,
+      "loss": 1.1023,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 1.1263123750686646,
+      "learning_rate": 2e-05,
+      "loss": 1.2717,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 1.4765498638153076,
+      "learning_rate": 2e-05,
+      "loss": 1.2275,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 0.7918884754180908,
+      "learning_rate": 2e-05,
+      "loss": 1.124,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 0.881719708442688,
+      "learning_rate": 2e-05,
+      "loss": 1.1614,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 0.5077035427093506,
+      "learning_rate": 2e-05,
+      "loss": 0.7703,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 1.0335602760314941,
+      "learning_rate": 2e-05,
+      "loss": 1.0186,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 2.6902318000793457,
+      "learning_rate": 2e-05,
+      "loss": 1.4702,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 0.48346254229545593,
+      "learning_rate": 2e-05,
+      "loss": 0.7069,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.43713346123695374,
+      "learning_rate": 2e-05,
+      "loss": 0.9541,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 0.7219210863113403,
+      "learning_rate": 2e-05,
+      "loss": 1.0328,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 0.6687954068183899,
+      "learning_rate": 2e-05,
+      "loss": 0.9612,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 0.4545569121837616,
+      "learning_rate": 2e-05,
+      "loss": 0.7134,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 1.4642369747161865,
+      "learning_rate": 2e-05,
+      "loss": 1.0691,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 0.866256058216095,
+      "learning_rate": 2e-05,
+      "loss": 0.9705,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 0.6883927583694458,
+      "learning_rate": 2e-05,
+      "loss": 1.0837,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 0.8896063566207886,
+      "learning_rate": 2e-05,
+      "loss": 1.2245,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 1.008226990699768,
+      "learning_rate": 2e-05,
+      "loss": 0.8514,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 0.5231401324272156,
+      "learning_rate": 2e-05,
+      "loss": 0.8315,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 1.1414425373077393,
+      "learning_rate": 2e-05,
+      "loss": 1.0161,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 0.8160688281059265,
+      "learning_rate": 2e-05,
+      "loss": 0.9522,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 4.522146224975586,
+      "learning_rate": 2e-05,
+      "loss": 1.3154,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 0.8005837798118591,
+      "learning_rate": 2e-05,
+      "loss": 1.38,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 0.8043385744094849,
+      "learning_rate": 2e-05,
+      "loss": 0.7023,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 0.4813634753227234,
+      "learning_rate": 2e-05,
+      "loss": 1.2706,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 2.6377651691436768,
+      "learning_rate": 2e-05,
+      "loss": 0.7818,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 0.9884634017944336,
+      "learning_rate": 2e-05,
+      "loss": 0.8094,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 1.7997894287109375,
+      "learning_rate": 2e-05,
+      "loss": 0.4816,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.9168503284454346,
+      "learning_rate": 2e-05,
+      "loss": 0.8998,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 0.4715125858783722,
+      "learning_rate": 2e-05,
+      "loss": 1.7297,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 0.7565422058105469,
+      "learning_rate": 2e-05,
+      "loss": 1.1934,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 1.6956796646118164,
+      "learning_rate": 2e-05,
+      "loss": 1.0388,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 1.3756887170285568e+16,
+      "train_loss": 1.1302465065238403,
+      "train_runtime": 315.5064,
+      "train_samples_per_second": 1.23,
+      "train_steps_per_second": 0.307
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.3756887170285568e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:623c27c6e16e61754cf9f9bde6b0a2f00c89549eada108fd4d3385eeaa29b8a5
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9394ca5cba51cc4d5f9a628c5235add0cc79e6cefcbf73aab79088eaf9958ec2
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1698991ce97c58e41af99e8d6b1461337859fc7938ede7e57f36eebb9dccf5f7
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:de7badf37bc6814c02941952260ab1c4ea0434cdd296a402f91bb67747e52c24
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4c6e3bfc5a8aab513e9fe3473e92e3048bfbc4d19bd4c4176ce0141a9c69225d
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7e86a679b1183d5d4cc5c15a3054fd2b160fe0443325d5f0d091c265c5eb060f
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc8dc7440211f75b47738e72ddd3bf0a982d45c096e63747b2ba17635f45434a
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:206787c858348d28620a2bc4ffbc2c93037006a7963eff3316cb95bd1e6bc540
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/2_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 2.538358211517334,
+      "learning_rate": 2e-05,
+      "loss": 0.6608,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 1.2682268619537354,
+      "learning_rate": 2e-05,
+      "loss": 0.9785,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 1.937935709953308,
+      "learning_rate": 2e-05,
+      "loss": 2.3516,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 1.4392732381820679,
+      "learning_rate": 2e-05,
+      "loss": 1.6785,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 1.5007473230361938,
+      "learning_rate": 2e-05,
+      "loss": 1.5229,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 0.6477186679840088,
+      "learning_rate": 2e-05,
+      "loss": 1.3816,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 2.7069621086120605,
+      "learning_rate": 2e-05,
+      "loss": 1.319,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 0.5525019764900208,
+      "learning_rate": 2e-05,
+      "loss": 0.9359,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 0.7979759573936462,
+      "learning_rate": 2e-05,
+      "loss": 1.6191,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 2.443120241165161,
+      "learning_rate": 2e-05,
+      "loss": 1.0461,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 0.8416927456855774,
+      "learning_rate": 2e-05,
+      "loss": 1.217,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 0.7521089315414429,
+      "learning_rate": 2e-05,
+      "loss": 1.0924,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 1.4497734308242798,
+      "learning_rate": 2e-05,
+      "loss": 1.1838,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 0.6999666690826416,
+      "learning_rate": 2e-05,
+      "loss": 1.1143,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 1.1742311716079712,
+      "learning_rate": 2e-05,
+      "loss": 0.9922,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 0.5971889495849609,
+      "learning_rate": 2e-05,
+      "loss": 1.6466,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 1.034390926361084,
+      "learning_rate": 2e-05,
+      "loss": 0.8025,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 2.665285110473633,
+      "learning_rate": 2e-05,
+      "loss": 0.9528,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 0.8578566312789917,
+      "learning_rate": 2e-05,
+      "loss": 0.9949,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 1.1724331378936768,
+      "learning_rate": 2e-05,
+      "loss": 0.903,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 1.1174654960632324,
+      "learning_rate": 2e-05,
+      "loss": 1.1925,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 1.1770066022872925,
+      "learning_rate": 2e-05,
+      "loss": 0.8522,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 0.9446500539779663,
+      "learning_rate": 2e-05,
+      "loss": 1.9395,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 0.4612779915332794,
+      "learning_rate": 2e-05,
+      "loss": 0.4162,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 0.7479944229125977,
+      "learning_rate": 2e-05,
+      "loss": 0.953,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.7862464189529419,
+      "learning_rate": 2e-05,
+      "loss": 0.3849,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 0.7938858270645142,
+      "learning_rate": 2e-05,
+      "loss": 0.6369,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 2.231029987335205,
+      "learning_rate": 2e-05,
+      "loss": 0.9901,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 0.3764982223510742,
+      "learning_rate": 2e-05,
+      "loss": 0.9056,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 0.9940462708473206,
+      "learning_rate": 2e-05,
+      "loss": 0.5912,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 0.9223126173019409,
+      "learning_rate": 2e-05,
+      "loss": 0.6726,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 0.7324680685997009,
+      "learning_rate": 2e-05,
+      "loss": 0.4076,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 0.8635823130607605,
+      "learning_rate": 2e-05,
+      "loss": 0.5997,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 1.428286075592041,
+      "learning_rate": 2e-05,
+      "loss": 0.9463,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 0.5211204290390015,
+      "learning_rate": 2e-05,
+      "loss": 0.7596,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 1.464924931526184,
+      "learning_rate": 2e-05,
+      "loss": 0.7913,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 2.8257651329040527,
+      "learning_rate": 2e-05,
+      "loss": 1.2766,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 2.5703413486480713,
+      "learning_rate": 2e-05,
+      "loss": 0.8435,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 1.486395239830017,
+      "learning_rate": 2e-05,
+      "loss": 0.9819,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 0.4546787738800049,
+      "learning_rate": 2e-05,
+      "loss": 0.2796,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 0.7543643116950989,
+      "learning_rate": 2e-05,
+      "loss": 0.2902,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 0.8718597292900085,
+      "learning_rate": 2e-05,
+      "loss": 0.5479,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 2.138429880142212,
+      "learning_rate": 2e-05,
+      "loss": 1.1224,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 0.581947922706604,
+      "learning_rate": 2e-05,
+      "loss": 0.9022,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.3591723442077637,
+      "learning_rate": 2e-05,
+      "loss": 0.9803,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 1.1390422582626343,
+      "learning_rate": 2e-05,
+      "loss": 1.1259,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 1.318390130996704,
+      "learning_rate": 2e-05,
+      "loss": 0.9855,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 1.238763451576233,
+      "learning_rate": 2e-05,
+      "loss": 0.4494,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 1.5309291128881152e+16,
+      "train_loss": 0.9762444643630195,
+      "train_runtime": 351.1873,
+      "train_samples_per_second": 1.105,
+      "train_steps_per_second": 0.276
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.5309291128881152e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3fc77f4acfc80e842f0c49ca07c0518a93812788236835cee6b47f88c1ce363a
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:40d3dc701382da26808567ded7104ae77026cab4a5a03ca85a9b7408b648375f
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b6fbb24e8df10767d6e48cd3bbe7abb171912af63f525f6830f724827e262f42
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc952fe4c8ad4ef2ce347a0fec31859d5ea7286b61fbdbd33f62cc59fc6a1db8
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6b91e5497d58df5e6c88cfd96c80538d3b0489625e9c1844bc7134fc1819c132
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:41b1e011c681191accbfee628a5d5367b45a57bb25b21cc0fb2dcc706842da26
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:909ae260c1b95d5769bb16ca3cc0ea471dd2f0a32764d5950ed946519bbdfa90
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:deb5bbcfb7d060129e306207445c42c34099a7c3d3df2de2dd80ec00e2a81b15
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/3_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 1.7036350965499878,
+      "learning_rate": 2e-05,
+      "loss": 1.1502,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 0.733051061630249,
+      "learning_rate": 2e-05,
+      "loss": 0.3144,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 3.021022081375122,
+      "learning_rate": 2e-05,
+      "loss": 1.523,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 0.6244669556617737,
+      "learning_rate": 2e-05,
+      "loss": 0.9215,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 1.675452470779419,
+      "learning_rate": 2e-05,
+      "loss": 1.2749,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 0.2071010321378708,
+      "learning_rate": 2e-05,
+      "loss": 0.2043,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 0.45165616273880005,
+      "learning_rate": 2e-05,
+      "loss": 0.2592,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 0.9154694080352783,
+      "learning_rate": 2e-05,
+      "loss": 1.0788,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 0.44769397377967834,
+      "learning_rate": 2e-05,
+      "loss": 0.672,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 1.001409649848938,
+      "learning_rate": 2e-05,
+      "loss": 0.7424,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 0.2860804498195648,
+      "learning_rate": 2e-05,
+      "loss": 0.7084,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 0.4580197036266327,
+      "learning_rate": 2e-05,
+      "loss": 1.1849,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 0.4905541241168976,
+      "learning_rate": 2e-05,
+      "loss": 0.7166,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 1.433603048324585,
+      "learning_rate": 2e-05,
+      "loss": 1.5247,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 2.386955738067627,
+      "learning_rate": 2e-05,
+      "loss": 0.8547,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 2.032757043838501,
+      "learning_rate": 2e-05,
+      "loss": 0.5488,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 1.0941940546035767,
+      "learning_rate": 2e-05,
+      "loss": 0.9551,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 1.461041808128357,
+      "learning_rate": 2e-05,
+      "loss": 1.1186,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 0.46292173862457275,
+      "learning_rate": 2e-05,
+      "loss": 0.9941,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 0.46523961424827576,
+      "learning_rate": 2e-05,
+      "loss": 0.99,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 0.5094814896583557,
+      "learning_rate": 2e-05,
+      "loss": 1.0255,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 3.24894642829895,
+      "learning_rate": 2e-05,
+      "loss": 1.3442,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 3.7670817375183105,
+      "learning_rate": 2e-05,
+      "loss": 1.279,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 2.1132254600524902,
+      "learning_rate": 2e-05,
+      "loss": 1.7001,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 0.593248724937439,
+      "learning_rate": 2e-05,
+      "loss": 0.8884,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 1.4078608751296997,
+      "learning_rate": 2e-05,
+      "loss": 0.8091,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 0.3955836892127991,
+      "learning_rate": 2e-05,
+      "loss": 0.3546,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 0.9244691729545593,
+      "learning_rate": 2e-05,
+      "loss": 1.437,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 0.4643814265727997,
+      "learning_rate": 2e-05,
+      "loss": 0.881,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 0.41819217801094055,
+      "learning_rate": 2e-05,
+      "loss": 0.6405,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 0.7221791744232178,
+      "learning_rate": 2e-05,
+      "loss": 0.7172,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 0.44450488686561584,
+      "learning_rate": 2e-05,
+      "loss": 0.7196,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.463599443435669,
+      "learning_rate": 2e-05,
+      "loss": 1.4753,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 0.2606247365474701,
+      "learning_rate": 2e-05,
+      "loss": 0.8865,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 0.3822779655456543,
+      "learning_rate": 2e-05,
+      "loss": 0.7243,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 0.314899206161499,
+      "learning_rate": 2e-05,
+      "loss": 0.9963,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 0.47478482127189636,
+      "learning_rate": 2e-05,
+      "loss": 0.7358,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 3.180941581726074,
+      "learning_rate": 2e-05,
+      "loss": 1.546,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 0.392020046710968,
+      "learning_rate": 2e-05,
+      "loss": 0.4863,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 0.4663325548171997,
+      "learning_rate": 2e-05,
+      "loss": 0.3802,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 0.5237138867378235,
+      "learning_rate": 2e-05,
+      "loss": 0.5043,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 0.8400606513023376,
+      "learning_rate": 2e-05,
+      "loss": 0.8792,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 0.3281240463256836,
+      "learning_rate": 2e-05,
+      "loss": 0.735,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 1.076886773109436,
+      "learning_rate": 2e-05,
+      "loss": 0.9669,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 0.6442875266075134,
+      "learning_rate": 2e-05,
+      "loss": 0.6857,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 1.3491824865341187,
+      "learning_rate": 2e-05,
+      "loss": 0.7857,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 0.4119647443294525,
+      "learning_rate": 2e-05,
+      "loss": 0.5265,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 0.9270315766334534,
+      "learning_rate": 2e-05,
+      "loss": 1.2191,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 2.081554905117491e+16,
+      "train_loss": 0.8912827993176647,
+      "train_runtime": 342.0553,
+      "train_samples_per_second": 1.134,
+      "train_steps_per_second": 0.284
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.081554905117491e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:76222740e5b1eb701df8242a79fa98659c625a40a9d557ff4ee9ab9793e6a2de
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af4abb1969b8895e24009b3474b99f4b40c4a44b2056fb6935f1f5c9fbd2b7de
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aed5d456627b3b084bed1c6c4f40781201a9314e9ab4c7fcd0045aa87653ad93
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:974c3d90766732a37f45318d13fa049f577025980b07e7b331d04ffe0c7db571
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:369ee76d02588c766be21d8792a4eb5096425d0505d617ed47d36b31ab2a7489
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:724a4cb19d6636ec4851b473dc93dfec177f1eb18c9610b52336f58fe4ac864e
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:296b10e3bc3a9fa0d2250f938b2eecca029ba36b1dced5a077b832d32301cc42
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2799db2855c1d10a215ade45151d9ac24e0793f29bfafc62c45ef363f459e35e
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/4_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 1.3807806968688965,
+      "learning_rate": 2e-05,
+      "loss": 1.2215,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 5.47310209274292,
+      "learning_rate": 2e-05,
+      "loss": 1.7948,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 4.091208457946777,
+      "learning_rate": 2e-05,
+      "loss": 1.4245,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 2.522712230682373,
+      "learning_rate": 2e-05,
+      "loss": 1.2455,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 2.400545835494995,
+      "learning_rate": 2e-05,
+      "loss": 1.4473,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 2.147249937057495,
+      "learning_rate": 2e-05,
+      "loss": 0.648,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 0.6440826654434204,
+      "learning_rate": 2e-05,
+      "loss": 0.1022,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 1.4986751079559326,
+      "learning_rate": 2e-05,
+      "loss": 1.5813,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 2.2775418758392334,
+      "learning_rate": 2e-05,
+      "loss": 0.7531,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 3.2079670429229736,
+      "learning_rate": 2e-05,
+      "loss": 1.6908,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 2.16922926902771,
+      "learning_rate": 2e-05,
+      "loss": 1.5928,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 2.276587724685669,
+      "learning_rate": 2e-05,
+      "loss": 1.4918,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 1.4131243228912354,
+      "learning_rate": 2e-05,
+      "loss": 1.7804,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 3.375476121902466,
+      "learning_rate": 2e-05,
+      "loss": 1.9648,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 2.6980457305908203,
+      "learning_rate": 2e-05,
+      "loss": 1.9027,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 1.1185120344161987,
+      "learning_rate": 2e-05,
+      "loss": 1.2945,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 1.5742499828338623,
+      "learning_rate": 2e-05,
+      "loss": 2.3652,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 1.6757092475891113,
+      "learning_rate": 2e-05,
+      "loss": 1.5789,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 1.5958377122879028,
+      "learning_rate": 2e-05,
+      "loss": 1.4983,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 1.3994206190109253,
+      "learning_rate": 2e-05,
+      "loss": 0.8934,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 0.8964346647262573,
+      "learning_rate": 2e-05,
+      "loss": 0.7392,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 1.5910592079162598,
+      "learning_rate": 2e-05,
+      "loss": 0.8057,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 0.8048728704452515,
+      "learning_rate": 2e-05,
+      "loss": 0.7514,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 3.0406651496887207,
+      "learning_rate": 2e-05,
+      "loss": 1.271,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 2.1475746631622314,
+      "learning_rate": 2e-05,
+      "loss": 1.3316,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 1.973347544670105,
+      "learning_rate": 2e-05,
+      "loss": 0.9409,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 0.5019800662994385,
+      "learning_rate": 2e-05,
+      "loss": 0.5754,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 2.1202926635742188,
+      "learning_rate": 2e-05,
+      "loss": 1.3977,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 1.2852915525436401,
+      "learning_rate": 2e-05,
+      "loss": 1.6778,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 1.093619465827942,
+      "learning_rate": 2e-05,
+      "loss": 0.8222,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 0.7490342259407043,
+      "learning_rate": 2e-05,
+      "loss": 0.6013,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 2.6893742084503174,
+      "learning_rate": 2e-05,
+      "loss": 1.2905,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 3.0177910327911377,
+      "learning_rate": 2e-05,
+      "loss": 1.7748,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 1.123380422592163,
+      "learning_rate": 2e-05,
+      "loss": 0.8262,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 1.6035982370376587,
+      "learning_rate": 2e-05,
+      "loss": 0.798,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 0.7902660965919495,
+      "learning_rate": 2e-05,
+      "loss": 1.0709,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 1.8285802602767944,
+      "learning_rate": 2e-05,
+      "loss": 1.0743,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 2.9130942821502686,
+      "learning_rate": 2e-05,
+      "loss": 2.0891,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 1.4661481380462646,
+      "learning_rate": 2e-05,
+      "loss": 1.1128,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 2.301260471343994,
+      "learning_rate": 2e-05,
+      "loss": 1.6207,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 1.637123465538025,
+      "learning_rate": 2e-05,
+      "loss": 1.3459,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 1.056007742881775,
+      "learning_rate": 2e-05,
+      "loss": 1.2215,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 1.2907710075378418,
+      "learning_rate": 2e-05,
+      "loss": 1.6295,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 1.3023312091827393,
+      "learning_rate": 2e-05,
+      "loss": 1.0457,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 0.39116430282592773,
+      "learning_rate": 2e-05,
+      "loss": 1.1983,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 0.9639070630073547,
+      "learning_rate": 2e-05,
+      "loss": 1.1595,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 1.6161588430404663,
+      "learning_rate": 2e-05,
+      "loss": 1.2601,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 2.380856513977051,
+      "learning_rate": 2e-05,
+      "loss": 0.6827,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 2.074250449204019e+16,
+      "train_loss": 1.2486689803526574,
+      "train_runtime": 347.5167,
+      "train_samples_per_second": 1.116,
+      "train_steps_per_second": 0.279
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.074250449204019e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:09cd08a35ceaf65f8b4b8c2b3943b855c5e7348c334be564b82fa3d4dc95bad8
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d6ce216ab0402be87c84d6af509a84f0ce168cf22217ee6eb8263e51dd6142d6
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0970a229f1f57205586ba91eed0371c4af2fe6fbfaa4a6ec8f6aa437d820ac8d
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b873fa30a8c5d382069a0c536ec17db452e64f48a4c4c7b3c9dafca48b601f1d
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099_SEED3/5_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99c23eb08adf5a7a45e3b25bc3f6dd68703808836dcdddf7a33aa4d8121f930d
+size 791576546