thkim0305 commited on May 5, 2025

Commit

f182f3c

verified ·

1 Parent(s): 9d619ad

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_trainer_state.json +378 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_trainer_state.json +378 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_trainer_state.json +378 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_trainer_state.json +378 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_trainer_state.json +378 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round2.pth +3 -0

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f7c6682c76a002291c94ab5400f46aad989063cceafda2bb335890c225c469f6
+size 368443438

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:03ffd7f8cda1890da71515a263f4200fb94e95e55d8015c4884ebbe683b11dde
+size 368443438

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:463639587f71bcbd5b9d4481a2af8b2a50eb9728a9d1126789118ee6213c321d
+size 368443438

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eb0d4a5ef7da16ffc179066f20f6577b695c216c334fb9207199ac0bf36085d7
+size 368443438

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6f998475c714790ced260b7d08905deaf25397487d22f12b88939abb267ba23b
+size 368442474

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e8e030d7c0cfa7e8171852dba2ae6e04bb8cd8017f7d3a490b15f7ca76d21aa1
+size 368443438

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:616c57ef296799deec39f31f99f043a4bdf1ad531074e5c884d8f1beff2d6e35
+size 368442474

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:93589c35187351c587af0cb2f9bd08601b587df4aa00cd4809909821c10c86b4
+size 368442474

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/0_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 1.443185567855835,
+      "learning_rate": 2e-05,
+      "loss": 1.0495,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 1.8465604782104492,
+      "learning_rate": 2e-05,
+      "loss": 1.2367,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 1.3454159498214722,
+      "learning_rate": 2e-05,
+      "loss": 1.1763,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 4.38826847076416,
+      "learning_rate": 2e-05,
+      "loss": 2.243,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 0.6966120600700378,
+      "learning_rate": 2e-05,
+      "loss": 0.8164,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 0.5520138144493103,
+      "learning_rate": 2e-05,
+      "loss": 0.5507,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 2.7041213512420654,
+      "learning_rate": 2e-05,
+      "loss": 1.2546,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 4.7814555168151855,
+      "learning_rate": 2e-05,
+      "loss": 1.4361,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 0.8622943758964539,
+      "learning_rate": 2e-05,
+      "loss": 0.7884,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 0.8466795086860657,
+      "learning_rate": 2e-05,
+      "loss": 0.8781,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 2.9229226112365723,
+      "learning_rate": 2e-05,
+      "loss": 0.7513,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 1.2761527299880981,
+      "learning_rate": 2e-05,
+      "loss": 0.9905,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 2.6934807300567627,
+      "learning_rate": 2e-05,
+      "loss": 1.8354,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 1.0872917175292969,
+      "learning_rate": 2e-05,
+      "loss": 1.2724,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 2.1482253074645996,
+      "learning_rate": 2e-05,
+      "loss": 1.6143,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 0.905875563621521,
+      "learning_rate": 2e-05,
+      "loss": 1.6322,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 0.6854360103607178,
+      "learning_rate": 2e-05,
+      "loss": 0.8599,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 0.8919254541397095,
+      "learning_rate": 2e-05,
+      "loss": 1.0498,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 1.6378024816513062,
+      "learning_rate": 2e-05,
+      "loss": 1.1343,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 1.0561065673828125,
+      "learning_rate": 2e-05,
+      "loss": 1.0583,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 0.7613285779953003,
+      "learning_rate": 2e-05,
+      "loss": 1.5316,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 1.940731167793274,
+      "learning_rate": 2e-05,
+      "loss": 0.7388,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 1.1051706075668335,
+      "learning_rate": 2e-05,
+      "loss": 1.0972,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 1.7498652935028076,
+      "learning_rate": 2e-05,
+      "loss": 0.735,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 1.488133192062378,
+      "learning_rate": 2e-05,
+      "loss": 1.435,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.48400750756263733,
+      "learning_rate": 2e-05,
+      "loss": 0.219,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 0.843970775604248,
+      "learning_rate": 2e-05,
+      "loss": 1.3159,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 2.2032525539398193,
+      "learning_rate": 2e-05,
+      "loss": 1.2433,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 2.2895724773406982,
+      "learning_rate": 2e-05,
+      "loss": 0.6293,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 1.6934003829956055,
+      "learning_rate": 2e-05,
+      "loss": 0.8883,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 3.9248857498168945,
+      "learning_rate": 2e-05,
+      "loss": 1.7568,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 3.8822836875915527,
+      "learning_rate": 2e-05,
+      "loss": 1.358,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 2.8576316833496094,
+      "learning_rate": 2e-05,
+      "loss": 0.6214,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 2.46586537361145,
+      "learning_rate": 2e-05,
+      "loss": 0.39,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 2.4729208946228027,
+      "learning_rate": 2e-05,
+      "loss": 0.9929,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 2.4468770027160645,
+      "learning_rate": 2e-05,
+      "loss": 1.4753,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 5.142044544219971,
+      "learning_rate": 2e-05,
+      "loss": 1.4092,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 3.540414333343506,
+      "learning_rate": 2e-05,
+      "loss": 1.3685,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 1.6057883501052856,
+      "learning_rate": 2e-05,
+      "loss": 0.8978,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 2.5897274017333984,
+      "learning_rate": 2e-05,
+      "loss": 1.5045,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 0.60903400182724,
+      "learning_rate": 2e-05,
+      "loss": 0.97,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 1.9482678174972534,
+      "learning_rate": 2e-05,
+      "loss": 1.8024,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 1.7348854541778564,
+      "learning_rate": 2e-05,
+      "loss": 1.105,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 1.3475691080093384,
+      "learning_rate": 2e-05,
+      "loss": 1.6093,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 0.98420250415802,
+      "learning_rate": 2e-05,
+      "loss": 0.6538,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 1.3864518404006958,
+      "learning_rate": 2e-05,
+      "loss": 1.3196,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 1.4003015756607056,
+      "learning_rate": 2e-05,
+      "loss": 0.7891,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 1.4709246158599854,
+      "learning_rate": 2e-05,
+      "loss": 0.8115,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 5653713448337408.0,
+      "train_loss": 1.1264018225915653,
+      "train_runtime": 208.5258,
+      "train_samples_per_second": 1.861,
+      "train_steps_per_second": 0.465
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5653713448337408.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:669a580e6490be915efbd67e52ae5d5eebf6ec1cfe8ed75462a0b139aaf852b9
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5ee3bb60763f435737915de658c4663b6a667f582ed8be7e60fef7157534dd7
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dcf13622c365cefe6bc7f685fad7d20f552bf6b29003b54dcd82de9dabdc3805
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5e6c9656642a5444d90acfa6f0daa4c79a3e390288297eeb1abf064e503f5ab0
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7f0485b8a1b36390a6785f6d93b6e361d6a74346cc48938a91ac1c35ef15235b
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a0517ce73a108585cff98eeb02bb4f4f800a287e04dd52f03abba4325f2a381e
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1756b6cdf77c2928be961e35efda166cc775b9055a05d892a15d0694cd5990d3
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e3fdb5458b09254ba799a8103f3bdfeaae78cf8e16ddac228e526bb1887f33ba
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/1_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 4.060997486114502,
+      "learning_rate": 2e-05,
+      "loss": 1.5594,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 2.254009962081909,
+      "learning_rate": 2e-05,
+      "loss": 2.394,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 1.4530246257781982,
+      "learning_rate": 2e-05,
+      "loss": 1.1717,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 0.869075357913971,
+      "learning_rate": 2e-05,
+      "loss": 0.6181,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 0.40417155623435974,
+      "learning_rate": 2e-05,
+      "loss": 0.7947,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 0.7273326516151428,
+      "learning_rate": 2e-05,
+      "loss": 1.2993,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 0.7000077366828918,
+      "learning_rate": 2e-05,
+      "loss": 0.9332,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 0.7522069811820984,
+      "learning_rate": 2e-05,
+      "loss": 1.0824,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 0.9031182527542114,
+      "learning_rate": 2e-05,
+      "loss": 0.9363,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 1.0295480489730835,
+      "learning_rate": 2e-05,
+      "loss": 1.4712,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 0.9623363614082336,
+      "learning_rate": 2e-05,
+      "loss": 1.1707,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 0.3788335621356964,
+      "learning_rate": 2e-05,
+      "loss": 1.1249,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 0.9554972648620605,
+      "learning_rate": 2e-05,
+      "loss": 0.77,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 3.608424425125122,
+      "learning_rate": 2e-05,
+      "loss": 1.8768,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 1.3351783752441406,
+      "learning_rate": 2e-05,
+      "loss": 1.1167,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 0.9246235489845276,
+      "learning_rate": 2e-05,
+      "loss": 0.5636,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 0.8108372688293457,
+      "learning_rate": 2e-05,
+      "loss": 0.6283,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 2.429359197616577,
+      "learning_rate": 2e-05,
+      "loss": 0.6775,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 1.0958515405654907,
+      "learning_rate": 2e-05,
+      "loss": 0.6208,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 0.9364616870880127,
+      "learning_rate": 2e-05,
+      "loss": 0.9213,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 2.9376447200775146,
+      "learning_rate": 2e-05,
+      "loss": 1.0253,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 0.9935062527656555,
+      "learning_rate": 2e-05,
+      "loss": 1.875,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 0.5480442643165588,
+      "learning_rate": 2e-05,
+      "loss": 0.5909,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 0.5784210562705994,
+      "learning_rate": 2e-05,
+      "loss": 0.8151,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 1.056527018547058,
+      "learning_rate": 2e-05,
+      "loss": 0.7226,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.8988001346588135,
+      "learning_rate": 2e-05,
+      "loss": 1.1636,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 3.2083346843719482,
+      "learning_rate": 2e-05,
+      "loss": 1.0256,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 1.1363922357559204,
+      "learning_rate": 2e-05,
+      "loss": 1.3127,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 3.8423314094543457,
+      "learning_rate": 2e-05,
+      "loss": 1.725,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 1.043357253074646,
+      "learning_rate": 2e-05,
+      "loss": 1.1183,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 3.4112141132354736,
+      "learning_rate": 2e-05,
+      "loss": 1.4553,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 0.9900936484336853,
+      "learning_rate": 2e-05,
+      "loss": 0.6987,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.8460667133331299,
+      "learning_rate": 2e-05,
+      "loss": 1.2903,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 0.4582524299621582,
+      "learning_rate": 2e-05,
+      "loss": 1.0396,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 1.4106889963150024,
+      "learning_rate": 2e-05,
+      "loss": 1.1477,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 1.5957890748977661,
+      "learning_rate": 2e-05,
+      "loss": 1.1479,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 0.9033636450767517,
+      "learning_rate": 2e-05,
+      "loss": 1.3359,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 0.7324110269546509,
+      "learning_rate": 2e-05,
+      "loss": 0.7437,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 1.1791794300079346,
+      "learning_rate": 2e-05,
+      "loss": 1.2022,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 0.4742436707019806,
+      "learning_rate": 2e-05,
+      "loss": 0.7892,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 1.18353271484375,
+      "learning_rate": 2e-05,
+      "loss": 1.077,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 0.9750029444694519,
+      "learning_rate": 2e-05,
+      "loss": 0.9788,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 2.6100590229034424,
+      "learning_rate": 2e-05,
+      "loss": 1.4546,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 0.9122608304023743,
+      "learning_rate": 2e-05,
+      "loss": 0.6003,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.024173617362976,
+      "learning_rate": 2e-05,
+      "loss": 0.7366,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 0.7152318954467773,
+      "learning_rate": 2e-05,
+      "loss": 0.5065,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 1.7300605773925781,
+      "learning_rate": 2e-05,
+      "loss": 1.4227,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 1.2942312955856323,
+      "learning_rate": 2e-05,
+      "loss": 0.9952,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 1.3522822525616128e+16,
+      "train_loss": 1.072485186390041,
+      "train_runtime": 318.3533,
+      "train_samples_per_second": 1.219,
+      "train_steps_per_second": 0.305
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.3522822525616128e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:502b1f2466482d60ae4368748bd2bbb748c1eef0763cc3198c7c6693b693cda2
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e029bd4f689e14cf52f62173c28505256fdf4c36180fcbd2dce37e046ed0aea4
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9bae73bf0f0ce33ecd007f09d6bc20372df66c432233a979da77558ee0562266
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6efdd67bba7b9f92913a0a5f78a80c0d2f37330882a17c1d4c937e8821b62c1
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:680cc48edce4581b07b94077943e4d9e9f8e437962c27221e4f5579517ee781a
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:95325cb63bcc0510e8cdf48f2026637a13810fa472c8d4fa373deebf0c544b94
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b7742c3fe0f7d965875edeb90a118edb19499505b66dc7526653285401f38a4d
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:04669bd514938a07c8c573fd80110f73a858b311023e7a52be912ff48f82d6bb
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/2_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 2.7177300453186035,
+      "learning_rate": 2e-05,
+      "loss": 1.0926,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 1.6555100679397583,
+      "learning_rate": 2e-05,
+      "loss": 0.6273,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 4.007697105407715,
+      "learning_rate": 2e-05,
+      "loss": 2.815,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 1.5810902118682861,
+      "learning_rate": 2e-05,
+      "loss": 0.7118,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 2.4874520301818848,
+      "learning_rate": 2e-05,
+      "loss": 1.5025,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 1.162537693977356,
+      "learning_rate": 2e-05,
+      "loss": 0.3331,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 3.231822967529297,
+      "learning_rate": 2e-05,
+      "loss": 0.7719,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 0.9158895015716553,
+      "learning_rate": 2e-05,
+      "loss": 0.6472,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 2.0289742946624756,
+      "learning_rate": 2e-05,
+      "loss": 0.7641,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 3.32369327545166,
+      "learning_rate": 2e-05,
+      "loss": 1.0675,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 1.4045751094818115,
+      "learning_rate": 2e-05,
+      "loss": 0.9268,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 0.6414214968681335,
+      "learning_rate": 2e-05,
+      "loss": 0.5625,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 2.570258140563965,
+      "learning_rate": 2e-05,
+      "loss": 0.7383,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 1.839545488357544,
+      "learning_rate": 2e-05,
+      "loss": 1.7098,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 1.3686957359313965,
+      "learning_rate": 2e-05,
+      "loss": 0.596,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 1.3215398788452148,
+      "learning_rate": 2e-05,
+      "loss": 0.3943,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 1.1492276191711426,
+      "learning_rate": 2e-05,
+      "loss": 0.8084,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 0.21739822626113892,
+      "learning_rate": 2e-05,
+      "loss": 0.5349,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 0.766031801700592,
+      "learning_rate": 2e-05,
+      "loss": 0.2763,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 1.4358357191085815,
+      "learning_rate": 2e-05,
+      "loss": 1.0408,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 8.695076942443848,
+      "learning_rate": 2e-05,
+      "loss": 2.4291,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 1.2179341316223145,
+      "learning_rate": 2e-05,
+      "loss": 0.5597,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 2.2541961669921875,
+      "learning_rate": 2e-05,
+      "loss": 2.0812,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 1.579424500465393,
+      "learning_rate": 2e-05,
+      "loss": 1.7606,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 1.6125601530075073,
+      "learning_rate": 2e-05,
+      "loss": 1.0159,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.2814699709415436,
+      "learning_rate": 2e-05,
+      "loss": 0.3651,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 2.234740734100342,
+      "learning_rate": 2e-05,
+      "loss": 0.846,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 3.462404489517212,
+      "learning_rate": 2e-05,
+      "loss": 1.4232,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 1.109181523323059,
+      "learning_rate": 2e-05,
+      "loss": 0.7863,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 2.8189926147460938,
+      "learning_rate": 2e-05,
+      "loss": 0.6734,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 1.4701120853424072,
+      "learning_rate": 2e-05,
+      "loss": 0.7984,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 1.5160466432571411,
+      "learning_rate": 2e-05,
+      "loss": 0.8513,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.2065556049346924,
+      "learning_rate": 2e-05,
+      "loss": 0.4933,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 0.5657169818878174,
+      "learning_rate": 2e-05,
+      "loss": 0.3078,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 5.390564441680908,
+      "learning_rate": 2e-05,
+      "loss": 2.9097,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 1.6399439573287964,
+      "learning_rate": 2e-05,
+      "loss": 0.8537,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 0.35270068049430847,
+      "learning_rate": 2e-05,
+      "loss": 0.2654,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 5.137968063354492,
+      "learning_rate": 2e-05,
+      "loss": 1.5669,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 1.5322946310043335,
+      "learning_rate": 2e-05,
+      "loss": 0.874,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 2.5663018226623535,
+      "learning_rate": 2e-05,
+      "loss": 1.0716,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 3.668062925338745,
+      "learning_rate": 2e-05,
+      "loss": 0.6671,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 0.857315182685852,
+      "learning_rate": 2e-05,
+      "loss": 0.3661,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 0.98568195104599,
+      "learning_rate": 2e-05,
+      "loss": 0.67,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 0.703881561756134,
+      "learning_rate": 2e-05,
+      "loss": 0.4057,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.4584002494812012,
+      "learning_rate": 2e-05,
+      "loss": 0.5015,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 2.263429880142212,
+      "learning_rate": 2e-05,
+      "loss": 1.0602,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 3.9899234771728516,
+      "learning_rate": 2e-05,
+      "loss": 0.708,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 2.3671796321868896,
+      "learning_rate": 2e-05,
+      "loss": 1.3029,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 1.5329114357497856e+16,
+      "train_loss": 0.9428910275095517,
+      "train_runtime": 354.7806,
+      "train_samples_per_second": 1.094,
+      "train_steps_per_second": 0.273
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.5329114357497856e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cedddde0d3b47f691a44fb56df8c587e70ec3e2d98120c9fef229d4e305135b3
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7b935a7315d7aba3f970d2155591a7c025d5e00762112fe9047b296da732a3b5
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:925479cb7b9cfbe13025d105ef9e24aa527cc08e95edb4a5d57f2b34856d503d
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:66d397dbb4d650578c2060e73c064390a986d117f67a0fed4b60758c4ec0bd7d
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b453f3c79b662bca0906bc6969023a652f1fd620cf5b08fc3ef0e5e309f5b990
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a92e1016a632bfe164e293aeb7642d2dfbae7090da04ac409a8a7c4e00fc4226
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:222f280a081854656a1d7ef5f4fb2683f19a421ee895ac0cdae8b26f64893669
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:77bfb8ce9a4a7531fec21d951852d3dbfc5b9546e416285abdd478013d712647
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/3_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 0.7246163487434387,
+      "learning_rate": 2e-05,
+      "loss": 1.7324,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 0.5284512042999268,
+      "learning_rate": 2e-05,
+      "loss": 2.0166,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 0.49521467089653015,
+      "learning_rate": 2e-05,
+      "loss": 1.3906,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 0.5752606987953186,
+      "learning_rate": 2e-05,
+      "loss": 1.1865,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 0.5735695362091064,
+      "learning_rate": 2e-05,
+      "loss": 1.6631,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 0.35247695446014404,
+      "learning_rate": 2e-05,
+      "loss": 1.5771,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 0.7416431903839111,
+      "learning_rate": 2e-05,
+      "loss": 1.45,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 0.8636322021484375,
+      "learning_rate": 2e-05,
+      "loss": 1.3813,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 0.6410114765167236,
+      "learning_rate": 2e-05,
+      "loss": 1.6523,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 0.35148540139198303,
+      "learning_rate": 2e-05,
+      "loss": 1.5771,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 0.5244173407554626,
+      "learning_rate": 2e-05,
+      "loss": 1.5553,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 0.6992729306221008,
+      "learning_rate": 2e-05,
+      "loss": 1.7803,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 0.430820494890213,
+      "learning_rate": 2e-05,
+      "loss": 1.6299,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 0.4983491003513336,
+      "learning_rate": 2e-05,
+      "loss": 1.321,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 0.45274442434310913,
+      "learning_rate": 2e-05,
+      "loss": 1.4834,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 0.653442919254303,
+      "learning_rate": 2e-05,
+      "loss": 1.5889,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 0.42392614483833313,
+      "learning_rate": 2e-05,
+      "loss": 1.3359,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 0.49543508887290955,
+      "learning_rate": 2e-05,
+      "loss": 1.7627,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 0.4652840793132782,
+      "learning_rate": 2e-05,
+      "loss": 1.4604,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 0.6317560076713562,
+      "learning_rate": 2e-05,
+      "loss": 1.6349,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 0.5806442499160767,
+      "learning_rate": 2e-05,
+      "loss": 1.6519,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 0.568714439868927,
+      "learning_rate": 2e-05,
+      "loss": 1.4482,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 0.6616501808166504,
+      "learning_rate": 2e-05,
+      "loss": 1.5454,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 1.0585500001907349,
+      "learning_rate": 2e-05,
+      "loss": 1.6943,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 0.5242922306060791,
+      "learning_rate": 2e-05,
+      "loss": 1.5273,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.6620081067085266,
+      "learning_rate": 2e-05,
+      "loss": 1.6641,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 0.8729976415634155,
+      "learning_rate": 2e-05,
+      "loss": 1.3711,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 0.5533149838447571,
+      "learning_rate": 2e-05,
+      "loss": 1.5024,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 0.6843786239624023,
+      "learning_rate": 2e-05,
+      "loss": 1.221,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 0.6899279952049255,
+      "learning_rate": 2e-05,
+      "loss": 1.6211,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 0.8329319357872009,
+      "learning_rate": 2e-05,
+      "loss": 1.4404,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 0.557767391204834,
+      "learning_rate": 2e-05,
+      "loss": 1.4336,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 0.34819966554641724,
+      "learning_rate": 2e-05,
+      "loss": 1.3477,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 0.7103057503700256,
+      "learning_rate": 2e-05,
+      "loss": 1.5186,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 0.5542501211166382,
+      "learning_rate": 2e-05,
+      "loss": 1.4287,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 0.5763942003250122,
+      "learning_rate": 2e-05,
+      "loss": 1.1259,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 0.7207664847373962,
+      "learning_rate": 2e-05,
+      "loss": 1.3911,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 0.3724093437194824,
+      "learning_rate": 2e-05,
+      "loss": 1.0917,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 0.7380734086036682,
+      "learning_rate": 2e-05,
+      "loss": 1.4736,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 0.7758538722991943,
+      "learning_rate": 2e-05,
+      "loss": 1.9409,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 1.419058084487915,
+      "learning_rate": 2e-05,
+      "loss": 1.0337,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 1.1800168752670288,
+      "learning_rate": 2e-05,
+      "loss": 1.5811,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 1.0631232261657715,
+      "learning_rate": 2e-05,
+      "loss": 1.6145,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 0.35026878118515015,
+      "learning_rate": 2e-05,
+      "loss": 1.313,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.1856135129928589,
+      "learning_rate": 2e-05,
+      "loss": 1.0017,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 0.42485421895980835,
+      "learning_rate": 2e-05,
+      "loss": 0.7556,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 1.0420420169830322,
+      "learning_rate": 2e-05,
+      "loss": 1.2177,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 3.806156873703003,
+      "learning_rate": 2e-05,
+      "loss": 1.3557,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 2.080121124238131e+16,
+      "train_loss": 1.4653891337286566,
+      "train_runtime": 338.7153,
+      "train_samples_per_second": 1.146,
+      "train_steps_per_second": 0.286
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.080121124238131e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:78497632d8d36d7c8168d50e50a254157fc769f9322543ee181269094d28c724
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:162cde5be279d581b1f83ee039cc749ade6ab4ab374af926bad62c033d1dfba4
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:97d4a68f4353dabd81f17a777377c46d55712b0b65c491aa7fbfdbbbdf077a66
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7738f10699765a7bc84949fc0529653275795f44b59cfcc9ca3fcedaea62efcb
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6fec5310decb3f5a8a11e6204443c2e3c9371d7d258ede1f21b69d71da6ae563
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bcb887b29c54ad36b3482c04658bef8c0c28760138560e9ef4edcd885bf7c3b8
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:04ac06241cdb5fb3b5ea1ce74c2d4a77507ba600b8cb9b1ee6f62ef1e75be7b7
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4f8f0fe1e2e6495fc31e76e3cb7514d92d767bdc152b3aa1e3379ff7f8810311
+size 791576546

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/4_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 1.5516194105148315,
+      "learning_rate": 2e-05,
+      "loss": 0.7183,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 1.6191949844360352,
+      "learning_rate": 2e-05,
+      "loss": 1.0957,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 1.2471156120300293,
+      "learning_rate": 2e-05,
+      "loss": 0.7448,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 3.331115484237671,
+      "learning_rate": 2e-05,
+      "loss": 0.8217,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 4.650871276855469,
+      "learning_rate": 2e-05,
+      "loss": 3.3426,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 3.3392367362976074,
+      "learning_rate": 2e-05,
+      "loss": 1.2304,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 0.18230539560317993,
+      "learning_rate": 2e-05,
+      "loss": 0.8133,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 1.041199803352356,
+      "learning_rate": 2e-05,
+      "loss": 1.1371,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 0.7668745517730713,
+      "learning_rate": 2e-05,
+      "loss": 0.9596,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 2.2554526329040527,
+      "learning_rate": 2e-05,
+      "loss": 1.6985,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 0.37597593665122986,
+      "learning_rate": 2e-05,
+      "loss": 0.9554,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 1.1484178304672241,
+      "learning_rate": 2e-05,
+      "loss": 1.4816,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 0.9884140491485596,
+      "learning_rate": 2e-05,
+      "loss": 1.0887,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 2.5340919494628906,
+      "learning_rate": 2e-05,
+      "loss": 1.1622,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 3.164740562438965,
+      "learning_rate": 2e-05,
+      "loss": 2.0013,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 1.7155555486679077,
+      "learning_rate": 2e-05,
+      "loss": 1.2095,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 0.952375054359436,
+      "learning_rate": 2e-05,
+      "loss": 0.8851,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 2.5268073081970215,
+      "learning_rate": 2e-05,
+      "loss": 1.4144,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 3.838146924972534,
+      "learning_rate": 2e-05,
+      "loss": 1.3506,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 1.9546507596969604,
+      "learning_rate": 2e-05,
+      "loss": 1.6561,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 1.979039192199707,
+      "learning_rate": 2e-05,
+      "loss": 0.8316,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 1.025802731513977,
+      "learning_rate": 2e-05,
+      "loss": 1.9942,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 0.5559583902359009,
+      "learning_rate": 2e-05,
+      "loss": 1.0033,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 0.6625217199325562,
+      "learning_rate": 2e-05,
+      "loss": 0.7507,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 4.655178070068359,
+      "learning_rate": 2e-05,
+      "loss": 1.1542,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.9145403504371643,
+      "learning_rate": 2e-05,
+      "loss": 1.3025,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 1.8665916919708252,
+      "learning_rate": 2e-05,
+      "loss": 1.5428,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 1.5650798082351685,
+      "learning_rate": 2e-05,
+      "loss": 1.4144,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 2.973200559616089,
+      "learning_rate": 2e-05,
+      "loss": 1.6578,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 2.3732833862304688,
+      "learning_rate": 2e-05,
+      "loss": 1.0927,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 1.011518120765686,
+      "learning_rate": 2e-05,
+      "loss": 0.7655,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 2.6628100872039795,
+      "learning_rate": 2e-05,
+      "loss": 1.0994,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.2325425148010254,
+      "learning_rate": 2e-05,
+      "loss": 1.7863,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 0.7516754865646362,
+      "learning_rate": 2e-05,
+      "loss": 0.6101,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 0.32088345289230347,
+      "learning_rate": 2e-05,
+      "loss": 1.3487,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 1.3543070554733276,
+      "learning_rate": 2e-05,
+      "loss": 1.4045,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 2.9448294639587402,
+      "learning_rate": 2e-05,
+      "loss": 1.6153,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 1.3423410654067993,
+      "learning_rate": 2e-05,
+      "loss": 0.9661,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 1.4557067155838013,
+      "learning_rate": 2e-05,
+      "loss": 0.5707,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 0.8707636594772339,
+      "learning_rate": 2e-05,
+      "loss": 0.7858,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 0.8935154676437378,
+      "learning_rate": 2e-05,
+      "loss": 0.9482,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 1.1275886297225952,
+      "learning_rate": 2e-05,
+      "loss": 0.8253,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 1.0190774202346802,
+      "learning_rate": 2e-05,
+      "loss": 1.3923,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 2.239851236343384,
+      "learning_rate": 2e-05,
+      "loss": 1.8538,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 0.48686838150024414,
+      "learning_rate": 2e-05,
+      "loss": 0.5748,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 2.387908458709717,
+      "learning_rate": 2e-05,
+      "loss": 1.2788,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 1.8753933906555176,
+      "learning_rate": 2e-05,
+      "loss": 2.16,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 1.7403647899627686,
+      "learning_rate": 2e-05,
+      "loss": 1.7309,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 1.975033480085504e+16,
+      "train_loss": 1.2463067905190064,
+      "train_runtime": 346.1883,
+      "train_samples_per_second": 1.121,
+      "train_steps_per_second": 0.28
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.975033480085504e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d9cb7c5fddaca66205242d49af22fb676315f063b1cc2418d18fa177390924f2
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:46eade7f1fea0f1e68e3363d9a8e4ff52e5b7305d34a81ea1379557122759d20
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b086fbc699e0302ee4ae254a9237a6f8d5448810e5885c35f09b7692fb3ba4ee
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e663701e0f36fb7a017f31c1bc0702e47930c84858f19bff02e2417a980ea566
+size 791578182

client_states_feddualMultipqfullfreezeA2_NEWAensureOrth_Bcca_T05_freq10_bs4_saveoptim_lr2e-5_5e-5_sc132_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d332bf7bdd3e9cae1a94a5236886a591c59c6ce26033bc733ef93822982945ba
+size 791576546