thkim0305
/

feddat_baselines

Model card Files Files and versions Community

thkim0305 committed on 13 days ago

Commit

36aa57a

verified ·

1 Parent(s): aeccb48

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_trainer_state.json +378 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_trainer_state.json +378 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_trainer_state.json +378 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_trainer_state.json +378 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_trainer_state.json +378 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/5_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/5_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/5_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/5_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/5_client_model_round2.pth +3 -0

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ac6e3c20c9ce2b3bd22a4ec405cfe0e9c4823d415ddd9d0a1432c7f7a7821ab6
+size 369838470

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d9faab1abc5585336f9c5217cbf9229feae7f158d14775ec6b0465ecdcd6b72c
+size 369838470

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b911d7298ebdb70e1147918b61c660749e1a0eb1428cf862812392dc3e79ee0
+size 369838470

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99c914f9fec69d46834a0247afa323ef2d204838bfc58478b2b70b659c6c7837
+size 369838470

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:43cd654d47bea4a0664e185ffcb76f37acdef0f55d2203b478aee301074cec65
+size 369837282

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:482a35fcc3ebc3cf030093ca637eeb0b4f1a908aa49998263fd26a4f21738ec7
+size 369838470

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:abab9ede2af77a1461e2d522138e4f5e882bed4af399616ec0dd66577cfdc753
+size 369837282

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5f38813bfe5d6e1f323702ba4809bf6db6af166cb14a2717a8eb9f1ef775cdc1
+size 369837282

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/0_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 1.2302707433700562,
+      "learning_rate": 2e-05,
+      "loss": 0.6424,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 1.6121233701705933,
+      "learning_rate": 2e-05,
+      "loss": 1.0052,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 1.4117467403411865,
+      "learning_rate": 2e-05,
+      "loss": 1.005,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 3.630777359008789,
+      "learning_rate": 2e-05,
+      "loss": 1.6888,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 0.9374276995658875,
+      "learning_rate": 2e-05,
+      "loss": 0.7314,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 0.9001209139823914,
+      "learning_rate": 2e-05,
+      "loss": 0.6316,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 0.801906168460846,
+      "learning_rate": 2e-05,
+      "loss": 0.9834,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 1.1132997274398804,
+      "learning_rate": 2e-05,
+      "loss": 1.3636,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 1.1756536960601807,
+      "learning_rate": 2e-05,
+      "loss": 0.3419,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 2.3688271045684814,
+      "learning_rate": 2e-05,
+      "loss": 0.8968,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 8.31472110748291,
+      "learning_rate": 2e-05,
+      "loss": 0.8141,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 1.499045491218567,
+      "learning_rate": 2e-05,
+      "loss": 0.5582,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 2.175128936767578,
+      "learning_rate": 2e-05,
+      "loss": 1.2834,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 1.3025474548339844,
+      "learning_rate": 2e-05,
+      "loss": 0.898,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 1.6166173219680786,
+      "learning_rate": 2e-05,
+      "loss": 1.2673,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 0.9590756297111511,
+      "learning_rate": 2e-05,
+      "loss": 1.3175,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 1.4882543087005615,
+      "learning_rate": 2e-05,
+      "loss": 0.6644,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 1.2179570198059082,
+      "learning_rate": 2e-05,
+      "loss": 0.7493,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 1.3930878639221191,
+      "learning_rate": 2e-05,
+      "loss": 0.7374,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 2.189868688583374,
+      "learning_rate": 2e-05,
+      "loss": 0.9137,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 1.1282020807266235,
+      "learning_rate": 2e-05,
+      "loss": 1.6859,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 1.5559532642364502,
+      "learning_rate": 2e-05,
+      "loss": 0.528,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 2.0104541778564453,
+      "learning_rate": 2e-05,
+      "loss": 0.9586,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 4.215638637542725,
+      "learning_rate": 2e-05,
+      "loss": 1.0792,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 3.2594962120056152,
+      "learning_rate": 2e-05,
+      "loss": 1.2841,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.7323676943778992,
+      "learning_rate": 2e-05,
+      "loss": 0.0893,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 1.5159685611724854,
+      "learning_rate": 2e-05,
+      "loss": 1.5317,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 4.473369598388672,
+      "learning_rate": 2e-05,
+      "loss": 1.2966,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 5.313100337982178,
+      "learning_rate": 2e-05,
+      "loss": 0.911,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 2.3561482429504395,
+      "learning_rate": 2e-05,
+      "loss": 0.8127,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 2.3545758724212646,
+      "learning_rate": 2e-05,
+      "loss": 0.7019,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 7.38244104385376,
+      "learning_rate": 2e-05,
+      "loss": 0.86,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.3104522228240967,
+      "learning_rate": 2e-05,
+      "loss": 0.3289,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 2.5590906143188477,
+      "learning_rate": 2e-05,
+      "loss": 0.8105,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 4.937007427215576,
+      "learning_rate": 2e-05,
+      "loss": 1.1369,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 6.499209880828857,
+      "learning_rate": 2e-05,
+      "loss": 0.8859,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 6.662985801696777,
+      "learning_rate": 2e-05,
+      "loss": 0.5822,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 1.9580082893371582,
+      "learning_rate": 2e-05,
+      "loss": 1.1448,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 1.697409749031067,
+      "learning_rate": 2e-05,
+      "loss": 0.8685,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 9.267684936523438,
+      "learning_rate": 2e-05,
+      "loss": 2.1197,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 0.6946778297424316,
+      "learning_rate": 2e-05,
+      "loss": 0.6537,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 4.137977600097656,
+      "learning_rate": 2e-05,
+      "loss": 1.5048,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 2.1147782802581787,
+      "learning_rate": 2e-05,
+      "loss": 0.9791,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 2.045584201812744,
+      "learning_rate": 2e-05,
+      "loss": 0.5647,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.7340083122253418,
+      "learning_rate": 2e-05,
+      "loss": 1.0669,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 2.2718918323516846,
+      "learning_rate": 2e-05,
+      "loss": 1.3045,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 2.3538527488708496,
+      "learning_rate": 2e-05,
+      "loss": 0.7428,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 1.2346324920654297,
+      "learning_rate": 2e-05,
+      "loss": 0.5767,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 5656240185147392.0,
+      "train_loss": 0.9453033073661253,
+      "train_runtime": 235.4567,
+      "train_samples_per_second": 1.648,
+      "train_steps_per_second": 0.412
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5656240185147392.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4eb57f4da4d9af2c8f88eec2c68cce411eb4ace1cd7b4b8c6cfcb2932e44e1af
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:599c1c0f44c2450b50611cbf10979f3176c7fb5c97b9994e162e9afbe6589e1e
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:61bc0585554474b7a6c7a46de7c089e6d367f8d84a3f2082dda108068613b90a
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a364994d7ccff9361b49b861cbbf4336eb34dd9e46c7921c637fa2c7a9532a6a
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c6d174170815e6f16f125a4b43e29ade7e900a8e7534df2954323e02bae74339
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:085787736ea4d59641527424baeb286c6851230bafe4e1c92069427d0e2fe907
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b4319cfba2f0947e6c39dae27f1f6e85fe0967d560cf49a26499af35aeba4b27
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3091e8b368a7015e0b43b5db1be0a826707a5eb9ae318b117c885ee90397875a
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/1_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 0.8781272172927856,
+      "learning_rate": 2e-05,
+      "loss": 0.8515,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 4.043600082397461,
+      "learning_rate": 2e-05,
+      "loss": 1.9452,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 1.0472830533981323,
+      "learning_rate": 2e-05,
+      "loss": 0.6496,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 1.3015058040618896,
+      "learning_rate": 2e-05,
+      "loss": 0.5628,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 0.2546836733818054,
+      "learning_rate": 2e-05,
+      "loss": 0.5908,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 2.3884270191192627,
+      "learning_rate": 2e-05,
+      "loss": 1.1725,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 1.4381201267242432,
+      "learning_rate": 2e-05,
+      "loss": 0.827,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 1.5257450342178345,
+      "learning_rate": 2e-05,
+      "loss": 1.3457,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 1.5005308389663696,
+      "learning_rate": 2e-05,
+      "loss": 1.1501,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 1.9017939567565918,
+      "learning_rate": 2e-05,
+      "loss": 1.8049,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 1.4530093669891357,
+      "learning_rate": 2e-05,
+      "loss": 0.8718,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 0.9238858819007874,
+      "learning_rate": 2e-05,
+      "loss": 1.1926,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 1.5560870170593262,
+      "learning_rate": 2e-05,
+      "loss": 0.8745,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 3.8156371116638184,
+      "learning_rate": 2e-05,
+      "loss": 1.4656,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 2.274550199508667,
+      "learning_rate": 2e-05,
+      "loss": 1.2095,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 2.0850868225097656,
+      "learning_rate": 2e-05,
+      "loss": 0.546,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 1.1981834173202515,
+      "learning_rate": 2e-05,
+      "loss": 0.5663,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 5.242424011230469,
+      "learning_rate": 2e-05,
+      "loss": 0.7796,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 1.4221488237380981,
+      "learning_rate": 2e-05,
+      "loss": 0.5759,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 1.140813946723938,
+      "learning_rate": 2e-05,
+      "loss": 0.8574,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 2.981257200241089,
+      "learning_rate": 2e-05,
+      "loss": 0.6415,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 2.198453187942505,
+      "learning_rate": 2e-05,
+      "loss": 1.9304,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 0.601679801940918,
+      "learning_rate": 2e-05,
+      "loss": 0.4595,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 1.553512692451477,
+      "learning_rate": 2e-05,
+      "loss": 0.9711,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 2.1878437995910645,
+      "learning_rate": 2e-05,
+      "loss": 0.7843,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 1.1170060634613037,
+      "learning_rate": 2e-05,
+      "loss": 1.3049,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 3.8993043899536133,
+      "learning_rate": 2e-05,
+      "loss": 1.1269,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 3.7384300231933594,
+      "learning_rate": 2e-05,
+      "loss": 1.3041,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 4.556199550628662,
+      "learning_rate": 2e-05,
+      "loss": 1.5492,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 1.3752775192260742,
+      "learning_rate": 2e-05,
+      "loss": 1.0508,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 5.783763885498047,
+      "learning_rate": 2e-05,
+      "loss": 1.7019,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 1.1487605571746826,
+      "learning_rate": 2e-05,
+      "loss": 0.7288,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 2.0315375328063965,
+      "learning_rate": 2e-05,
+      "loss": 1.0151,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 1.0512689352035522,
+      "learning_rate": 2e-05,
+      "loss": 1.0146,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 2.663738250732422,
+      "learning_rate": 2e-05,
+      "loss": 1.2133,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 2.6531965732574463,
+      "learning_rate": 2e-05,
+      "loss": 0.8632,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 2.310678243637085,
+      "learning_rate": 2e-05,
+      "loss": 1.6255,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 1.3333702087402344,
+      "learning_rate": 2e-05,
+      "loss": 0.8103,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 2.0063538551330566,
+      "learning_rate": 2e-05,
+      "loss": 1.2381,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 0.6322288513183594,
+      "learning_rate": 2e-05,
+      "loss": 0.584,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 1.8914169073104858,
+      "learning_rate": 2e-05,
+      "loss": 1.0259,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 2.7294955253601074,
+      "learning_rate": 2e-05,
+      "loss": 0.9706,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 3.710840940475464,
+      "learning_rate": 2e-05,
+      "loss": 1.2648,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 1.3264449834823608,
+      "learning_rate": 2e-05,
+      "loss": 0.5923,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.280088186264038,
+      "learning_rate": 2e-05,
+      "loss": 0.6826,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 0.8928223252296448,
+      "learning_rate": 2e-05,
+      "loss": 0.5134,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 4.573293209075928,
+      "learning_rate": 2e-05,
+      "loss": 1.0831,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 2.4279978275299072,
+      "learning_rate": 2e-05,
+      "loss": 1.0474,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 1.3528534647570432e+16,
+      "train_loss": 1.0155205480831186,
+      "train_runtime": 413.9788,
+      "train_samples_per_second": 0.937,
+      "train_steps_per_second": 0.234
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.3528534647570432e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e41781055739cec33a2f49d21003d32c53009bfc48cb66d73c87eaf6b9828f6
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:470dcb87433ec035468bec134fe6c4d50e8a8f668c2c833a26ea926f11dbf049
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f1640ce7785ab8e8e7902397e1908cbfc1011e1d5154f0e12e336affd18cd2cf
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3338370d88d25ad5a15f7a9160a5b9c280ec60de889a0caceb9ece4f4b6237a4
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:41bf4f1754b8137517a3a1f7c53e997d179bcddef4baab07d74c51e28d2ad3df
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f7857f8fb11d2880bf457dd12ed9ca204bf7a5eef168bdcd8d1a2fc6735c0b71
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc09018e2a00817778162596d3f9610e71a8a13be41391723e59f72c0c2f0b8a
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0652fdc81a19c58e14361714085bcb4172d17ffa522ffa2967dd41e5f98fe357
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/2_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 2.2005271911621094,
+      "learning_rate": 2e-05,
+      "loss": 0.5353,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 2.829289436340332,
+      "learning_rate": 2e-05,
+      "loss": 0.5587,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 2.785386562347412,
+      "learning_rate": 2e-05,
+      "loss": 2.5733,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 1.3352482318878174,
+      "learning_rate": 2e-05,
+      "loss": 0.3653,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 3.0877790451049805,
+      "learning_rate": 2e-05,
+      "loss": 1.2587,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 0.9194437265396118,
+      "learning_rate": 2e-05,
+      "loss": 0.605,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 1.778803825378418,
+      "learning_rate": 2e-05,
+      "loss": 0.4535,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 2.219306230545044,
+      "learning_rate": 2e-05,
+      "loss": 0.733,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 3.0522265434265137,
+      "learning_rate": 2e-05,
+      "loss": 0.8598,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 1.7349960803985596,
+      "learning_rate": 2e-05,
+      "loss": 0.6239,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 2.6168980598449707,
+      "learning_rate": 2e-05,
+      "loss": 0.6977,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 0.6964139938354492,
+      "learning_rate": 2e-05,
+      "loss": 0.5198,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 2.2305409908294678,
+      "learning_rate": 2e-05,
+      "loss": 0.6052,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 2.8250887393951416,
+      "learning_rate": 2e-05,
+      "loss": 1.6726,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 1.5621683597564697,
+      "learning_rate": 2e-05,
+      "loss": 0.6449,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 1.7774029970169067,
+      "learning_rate": 2e-05,
+      "loss": 0.3363,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 1.4394720792770386,
+      "learning_rate": 2e-05,
+      "loss": 1.1173,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 0.6797069311141968,
+      "learning_rate": 2e-05,
+      "loss": 0.6117,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 0.983581006526947,
+      "learning_rate": 2e-05,
+      "loss": 0.2687,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 2.0993242263793945,
+      "learning_rate": 2e-05,
+      "loss": 0.9805,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 11.079167366027832,
+      "learning_rate": 2e-05,
+      "loss": 1.5928,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 2.051191806793213,
+      "learning_rate": 2e-05,
+      "loss": 0.5769,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 3.372947931289673,
+      "learning_rate": 2e-05,
+      "loss": 1.0517,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 2.3665897846221924,
+      "learning_rate": 2e-05,
+      "loss": 1.9332,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 2.36680269241333,
+      "learning_rate": 2e-05,
+      "loss": 1.1949,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.713635265827179,
+      "learning_rate": 2e-05,
+      "loss": 0.3461,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 3.4997355937957764,
+      "learning_rate": 2e-05,
+      "loss": 1.4795,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 6.203523635864258,
+      "learning_rate": 2e-05,
+      "loss": 1.5504,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 4.314687252044678,
+      "learning_rate": 2e-05,
+      "loss": 0.7256,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 4.574437618255615,
+      "learning_rate": 2e-05,
+      "loss": 0.6266,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 3.7229034900665283,
+      "learning_rate": 2e-05,
+      "loss": 0.861,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 2.443660020828247,
+      "learning_rate": 2e-05,
+      "loss": 0.6011,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.8502126932144165,
+      "learning_rate": 2e-05,
+      "loss": 0.4416,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 0.3321700990200043,
+      "learning_rate": 2e-05,
+      "loss": 0.1995,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 4.566008567810059,
+      "learning_rate": 2e-05,
+      "loss": 1.9874,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 2.5475733280181885,
+      "learning_rate": 2e-05,
+      "loss": 0.7815,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 1.5172197818756104,
+      "learning_rate": 2e-05,
+      "loss": 0.2529,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 5.836910724639893,
+      "learning_rate": 2e-05,
+      "loss": 1.6699,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 2.813737392425537,
+      "learning_rate": 2e-05,
+      "loss": 0.9105,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 3.7902021408081055,
+      "learning_rate": 2e-05,
+      "loss": 0.9401,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 5.073143005371094,
+      "learning_rate": 2e-05,
+      "loss": 0.6575,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 0.7925168871879578,
+      "learning_rate": 2e-05,
+      "loss": 0.2744,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 1.4323312044143677,
+      "learning_rate": 2e-05,
+      "loss": 0.7463,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 1.573714256286621,
+      "learning_rate": 2e-05,
+      "loss": 0.4023,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 2.421898126602173,
+      "learning_rate": 2e-05,
+      "loss": 0.4877,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 2.748384714126587,
+      "learning_rate": 2e-05,
+      "loss": 0.759,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 3.4596893787384033,
+      "learning_rate": 2e-05,
+      "loss": 0.4826,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 4.076857089996338,
+      "learning_rate": 2e-05,
+      "loss": 1.2546,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 1.5335589188468736e+16,
+      "train_loss": 0.8459088949813056,
+      "train_runtime": 452.4686,
+      "train_samples_per_second": 0.858,
+      "train_steps_per_second": 0.214
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.5335589188468736e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7c72a9298e90c4a5026adeee75d51a6787039d4083de3ba15eb18a73fcf09a51
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0e253250a37cf6cae5c4dcf7987efc8ebd71581af9371fd266869a69e9d0da10
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:356b3acc7076436eb47f2e906faaa291cf6379c294c0851f177314d7b7c4e0c9
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b3d7b8b4e24255f6052e1820a7a5cf87dfb846bff90e6c974c30d5767be5af55
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2aafa27a73b5f8aee55adc7d15f0e86119bd2d2862a123507854e0d1bf6829e4
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d1af39dc03463a4ca2ff118e308fe0798e6a515c344a632c8f0d4f0b0e5acad8
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:544fa4d1ceead9f40862e2891a05492c06dd059aa8a539bc151fd1380003f039
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:385be361a93fce6f9feb2df719a26a9cc1c43ee1e5e4edfb0184de4ff6f6b13b
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/3_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 2.431029796600342,
+      "learning_rate": 2e-05,
+      "loss": 1.0939,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 0.8722438812255859,
+      "learning_rate": 2e-05,
+      "loss": 0.9552,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 1.1362252235412598,
+      "learning_rate": 2e-05,
+      "loss": 0.6326,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 0.799323320388794,
+      "learning_rate": 2e-05,
+      "loss": 0.9866,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 1.1111527681350708,
+      "learning_rate": 2e-05,
+      "loss": 1.0202,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 1.7144205570220947,
+      "learning_rate": 2e-05,
+      "loss": 0.9727,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 0.9399757981300354,
+      "learning_rate": 2e-05,
+      "loss": 0.468,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 0.7109354138374329,
+      "learning_rate": 2e-05,
+      "loss": 0.4818,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 1.847976565361023,
+      "learning_rate": 2e-05,
+      "loss": 1.0419,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 2.183365821838379,
+      "learning_rate": 2e-05,
+      "loss": 1.4441,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 0.9391213059425354,
+      "learning_rate": 2e-05,
+      "loss": 0.4735,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 0.10097850859165192,
+      "learning_rate": 2e-05,
+      "loss": 0.5644,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 0.9321213960647583,
+      "learning_rate": 2e-05,
+      "loss": 1.1182,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 1.5129534006118774,
+      "learning_rate": 2e-05,
+      "loss": 0.9117,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 1.2945747375488281,
+      "learning_rate": 2e-05,
+      "loss": 1.3779,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 1.1420668363571167,
+      "learning_rate": 2e-05,
+      "loss": 0.8766,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 1.9086567163467407,
+      "learning_rate": 2e-05,
+      "loss": 0.8392,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 1.51237952709198,
+      "learning_rate": 2e-05,
+      "loss": 1.2022,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 1.0951957702636719,
+      "learning_rate": 2e-05,
+      "loss": 1.1245,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 4.724721431732178,
+      "learning_rate": 2e-05,
+      "loss": 1.3685,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 1.6724278926849365,
+      "learning_rate": 2e-05,
+      "loss": 0.7964,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 0.3896200954914093,
+      "learning_rate": 2e-05,
+      "loss": 0.2359,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 0.6976099014282227,
+      "learning_rate": 2e-05,
+      "loss": 0.5979,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 1.113963007926941,
+      "learning_rate": 2e-05,
+      "loss": 0.7774,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 1.4955312013626099,
+      "learning_rate": 2e-05,
+      "loss": 0.999,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 1.4446187019348145,
+      "learning_rate": 2e-05,
+      "loss": 0.3719,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 1.4187099933624268,
+      "learning_rate": 2e-05,
+      "loss": 0.8836,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 0.9385492205619812,
+      "learning_rate": 2e-05,
+      "loss": 1.1007,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 1.1563595533370972,
+      "learning_rate": 2e-05,
+      "loss": 0.4014,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 1.551350474357605,
+      "learning_rate": 2e-05,
+      "loss": 0.6619,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 1.1922292709350586,
+      "learning_rate": 2e-05,
+      "loss": 0.5347,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 0.8667466640472412,
+      "learning_rate": 2e-05,
+      "loss": 0.7007,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.0623116493225098,
+      "learning_rate": 2e-05,
+      "loss": 0.5061,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 0.04590483754873276,
+      "learning_rate": 2e-05,
+      "loss": 0.3285,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 1.00609290599823,
+      "learning_rate": 2e-05,
+      "loss": 0.3451,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 1.5188184976577759,
+      "learning_rate": 2e-05,
+      "loss": 0.6001,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 0.9316257238388062,
+      "learning_rate": 2e-05,
+      "loss": 0.6777,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 1.65702223777771,
+      "learning_rate": 2e-05,
+      "loss": 0.7453,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 1.313071370124817,
+      "learning_rate": 2e-05,
+      "loss": 0.4345,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 0.6534919738769531,
+      "learning_rate": 2e-05,
+      "loss": 0.5735,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 0.32963377237319946,
+      "learning_rate": 2e-05,
+      "loss": 0.1275,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 0.9862601161003113,
+      "learning_rate": 2e-05,
+      "loss": 0.7405,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 4.502978801727295,
+      "learning_rate": 2e-05,
+      "loss": 0.8153,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 1.4814475774765015,
+      "learning_rate": 2e-05,
+      "loss": 0.8128,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.8578946590423584,
+      "learning_rate": 2e-05,
+      "loss": 0.6065,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 1.3685534000396729,
+      "learning_rate": 2e-05,
+      "loss": 0.4277,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 1.3430529832839966,
+      "learning_rate": 2e-05,
+      "loss": 0.7456,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 1.8663636445999146,
+      "learning_rate": 2e-05,
+      "loss": 0.4437,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 2.0809997453623296e+16,
+      "train_loss": 0.7489266002301088,
+      "train_runtime": 524.2746,
+      "train_samples_per_second": 0.74,
+      "train_steps_per_second": 0.185
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.0809997453623296e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7bc7c7424c2df6afa2b5bae3653afdaaad3158911d70013ce6f4f9dcbb554ba0
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8c2424d1e1a49a8f746c7d30ac918d879bbbcae4726650c61cc996ef7b1fe0a8
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3dc9d7da842da98082cf9c2c2fca77b3a7bd5877e8c31ae27e665ca686e55176
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9eca367e33592f4a5962682369f04fb7f40d715e6eaa4faa4d68bee854a8f08a
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aca4fb55c66b3552c4255c8d6323f4e27baabe1cec491853761c693625301042
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8c042ed992d8bc718a05f2f3ff9467b2ccb0dd25243c0e9c40dcfefb933fd495
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cf9f9bbe51dc5519112adbd5447500bf5fef833ee61df5554c859782348e78b5
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:32ff0b5147bbb9f48b017adae43e8b62e0bc9529077070959e498cc382f5470e
+size 794706058

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/4_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 0.3599570095539093,
+      "learning_rate": 2e-05,
+      "loss": 0.2675,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 1.1936863660812378,
+      "learning_rate": 2e-05,
+      "loss": 0.9035,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 1.3883532285690308,
+      "learning_rate": 2e-05,
+      "loss": 0.6571,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 2.7608344554901123,
+      "learning_rate": 2e-05,
+      "loss": 0.4303,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 5.371406078338623,
+      "learning_rate": 2e-05,
+      "loss": 2.1826,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 2.3308653831481934,
+      "learning_rate": 2e-05,
+      "loss": 0.6657,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 0.042726580053567886,
+      "learning_rate": 2e-05,
+      "loss": 0.2714,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 1.8078577518463135,
+      "learning_rate": 2e-05,
+      "loss": 0.893,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 1.4273505210876465,
+      "learning_rate": 2e-05,
+      "loss": 0.9524,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 2.442458152770996,
+      "learning_rate": 2e-05,
+      "loss": 1.1022,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 0.48077863454818726,
+      "learning_rate": 2e-05,
+      "loss": 0.7807,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 1.495241641998291,
+      "learning_rate": 2e-05,
+      "loss": 1.4534,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 1.614429235458374,
+      "learning_rate": 2e-05,
+      "loss": 0.9892,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 1.6893081665039062,
+      "learning_rate": 2e-05,
+      "loss": 0.5477,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 2.3914456367492676,
+      "learning_rate": 2e-05,
+      "loss": 1.8496,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 1.6967483758926392,
+      "learning_rate": 2e-05,
+      "loss": 1.0244,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 3.545107364654541,
+      "learning_rate": 2e-05,
+      "loss": 1.1615,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 1.4850765466690063,
+      "learning_rate": 2e-05,
+      "loss": 1.1958,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 5.655995845794678,
+      "learning_rate": 2e-05,
+      "loss": 1.1793,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 2.4371092319488525,
+      "learning_rate": 2e-05,
+      "loss": 0.8878,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 1.0520563125610352,
+      "learning_rate": 2e-05,
+      "loss": 0.431,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 1.6813929080963135,
+      "learning_rate": 2e-05,
+      "loss": 1.4381,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 1.9094098806381226,
+      "learning_rate": 2e-05,
+      "loss": 0.9001,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 1.8786391019821167,
+      "learning_rate": 2e-05,
+      "loss": 0.3896,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 4.317810535430908,
+      "learning_rate": 2e-05,
+      "loss": 1.2674,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 1.5854238271713257,
+      "learning_rate": 2e-05,
+      "loss": 1.2163,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 4.147825717926025,
+      "learning_rate": 2e-05,
+      "loss": 1.2768,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 1.2678698301315308,
+      "learning_rate": 2e-05,
+      "loss": 1.0032,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 2.2713613510131836,
+      "learning_rate": 2e-05,
+      "loss": 1.7791,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 4.81284236907959,
+      "learning_rate": 2e-05,
+      "loss": 1.5097,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 1.9140543937683105,
+      "learning_rate": 2e-05,
+      "loss": 0.7074,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 2.5636491775512695,
+      "learning_rate": 2e-05,
+      "loss": 0.8297,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.8870617151260376,
+      "learning_rate": 2e-05,
+      "loss": 1.2714,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 1.2541420459747314,
+      "learning_rate": 2e-05,
+      "loss": 0.8347,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 1.135138988494873,
+      "learning_rate": 2e-05,
+      "loss": 1.5559,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 0.9652976989746094,
+      "learning_rate": 2e-05,
+      "loss": 1.1556,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 1.2813061475753784,
+      "learning_rate": 2e-05,
+      "loss": 1.1862,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 1.8146921396255493,
+      "learning_rate": 2e-05,
+      "loss": 0.7589,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 2.7170140743255615,
+      "learning_rate": 2e-05,
+      "loss": 0.4767,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 1.401162028312683,
+      "learning_rate": 2e-05,
+      "loss": 0.7998,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 2.1656746864318848,
+      "learning_rate": 2e-05,
+      "loss": 0.5996,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 1.2385340929031372,
+      "learning_rate": 2e-05,
+      "loss": 0.6788,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 1.43242609500885,
+      "learning_rate": 2e-05,
+      "loss": 1.3276,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 3.322465658187866,
+      "learning_rate": 2e-05,
+      "loss": 1.2779,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.1705447435379028,
+      "learning_rate": 2e-05,
+      "loss": 0.961,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 3.3328497409820557,
+      "learning_rate": 2e-05,
+      "loss": 0.9414,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 4.852980136871338,
+      "learning_rate": 2e-05,
+      "loss": 1.3991,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 1.702784776687622,
+      "learning_rate": 2e-05,
+      "loss": 1.4331,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 1.9758677338619904e+16,
+      "train_loss": 1.00918516178721,
+      "train_runtime": 540.4351,
+      "train_samples_per_second": 0.718,
+      "train_steps_per_second": 0.179
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.9758677338619904e+16,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/5_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b7e672830c3390cebc35186306c826e13e090e04ddeafd88ffc20e8522684105
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/5_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e16446a963b6b92d9b08fd590dd1a4cdf91041e770bce96813b10b4ed7f585e9
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/5_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7bf8a3f7300eed94ebeadf63f4fd1bc5a1a9e9ba2ff72874542fc0d228e1751b
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/5_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7b92493e926b74fe46ad8c116cac0ce0f3b74ab7eab53772caa2f2d092cbe243
+size 794708086

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_Aorthensure_Brand_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixit97_T0125_decay099/5_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ba67ca5277a23ddc688297378f77308686101a548c5d8ded5230ede369657d6
+size 794706058