thkim0305
/

feddat_baselines

Model card Files Files and versions Community

thkim0305 committed on 15 days ago

Commit

ad2c972

verified ·

1 Parent(s): ae71b7c

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_trainer_state.json +378 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_trainer_state.json +378 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_trainer_state.json +378 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_trainer_state.json +378 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round2.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round20.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round5.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round7.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_trainer_state.json +378 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round10.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round12.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round15.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round17.pth +3 -0
client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round2.pth +3 -0

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:48b96c362a78aed601019971f00d6027bed72a085f801c5708c469b30b56e704
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ffa113a087044d45e9458ac9c0cc467fc5d4efc7adf19f478aa37bcbf0caaf2f
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e235f913c8f73283f7d46940c3d7efa2db6ba791511a72d27267d2ce1e562533
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:38483e00ef8f3a3423e44729285077bc1efbc42c6112450c0be7069f15fde5fc
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:424f036eb3473b0625a9b07031fccf681a4aa443d3d85c2dee0a124fc093d62e
+size 606588810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ffb30d25ae19dd6ca1f01a3f066d39b79c10c0ae3937a2722a15f790a8acc3da
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:16e8b9983821b40d2bccba0cb8aceacdc83d0f24b2a9d503b06bbd0e29d536c0
+size 606588810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ce653e9bb0f893fc5b3c40b624e4375f73e384bfee5a88fcfe1d8838f649f6a2
+size 606588810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/0_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 1.9091740846633911,
+      "learning_rate": 2e-05,
+      "loss": 1.2221,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 3.158586263656616,
+      "learning_rate": 2e-05,
+      "loss": 1.0034,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 0.46037667989730835,
+      "learning_rate": 2e-05,
+      "loss": 0.0698,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 4.0920891761779785,
+      "learning_rate": 2e-05,
+      "loss": 0.6852,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 0.10336245596408844,
+      "learning_rate": 2e-05,
+      "loss": 0.0561,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 2.5557003021240234,
+      "learning_rate": 2e-05,
+      "loss": 0.5174,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 1.9013806581497192,
+      "learning_rate": 2e-05,
+      "loss": 0.3884,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 0.5343479514122009,
+      "learning_rate": 2e-05,
+      "loss": 1.0633,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 1.3988330364227295,
+      "learning_rate": 2e-05,
+      "loss": 0.4331,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 0.7816677093505859,
+      "learning_rate": 2e-05,
+      "loss": 0.1989,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 1.7695223093032837,
+      "learning_rate": 2e-05,
+      "loss": 0.3803,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 2.075623035430908,
+      "learning_rate": 2e-05,
+      "loss": 0.6594,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 1.132662296295166,
+      "learning_rate": 2e-05,
+      "loss": 0.3909,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 1.9386407136917114,
+      "learning_rate": 2e-05,
+      "loss": 0.9071,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 1.1776388883590698,
+      "learning_rate": 2e-05,
+      "loss": 0.1846,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 2.3658692836761475,
+      "learning_rate": 2e-05,
+      "loss": 0.2869,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 1.8401161432266235,
+      "learning_rate": 2e-05,
+      "loss": 0.4268,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 6.151878356933594,
+      "learning_rate": 2e-05,
+      "loss": 0.8957,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 1.4062762260437012,
+      "learning_rate": 2e-05,
+      "loss": 0.1458,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 1.788042426109314,
+      "learning_rate": 2e-05,
+      "loss": 0.1687,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 3.1902451515197754,
+      "learning_rate": 2e-05,
+      "loss": 0.6988,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 4.431184768676758,
+      "learning_rate": 2e-05,
+      "loss": 0.4197,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 0.8136569857597351,
+      "learning_rate": 2e-05,
+      "loss": 0.0892,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 0.2823968529701233,
+      "learning_rate": 2e-05,
+      "loss": 0.3095,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 2.880483627319336,
+      "learning_rate": 2e-05,
+      "loss": 0.2591,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 5.056119918823242,
+      "learning_rate": 2e-05,
+      "loss": 0.8428,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 0.07207974791526794,
+      "learning_rate": 2e-05,
+      "loss": 0.0128,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 1.1768360137939453,
+      "learning_rate": 2e-05,
+      "loss": 0.1406,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 3.5694682598114014,
+      "learning_rate": 2e-05,
+      "loss": 0.5909,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 0.23515310883522034,
+      "learning_rate": 2e-05,
+      "loss": 0.325,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 0.7991934418678284,
+      "learning_rate": 2e-05,
+      "loss": 0.2351,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 0.023807095363736153,
+      "learning_rate": 2e-05,
+      "loss": 0.0073,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.7518260478973389,
+      "learning_rate": 2e-05,
+      "loss": 0.0999,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 2.0427582263946533,
+      "learning_rate": 2e-05,
+      "loss": 0.176,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 2.179276466369629,
+      "learning_rate": 2e-05,
+      "loss": 0.139,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 0.9427316188812256,
+      "learning_rate": 2e-05,
+      "loss": 0.0631,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 4.460165500640869,
+      "learning_rate": 2e-05,
+      "loss": 0.643,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 3.386460542678833,
+      "learning_rate": 2e-05,
+      "loss": 0.632,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 2.405658483505249,
+      "learning_rate": 2e-05,
+      "loss": 0.2599,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 4.817083358764648,
+      "learning_rate": 2e-05,
+      "loss": 0.834,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 5.088555812835693,
+      "learning_rate": 2e-05,
+      "loss": 0.4744,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 0.05794494226574898,
+      "learning_rate": 2e-05,
+      "loss": 0.6645,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 0.06005644053220749,
+      "learning_rate": 2e-05,
+      "loss": 0.3662,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 0.3105262219905853,
+      "learning_rate": 2e-05,
+      "loss": 0.374,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.043837547302246,
+      "learning_rate": 2e-05,
+      "loss": 0.2253,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 3.3620216846466064,
+      "learning_rate": 2e-05,
+      "loss": 1.0345,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 0.1824847310781479,
+      "learning_rate": 2e-05,
+      "loss": 0.1119,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 0.09524671733379364,
+      "learning_rate": 2e-05,
+      "loss": 0.1297,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 2866814929338368.0,
+      "train_loss": 0.4281441053164374,
+      "train_runtime": 417.1615,
+      "train_samples_per_second": 0.93,
+      "train_steps_per_second": 0.233
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2866814929338368.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cf5b1b07a962367241a2790e3b47841d377d0a5859a24e0bd572bbb2e9a5dad4
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bcaa8b85b90be439bd3bf93fa1b50be8a1a524c0e2551727713f22186123d1f0
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ad9f7eab0ddc66d1c63eaf3d04cce2d870464e591c10a0a0cd59c04943163477
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a74dcff81385ce7d01fd715bfe9cd9115994a33b4f2116a5a42c2e3b9691c0b7
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0a7215205419c641a43021b684e80c528adf84563ea906d6c2e68c6843e62d71
+size 606588810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ebdc8a3d437a1ef847589521c74c09d29530143a00ceb9bef8a458f47d6c12c
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:45bb1653c987aae96fe205a4517a078a0ac54e4b545c86cea875b9dabae7b576
+size 606588810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b0793485bc61d7c2e0c75e7ca0f596a805ee2682aaf4bbb6109607da5e979984
+size 606588810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/1_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 0.00990249216556549,
+      "learning_rate": 2e-05,
+      "loss": 0.0343,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 0.24752184748649597,
+      "learning_rate": 2e-05,
+      "loss": 0.0285,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 0.11016274988651276,
+      "learning_rate": 2e-05,
+      "loss": 0.1125,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 0.015819694846868515,
+      "learning_rate": 2e-05,
+      "loss": 0.0193,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 0.0025153865572065115,
+      "learning_rate": 2e-05,
+      "loss": 0.0022,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 0.018475506454706192,
+      "learning_rate": 2e-05,
+      "loss": 0.002,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 5.484030723571777,
+      "learning_rate": 2e-05,
+      "loss": 0.5337,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 0.01962272636592388,
+      "learning_rate": 2e-05,
+      "loss": 0.1908,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 0.02493014559149742,
+      "learning_rate": 2e-05,
+      "loss": 0.0014,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 0.09554272145032883,
+      "learning_rate": 2e-05,
+      "loss": 0.71,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 0.007511932868510485,
+      "learning_rate": 2e-05,
+      "loss": 0.0032,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 0.6068776845932007,
+      "learning_rate": 2e-05,
+      "loss": 0.0584,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 0.019293755292892456,
+      "learning_rate": 2e-05,
+      "loss": 0.0174,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 0.006605098024010658,
+      "learning_rate": 2e-05,
+      "loss": 0.0035,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 0.38141685724258423,
+      "learning_rate": 2e-05,
+      "loss": 0.4474,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 0.03302409499883652,
+      "learning_rate": 2e-05,
+      "loss": 0.0047,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 6.83150577545166,
+      "learning_rate": 2e-05,
+      "loss": 0.324,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 0.10726940631866455,
+      "learning_rate": 2e-05,
+      "loss": 0.0058,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 0.44090333580970764,
+      "learning_rate": 2e-05,
+      "loss": 0.0431,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 0.19889701902866364,
+      "learning_rate": 2e-05,
+      "loss": 0.7427,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 1.034143090248108,
+      "learning_rate": 2e-05,
+      "loss": 0.0863,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 0.22705499827861786,
+      "learning_rate": 2e-05,
+      "loss": 0.357,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 0.7536527514457703,
+      "learning_rate": 2e-05,
+      "loss": 0.1098,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 0.056017301976680756,
+      "learning_rate": 2e-05,
+      "loss": 0.0064,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 0.006744038313627243,
+      "learning_rate": 2e-05,
+      "loss": 0.0006,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.9016902446746826,
+      "learning_rate": 2e-05,
+      "loss": 0.1382,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 0.11894352734088898,
+      "learning_rate": 2e-05,
+      "loss": 0.0104,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 0.39221423864364624,
+      "learning_rate": 2e-05,
+      "loss": 0.032,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 0.09858262538909912,
+      "learning_rate": 2e-05,
+      "loss": 0.049,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 0.005559508688747883,
+      "learning_rate": 2e-05,
+      "loss": 0.1089,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 1.6431413888931274,
+      "learning_rate": 2e-05,
+      "loss": 0.1877,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 0.004421388264745474,
+      "learning_rate": 2e-05,
+      "loss": 0.0127,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 0.002455125330016017,
+      "learning_rate": 2e-05,
+      "loss": 0.0007,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 2.288174629211426,
+      "learning_rate": 2e-05,
+      "loss": 0.593,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 0.5138911604881287,
+      "learning_rate": 2e-05,
+      "loss": 0.7277,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 0.2915093004703522,
+      "learning_rate": 2e-05,
+      "loss": 0.0794,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 0.012635215185582638,
+      "learning_rate": 2e-05,
+      "loss": 0.0644,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 0.5793916583061218,
+      "learning_rate": 2e-05,
+      "loss": 0.2267,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 2.189505100250244,
+      "learning_rate": 2e-05,
+      "loss": 0.6962,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 0.004708629101514816,
+      "learning_rate": 2e-05,
+      "loss": 0.0011,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 0.007471214048564434,
+      "learning_rate": 2e-05,
+      "loss": 0.0018,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 0.014228110201656818,
+      "learning_rate": 2e-05,
+      "loss": 0.0012,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 0.01875714771449566,
+      "learning_rate": 2e-05,
+      "loss": 0.0231,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 0.010902749374508858,
+      "learning_rate": 2e-05,
+      "loss": 0.0009,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 0.6271221041679382,
+      "learning_rate": 2e-05,
+      "loss": 0.0795,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 1.3592969179153442,
+      "learning_rate": 2e-05,
+      "loss": 0.106,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 0.4871022403240204,
+      "learning_rate": 2e-05,
+      "loss": 0.0463,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 0.0031653214246034622,
+      "learning_rate": 2e-05,
+      "loss": 0.0005,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 2888162800041984.0,
+      "train_loss": 0.1450096553133935,
+      "train_runtime": 415.6208,
+      "train_samples_per_second": 0.934,
+      "train_steps_per_second": 0.233
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2888162800041984.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:117c5018b1144fbe01a8a0b3e5b5f28be996c6cd1ced5dd5ebae894b7b20764f
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:46882a8e42fbde28008f5736f9a52d0589cd87b83849c4fd9c2719a7737d7caf
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2f0198020029a280ceab5c502fcc1630094eccd304142cbe991b7716d5e76909
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1bb825c00a750f5b116888f6e06e8a0f1899b7080a2228e4f85b242dabe7b805
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0285e24aa92adaeb50c6942d77c9baad30255eac5a6072995e1689b161fae85e
+size 978818810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc759a1821037662e3bc31ea98126c55b6efe62a25eff727fe0d32a32c1ecc96
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a25b0ef58db4a2b67f05037fa400effaa9f3be59bae025b818883e74667a446d
+size 978818810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f1e176a28f5e8d10fdc2c78c18da653d7d6816ea6950bedf534d204526cd4a1e
+size 978818810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/2_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 1.143397331237793,
+      "learning_rate": 2e-05,
+      "loss": 0.5443,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 1.2255475521087646,
+      "learning_rate": 2e-05,
+      "loss": 0.9587,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 1.8370898962020874,
+      "learning_rate": 2e-05,
+      "loss": 1.182,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 0.24408237636089325,
+      "learning_rate": 2e-05,
+      "loss": 0.2572,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 0.2356729656457901,
+      "learning_rate": 2e-05,
+      "loss": 0.3236,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 0.12980803847312927,
+      "learning_rate": 2e-05,
+      "loss": 0.359,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 0.34007528424263,
+      "learning_rate": 2e-05,
+      "loss": 0.1969,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 0.8254105448722839,
+      "learning_rate": 2e-05,
+      "loss": 0.7104,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 0.665677011013031,
+      "learning_rate": 2e-05,
+      "loss": 0.2014,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 0.9692237973213196,
+      "learning_rate": 2e-05,
+      "loss": 0.6621,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 0.43489089608192444,
+      "learning_rate": 2e-05,
+      "loss": 0.6234,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 2.537994861602783,
+      "learning_rate": 2e-05,
+      "loss": 0.9041,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 1.01339590549469,
+      "learning_rate": 2e-05,
+      "loss": 0.3681,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 0.37009069323539734,
+      "learning_rate": 2e-05,
+      "loss": 0.4056,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 0.044184956699609756,
+      "learning_rate": 2e-05,
+      "loss": 0.1972,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 1.3115153312683105,
+      "learning_rate": 2e-05,
+      "loss": 0.3582,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 0.7034705281257629,
+      "learning_rate": 2e-05,
+      "loss": 0.2604,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 0.5956244468688965,
+      "learning_rate": 2e-05,
+      "loss": 0.9219,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 1.4682765007019043,
+      "learning_rate": 2e-05,
+      "loss": 0.7098,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 2.516416311264038,
+      "learning_rate": 2e-05,
+      "loss": 1.1477,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 2.4257423877716064,
+      "learning_rate": 2e-05,
+      "loss": 1.0164,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 0.3192073404788971,
+      "learning_rate": 2e-05,
+      "loss": 0.3794,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 2.1369898319244385,
+      "learning_rate": 2e-05,
+      "loss": 0.5324,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 0.22400034964084625,
+      "learning_rate": 2e-05,
+      "loss": 1.7004,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 1.9823366403579712,
+      "learning_rate": 2e-05,
+      "loss": 0.9041,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 1.1424986124038696,
+      "learning_rate": 2e-05,
+      "loss": 0.2122,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 1.1508723497390747,
+      "learning_rate": 2e-05,
+      "loss": 0.2551,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 1.047311544418335,
+      "learning_rate": 2e-05,
+      "loss": 0.3889,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 0.28297775983810425,
+      "learning_rate": 2e-05,
+      "loss": 1.2793,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 0.2760946452617645,
+      "learning_rate": 2e-05,
+      "loss": 0.4845,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 3.4843385219573975,
+      "learning_rate": 2e-05,
+      "loss": 0.725,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 0.1845403015613556,
+      "learning_rate": 2e-05,
+      "loss": 0.2025,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.3841183185577393,
+      "learning_rate": 2e-05,
+      "loss": 0.6707,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 0.6219921708106995,
+      "learning_rate": 2e-05,
+      "loss": 0.3708,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 1.2532652616500854,
+      "learning_rate": 2e-05,
+      "loss": 0.6669,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 1.8839783668518066,
+      "learning_rate": 2e-05,
+      "loss": 0.4824,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 1.2260621786117554,
+      "learning_rate": 2e-05,
+      "loss": 0.8137,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 1.1083022356033325,
+      "learning_rate": 2e-05,
+      "loss": 0.9023,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 0.7099221348762512,
+      "learning_rate": 2e-05,
+      "loss": 0.3594,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 1.9942265748977661,
+      "learning_rate": 2e-05,
+      "loss": 0.4561,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 3.795022964477539,
+      "learning_rate": 2e-05,
+      "loss": 1.0328,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 0.9263180494308472,
+      "learning_rate": 2e-05,
+      "loss": 0.6605,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 1.9401521682739258,
+      "learning_rate": 2e-05,
+      "loss": 1.3343,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 1.5276206731796265,
+      "learning_rate": 2e-05,
+      "loss": 0.6242,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 2.310457229614258,
+      "learning_rate": 2e-05,
+      "loss": 0.854,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 1.974561333656311,
+      "learning_rate": 2e-05,
+      "loss": 0.8861,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 2.190361499786377,
+      "learning_rate": 2e-05,
+      "loss": 1.0974,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 1.6531275510787964,
+      "learning_rate": 2e-05,
+      "loss": 0.7672,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 5270224836231168.0,
+      "train_loss": 0.6526356726577601,
+      "train_runtime": 527.3005,
+      "train_samples_per_second": 0.736,
+      "train_steps_per_second": 0.184
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5270224836231168.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c7f38637be273d636ae4bf42e45ac88bd68d613b9db39c4011385158e57cfc82
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:15d4a001460770d6133cfe80cb6b1118d692eac140ab64b0b5dbe135a59035d9
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:79870074898564ea9937eef2cb84f972f35f15ef60ff83d4d5e9221c910c1649
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5072ca902f0faeb5daf4f968b0859f0fd9c37293147851a3bf30d319ee022741
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:89b72835c7dcc77117ee65d0b8a56db8bcef201336153949791586c6cf628dbb
+size 606588810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5da7ae67d07bffcb1ca91e721216e9bb57862eaf28b3fd5621c55e61375a5e0
+size 606590838

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e0ddcc5243cf0cbb1c7689c4e85a09a645f7f24a043fbffea59babe8a120ff12
+size 606588810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b38eb64e42265ae8776bbe390aeea5b07ff1fa63c9ecc1aeae053eae53259c4c
+size 606588810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/3_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 0.8621726036071777,
+      "learning_rate": 2e-05,
+      "loss": 0.784,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 0.5997222661972046,
+      "learning_rate": 2e-05,
+      "loss": 0.6114,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 3.3685293197631836,
+      "learning_rate": 2e-05,
+      "loss": 1.8636,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 1.9444336891174316,
+      "learning_rate": 2e-05,
+      "loss": 0.7377,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 3.8980281352996826,
+      "learning_rate": 2e-05,
+      "loss": 2.0884,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 3.079683542251587,
+      "learning_rate": 2e-05,
+      "loss": 1.1494,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 3.4189367294311523,
+      "learning_rate": 2e-05,
+      "loss": 0.9661,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 1.382783055305481,
+      "learning_rate": 2e-05,
+      "loss": 1.0355,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 5.828529357910156,
+      "learning_rate": 2e-05,
+      "loss": 1.5671,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 2.367591142654419,
+      "learning_rate": 2e-05,
+      "loss": 0.8609,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 1.9332449436187744,
+      "learning_rate": 2e-05,
+      "loss": 0.9275,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 1.3459978103637695,
+      "learning_rate": 2e-05,
+      "loss": 0.8898,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 1.5858796834945679,
+      "learning_rate": 2e-05,
+      "loss": 0.3414,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 1.9047499895095825,
+      "learning_rate": 2e-05,
+      "loss": 3.4836,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 3.298762321472168,
+      "learning_rate": 2e-05,
+      "loss": 1.4902,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 1.7490943670272827,
+      "learning_rate": 2e-05,
+      "loss": 0.759,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 0.9601039290428162,
+      "learning_rate": 2e-05,
+      "loss": 0.5406,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 1.696427345275879,
+      "learning_rate": 2e-05,
+      "loss": 0.5591,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 4.497976779937744,
+      "learning_rate": 2e-05,
+      "loss": 1.48,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 1.4220675230026245,
+      "learning_rate": 2e-05,
+      "loss": 1.9096,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 0.5704763531684875,
+      "learning_rate": 2e-05,
+      "loss": 1.0739,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 3.798910140991211,
+      "learning_rate": 2e-05,
+      "loss": 0.8083,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 0.6530976891517639,
+      "learning_rate": 2e-05,
+      "loss": 0.3467,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 2.5659232139587402,
+      "learning_rate": 2e-05,
+      "loss": 1.2449,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 1.7021549940109253,
+      "learning_rate": 2e-05,
+      "loss": 0.991,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 2.904054880142212,
+      "learning_rate": 2e-05,
+      "loss": 0.9027,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 0.40748944878578186,
+      "learning_rate": 2e-05,
+      "loss": 0.3164,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 1.6402074098587036,
+      "learning_rate": 2e-05,
+      "loss": 0.4264,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 3.439208984375,
+      "learning_rate": 2e-05,
+      "loss": 2.0284,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 2.8119544982910156,
+      "learning_rate": 2e-05,
+      "loss": 1.5881,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 1.5405571460723877,
+      "learning_rate": 2e-05,
+      "loss": 0.9022,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 4.333232402801514,
+      "learning_rate": 2e-05,
+      "loss": 1.2758,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.6036462783813477,
+      "learning_rate": 2e-05,
+      "loss": 0.7932,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 0.596666157245636,
+      "learning_rate": 2e-05,
+      "loss": 0.7625,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 2.8570806980133057,
+      "learning_rate": 2e-05,
+      "loss": 1.7929,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 2.321223020553589,
+      "learning_rate": 2e-05,
+      "loss": 1.2169,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 4.413544178009033,
+      "learning_rate": 2e-05,
+      "loss": 1.3534,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 1.6249202489852905,
+      "learning_rate": 2e-05,
+      "loss": 0.6887,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 3.379758834838867,
+      "learning_rate": 2e-05,
+      "loss": 2.4109,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 1.7662537097930908,
+      "learning_rate": 2e-05,
+      "loss": 0.8549,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 2.5819923877716064,
+      "learning_rate": 2e-05,
+      "loss": 0.6496,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 2.989832878112793,
+      "learning_rate": 2e-05,
+      "loss": 1.1886,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 1.8118072748184204,
+      "learning_rate": 2e-05,
+      "loss": 1.149,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 1.4145994186401367,
+      "learning_rate": 2e-05,
+      "loss": 0.8608,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 1.3375070095062256,
+      "learning_rate": 2e-05,
+      "loss": 0.9514,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 5.697417259216309,
+      "learning_rate": 2e-05,
+      "loss": 1.387,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 3.187375545501709,
+      "learning_rate": 2e-05,
+      "loss": 0.7515,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 4.534388542175293,
+      "learning_rate": 2e-05,
+      "loss": 1.2819,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 2928335550152704.0,
+      "train_loss": 1.1240325613120168,
+      "train_runtime": 413.8678,
+      "train_samples_per_second": 0.937,
+      "train_steps_per_second": 0.234
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2928335550152704.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2ede28fdd2cede10ccf106490cbc2da115e8236fc942f0fc8573f1f3127100ea
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a41cc09a59ab65452ba45d80dcde938e20a6d1c74313d8d819237825ecc5c129
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0231971052f8cadaf5af44030be3e4a0d1119e6cd551875513b30a19e2ba16ae
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d03f1b6ddfea3320be70db4eec5aaea28b3cb748e1b15df3c1c0241f193f5de4
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3c540936a1e1cfa6e1e8ac3eab7ab2ad6ef4730a3d071d311b3d2e6888cfda4f
+size 978818810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b455529478842b55f61e1722446272f3df530a1f55a1a44c5e36df6879739386
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c4c4f909649374c7493c39988abbb17b7a6ec2b86497510258894a8ca3398f0e
+size 978818810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a6fd9c6fe317a9688edc469a71b86ddcb698e23fbe087692d2d4d5f8bda91a5
+size 978818810

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/4_trainer_state.json ADDED Viewed

	@@ -0,0 +1,378 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 97,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020618556701030927,
+      "grad_norm": 1.9402724504470825,
+      "learning_rate": 2e-05,
+      "loss": 0.5838,
+      "step": 2
+    },
+    {
+      "epoch": 0.041237113402061855,
+      "grad_norm": 2.4250800609588623,
+      "learning_rate": 2e-05,
+      "loss": 1.2304,
+      "step": 4
+    },
+    {
+      "epoch": 0.061855670103092786,
+      "grad_norm": 1.5540610551834106,
+      "learning_rate": 2e-05,
+      "loss": 0.3604,
+      "step": 6
+    },
+    {
+      "epoch": 0.08247422680412371,
+      "grad_norm": 0.7538492679595947,
+      "learning_rate": 2e-05,
+      "loss": 0.6599,
+      "step": 8
+    },
+    {
+      "epoch": 0.10309278350515463,
+      "grad_norm": 0.9257169365882874,
+      "learning_rate": 2e-05,
+      "loss": 0.6932,
+      "step": 10
+    },
+    {
+      "epoch": 0.12371134020618557,
+      "grad_norm": 0.5299786329269409,
+      "learning_rate": 2e-05,
+      "loss": 0.5977,
+      "step": 12
+    },
+    {
+      "epoch": 0.14432989690721648,
+      "grad_norm": 1.8260445594787598,
+      "learning_rate": 2e-05,
+      "loss": 0.7848,
+      "step": 14
+    },
+    {
+      "epoch": 0.16494845360824742,
+      "grad_norm": 1.0459568500518799,
+      "learning_rate": 2e-05,
+      "loss": 0.423,
+      "step": 16
+    },
+    {
+      "epoch": 0.18556701030927836,
+      "grad_norm": 0.7857280373573303,
+      "learning_rate": 2e-05,
+      "loss": 0.5644,
+      "step": 18
+    },
+    {
+      "epoch": 0.20618556701030927,
+      "grad_norm": 1.1462950706481934,
+      "learning_rate": 2e-05,
+      "loss": 1.446,
+      "step": 20
+    },
+    {
+      "epoch": 0.2268041237113402,
+      "grad_norm": 2.205085039138794,
+      "learning_rate": 2e-05,
+      "loss": 1.4026,
+      "step": 22
+    },
+    {
+      "epoch": 0.24742268041237114,
+      "grad_norm": 0.7716929316520691,
+      "learning_rate": 2e-05,
+      "loss": 0.312,
+      "step": 24
+    },
+    {
+      "epoch": 0.26804123711340205,
+      "grad_norm": 1.7518846988677979,
+      "learning_rate": 2e-05,
+      "loss": 0.9049,
+      "step": 26
+    },
+    {
+      "epoch": 0.28865979381443296,
+      "grad_norm": 0.8513244390487671,
+      "learning_rate": 2e-05,
+      "loss": 0.7163,
+      "step": 28
+    },
+    {
+      "epoch": 0.30927835051546393,
+      "grad_norm": 1.708772897720337,
+      "learning_rate": 2e-05,
+      "loss": 0.848,
+      "step": 30
+    },
+    {
+      "epoch": 0.32989690721649484,
+      "grad_norm": 1.2805875539779663,
+      "learning_rate": 2e-05,
+      "loss": 0.8176,
+      "step": 32
+    },
+    {
+      "epoch": 0.35051546391752575,
+      "grad_norm": 0.7299635410308838,
+      "learning_rate": 2e-05,
+      "loss": 0.3226,
+      "step": 34
+    },
+    {
+      "epoch": 0.3711340206185567,
+      "grad_norm": 0.9453825354576111,
+      "learning_rate": 2e-05,
+      "loss": 0.4467,
+      "step": 36
+    },
+    {
+      "epoch": 0.3917525773195876,
+      "grad_norm": 0.4364389181137085,
+      "learning_rate": 2e-05,
+      "loss": 0.4499,
+      "step": 38
+    },
+    {
+      "epoch": 0.41237113402061853,
+      "grad_norm": 0.4604692757129669,
+      "learning_rate": 2e-05,
+      "loss": 0.7041,
+      "step": 40
+    },
+    {
+      "epoch": 0.4329896907216495,
+      "grad_norm": 0.42262014746665955,
+      "learning_rate": 2e-05,
+      "loss": 0.5528,
+      "step": 42
+    },
+    {
+      "epoch": 0.4536082474226804,
+      "grad_norm": 0.2717072069644928,
+      "learning_rate": 2e-05,
+      "loss": 0.2196,
+      "step": 44
+    },
+    {
+      "epoch": 0.4742268041237113,
+      "grad_norm": 1.1014915704727173,
+      "learning_rate": 2e-05,
+      "loss": 0.4718,
+      "step": 46
+    },
+    {
+      "epoch": 0.4948453608247423,
+      "grad_norm": 0.48280566930770874,
+      "learning_rate": 2e-05,
+      "loss": 0.1461,
+      "step": 48
+    },
+    {
+      "epoch": 0.5154639175257731,
+      "grad_norm": 1.16571843624115,
+      "learning_rate": 2e-05,
+      "loss": 0.7124,
+      "step": 50
+    },
+    {
+      "epoch": 0.5360824742268041,
+      "grad_norm": 0.14320193231105804,
+      "learning_rate": 2e-05,
+      "loss": 0.7823,
+      "step": 52
+    },
+    {
+      "epoch": 0.5567010309278351,
+      "grad_norm": 1.8387656211853027,
+      "learning_rate": 2e-05,
+      "loss": 0.3319,
+      "step": 54
+    },
+    {
+      "epoch": 0.5773195876288659,
+      "grad_norm": 0.9942914247512817,
+      "learning_rate": 2e-05,
+      "loss": 0.4071,
+      "step": 56
+    },
+    {
+      "epoch": 0.5979381443298969,
+      "grad_norm": 1.0944980382919312,
+      "learning_rate": 2e-05,
+      "loss": 0.617,
+      "step": 58
+    },
+    {
+      "epoch": 0.6185567010309279,
+      "grad_norm": 1.0097112655639648,
+      "learning_rate": 2e-05,
+      "loss": 0.2987,
+      "step": 60
+    },
+    {
+      "epoch": 0.6391752577319587,
+      "grad_norm": 1.1440106630325317,
+      "learning_rate": 2e-05,
+      "loss": 0.7794,
+      "step": 62
+    },
+    {
+      "epoch": 0.6597938144329897,
+      "grad_norm": 0.9374860525131226,
+      "learning_rate": 2e-05,
+      "loss": 0.737,
+      "step": 64
+    },
+    {
+      "epoch": 0.6804123711340206,
+      "grad_norm": 1.6988123655319214,
+      "learning_rate": 2e-05,
+      "loss": 0.7242,
+      "step": 66
+    },
+    {
+      "epoch": 0.7010309278350515,
+      "grad_norm": 1.1150574684143066,
+      "learning_rate": 2e-05,
+      "loss": 0.2495,
+      "step": 68
+    },
+    {
+      "epoch": 0.7216494845360825,
+      "grad_norm": 1.318420171737671,
+      "learning_rate": 2e-05,
+      "loss": 1.0947,
+      "step": 70
+    },
+    {
+      "epoch": 0.7422680412371134,
+      "grad_norm": 0.7494012713432312,
+      "learning_rate": 2e-05,
+      "loss": 0.4376,
+      "step": 72
+    },
+    {
+      "epoch": 0.7628865979381443,
+      "grad_norm": 0.5291847586631775,
+      "learning_rate": 2e-05,
+      "loss": 1.1724,
+      "step": 74
+    },
+    {
+      "epoch": 0.7835051546391752,
+      "grad_norm": 0.8617143630981445,
+      "learning_rate": 2e-05,
+      "loss": 0.552,
+      "step": 76
+    },
+    {
+      "epoch": 0.8041237113402062,
+      "grad_norm": 0.4218270480632782,
+      "learning_rate": 2e-05,
+      "loss": 0.1633,
+      "step": 78
+    },
+    {
+      "epoch": 0.8247422680412371,
+      "grad_norm": 1.3452715873718262,
+      "learning_rate": 2e-05,
+      "loss": 0.8789,
+      "step": 80
+    },
+    {
+      "epoch": 0.845360824742268,
+      "grad_norm": 1.967393398284912,
+      "learning_rate": 2e-05,
+      "loss": 0.4333,
+      "step": 82
+    },
+    {
+      "epoch": 0.865979381443299,
+      "grad_norm": 1.4400347471237183,
+      "learning_rate": 2e-05,
+      "loss": 0.9299,
+      "step": 84
+    },
+    {
+      "epoch": 0.8865979381443299,
+      "grad_norm": 0.30658483505249023,
+      "learning_rate": 2e-05,
+      "loss": 1.0109,
+      "step": 86
+    },
+    {
+      "epoch": 0.9072164948453608,
+      "grad_norm": 0.16921880841255188,
+      "learning_rate": 2e-05,
+      "loss": 0.2108,
+      "step": 88
+    },
+    {
+      "epoch": 0.9278350515463918,
+      "grad_norm": 0.4752196669578552,
+      "learning_rate": 2e-05,
+      "loss": 0.4654,
+      "step": 90
+    },
+    {
+      "epoch": 0.9484536082474226,
+      "grad_norm": 2.074636936187744,
+      "learning_rate": 2e-05,
+      "loss": 0.8971,
+      "step": 92
+    },
+    {
+      "epoch": 0.9690721649484536,
+      "grad_norm": 1.7106537818908691,
+      "learning_rate": 2e-05,
+      "loss": 1.0818,
+      "step": 94
+    },
+    {
+      "epoch": 0.9896907216494846,
+      "grad_norm": 0.6808597445487976,
+      "learning_rate": 2e-05,
+      "loss": 0.6208,
+      "step": 96
+    },
+    {
+      "epoch": 1.0,
+      "step": 97,
+      "total_flos": 6081635527163904.0,
+      "train_loss": 0.6636996711652303,
+      "train_runtime": 526.4308,
+      "train_samples_per_second": 0.737,
+      "train_steps_per_second": 0.184
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 97,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 6081635527163904.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1e1ca40ac7a86695907ed50ab92b3322e850ce3c6b20d88160df8fea655233b1
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dd30b73f84f40cfc88d63e9fc388b5f992dd60422583b803e4554908460b5e99
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7daa10dfe387d89f37538ddaf13b254637fcf67fec290c83210cf4e18f936ec8
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:84e1d84adca8d5f3beff7b2330eaacb77d10fc1382a4a63da515bd4d30c4402e
+size 978821398

client_states_feddualMultipqfullfreeze_homoAgg_moe_T05_freq10_bs4_saveoptim_lr2e-5_sc1316_4tasks_5rounds_fixitr97_T0125_decay099/5_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ace73a466487a0e201e84be96ae47e72b535f683a7e17c5ddf448191f327469e
+size 978818810