thkim0305
/

feddat_baselines

Model card Files Files and versions Community

thkim0305 commited on 12 days ago

Commit

89af0dc

verified ·

1 Parent(s): 653cc5e

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round10.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round12.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round15.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round17.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round2.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round20.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round5.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round7.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_trainer_state.json +217 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round10.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round12.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round15.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round17.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round2.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round20.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round5.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round7.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_trainer_state.json +217 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round10.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round12.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round15.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round17.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round2.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round20.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round5.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round7.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_trainer_state.json +217 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round10.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round12.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round15.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round17.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round2.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round20.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round5.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round7.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_trainer_state.json +217 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round10.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round12.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round15.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round17.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round2.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round20.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round5.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round7.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_trainer_state.json +217 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/5_client_model_round10.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/5_client_model_round12.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/5_client_model_round15.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/5_client_model_round17.pth +3 -0
client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/5_client_model_round2.pth +3 -0

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7187654c3b2b4a311de981775f06ff9aaec06521ba6f2d55fe0cca74a083b1b8
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8cb851df31a265321fab4c368129ff8bdfbcfb7e63e72bb40c7b878badc6ba4d
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0571775d806cb5694d12bbbb59deb5715b149b625563380d3b53f0b2c4a0e406
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:11bb9051b5c160af184c1a503e926ded05fb4faa720a3b2ac735df443714d0b7
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:242baa74ecd2e89b8949e441e1eb503db5855524efbfd97bc9c9e937ad7f281a
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:28f97f86483164a291e4dfb7b1b7323fe209e49380184a1ab9edb5093a58c2c2
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:50eb45b2ed832ed4563d161d284a70b3fd463cd5d377c0fe903be291076a7133
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:928ec6d986859b197e14f18c3d237108b5a867442d77ef59f22e5e74a1481437
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/0_trainer_state.json ADDED Viewed

	@@ -0,0 +1,217 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 50,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.08,
+      "grad_norm": 17.835098266601562,
+      "learning_rate": 2e-05,
+      "loss": 1.2723,
+      "step": 2
+    },
+    {
+      "epoch": 0.16,
+      "grad_norm": 5.935124397277832,
+      "learning_rate": 2e-05,
+      "loss": 0.3235,
+      "step": 4
+    },
+    {
+      "epoch": 0.24,
+      "grad_norm": 11.949447631835938,
+      "learning_rate": 2e-05,
+      "loss": 0.6892,
+      "step": 6
+    },
+    {
+      "epoch": 0.32,
+      "grad_norm": 4.54430627822876,
+      "learning_rate": 2e-05,
+      "loss": 0.5368,
+      "step": 8
+    },
+    {
+      "epoch": 0.4,
+      "grad_norm": 16.603609085083008,
+      "learning_rate": 2e-05,
+      "loss": 0.9215,
+      "step": 10
+    },
+    {
+      "epoch": 0.48,
+      "grad_norm": 6.623965263366699,
+      "learning_rate": 2e-05,
+      "loss": 0.798,
+      "step": 12
+    },
+    {
+      "epoch": 0.56,
+      "grad_norm": 5.242029666900635,
+      "learning_rate": 2e-05,
+      "loss": 0.3287,
+      "step": 14
+    },
+    {
+      "epoch": 0.64,
+      "grad_norm": 3.1021950244903564,
+      "learning_rate": 2e-05,
+      "loss": 0.1253,
+      "step": 16
+    },
+    {
+      "epoch": 0.72,
+      "grad_norm": 4.434370517730713,
+      "learning_rate": 2e-05,
+      "loss": 0.5437,
+      "step": 18
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 1.40633225440979,
+      "learning_rate": 2e-05,
+      "loss": 0.4146,
+      "step": 20
+    },
+    {
+      "epoch": 0.88,
+      "grad_norm": 5.0599894523620605,
+      "learning_rate": 2e-05,
+      "loss": 0.4193,
+      "step": 22
+    },
+    {
+      "epoch": 0.96,
+      "grad_norm": 3.8830926418304443,
+      "learning_rate": 2e-05,
+      "loss": 0.4138,
+      "step": 24
+    },
+    {
+      "epoch": 1.04,
+      "grad_norm": 4.712460517883301,
+      "learning_rate": 2e-05,
+      "loss": 0.3751,
+      "step": 26
+    },
+    {
+      "epoch": 1.12,
+      "grad_norm": 3.2360763549804688,
+      "learning_rate": 2e-05,
+      "loss": 0.1469,
+      "step": 28
+    },
+    {
+      "epoch": 1.2,
+      "grad_norm": 2.5379559993743896,
+      "learning_rate": 2e-05,
+      "loss": 0.4358,
+      "step": 30
+    },
+    {
+      "epoch": 1.28,
+      "grad_norm": 8.039641380310059,
+      "learning_rate": 2e-05,
+      "loss": 0.3871,
+      "step": 32
+    },
+    {
+      "epoch": 1.36,
+      "grad_norm": 0.877090334892273,
+      "learning_rate": 2e-05,
+      "loss": 0.1099,
+      "step": 34
+    },
+    {
+      "epoch": 1.44,
+      "grad_norm": 2.0384771823883057,
+      "learning_rate": 2e-05,
+      "loss": 0.2192,
+      "step": 36
+    },
+    {
+      "epoch": 1.52,
+      "grad_norm": 11.140633583068848,
+      "learning_rate": 2e-05,
+      "loss": 0.8123,
+      "step": 38
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 6.476287364959717,
+      "learning_rate": 2e-05,
+      "loss": 0.3829,
+      "step": 40
+    },
+    {
+      "epoch": 1.68,
+      "grad_norm": 3.3182876110076904,
+      "learning_rate": 2e-05,
+      "loss": 0.6873,
+      "step": 42
+    },
+    {
+      "epoch": 1.76,
+      "grad_norm": 2.2434990406036377,
+      "learning_rate": 2e-05,
+      "loss": 0.2576,
+      "step": 44
+    },
+    {
+      "epoch": 1.84,
+      "grad_norm": 5.116442680358887,
+      "learning_rate": 2e-05,
+      "loss": 0.2816,
+      "step": 46
+    },
+    {
+      "epoch": 1.92,
+      "grad_norm": 0.7951710820198059,
+      "learning_rate": 2e-05,
+      "loss": 0.3147,
+      "step": 48
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 0.8207076191902161,
+      "learning_rate": 2e-05,
+      "loss": 0.3024,
+      "step": 50
+    },
+    {
+      "epoch": 2.0,
+      "step": 50,
+      "total_flos": 5262842336903168.0,
+      "train_loss": 0.4599846029281616,
+      "train_runtime": 188.7148,
+      "train_samples_per_second": 1.06,
+      "train_steps_per_second": 0.265
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 50,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5262842336903168.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a99edaae05995e51b6df8fbbe76020d1d486ec42021f513ad5178460e3caf352
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8ea5209a560b65ca173a1db13c7882797c188b5f65cd986de2c86f36a11b818b
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6b6bd292c09e6962198a402a9c211d7fac264c0dbd9a6790e5fd52fed5cda0ea
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:15284a64a6f8f75bd6b4569811f3589ea26f5f4201e28360866fdc2e53febe13
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5711178c5463f7ab46aa53c7536f6313fea20d64a6ab19d533937da9107ba298
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c3e45fd3aced541c26cc0e326088f986e7d84f3d20c3f8178f1de7b27303044c
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c4aaa54fadfb0db8bc6921f83398260e95c0c7a12df124a447f18c8a99c608c7
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1bf21825f399573276b614a5a9d8af30444b25aa7421f5be03a7df223b109e28
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/1_trainer_state.json ADDED Viewed

	@@ -0,0 +1,217 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 50,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.08,
+      "grad_norm": 0.446603924036026,
+      "learning_rate": 2e-05,
+      "loss": 0.1359,
+      "step": 2
+    },
+    {
+      "epoch": 0.16,
+      "grad_norm": 0.10891813039779663,
+      "learning_rate": 2e-05,
+      "loss": 0.0153,
+      "step": 4
+    },
+    {
+      "epoch": 0.24,
+      "grad_norm": 0.08321043103933334,
+      "learning_rate": 2e-05,
+      "loss": 0.0524,
+      "step": 6
+    },
+    {
+      "epoch": 0.32,
+      "grad_norm": 1.2470159530639648,
+      "learning_rate": 2e-05,
+      "loss": 0.0364,
+      "step": 8
+    },
+    {
+      "epoch": 0.4,
+      "grad_norm": 0.0992945060133934,
+      "learning_rate": 2e-05,
+      "loss": 0.082,
+      "step": 10
+    },
+    {
+      "epoch": 0.48,
+      "grad_norm": 1.0286638736724854,
+      "learning_rate": 2e-05,
+      "loss": 0.0263,
+      "step": 12
+    },
+    {
+      "epoch": 0.56,
+      "grad_norm": 1.4307641983032227,
+      "learning_rate": 2e-05,
+      "loss": 0.0744,
+      "step": 14
+    },
+    {
+      "epoch": 0.64,
+      "grad_norm": 0.12711121141910553,
+      "learning_rate": 2e-05,
+      "loss": 0.0168,
+      "step": 16
+    },
+    {
+      "epoch": 0.72,
+      "grad_norm": 1.582565426826477,
+      "learning_rate": 2e-05,
+      "loss": 0.0624,
+      "step": 18
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 1.4729337692260742,
+      "learning_rate": 2e-05,
+      "loss": 0.048,
+      "step": 20
+    },
+    {
+      "epoch": 0.88,
+      "grad_norm": 0.009418491274118423,
+      "learning_rate": 2e-05,
+      "loss": 0.0155,
+      "step": 22
+    },
+    {
+      "epoch": 0.96,
+      "grad_norm": 0.010489478707313538,
+      "learning_rate": 2e-05,
+      "loss": 0.0151,
+      "step": 24
+    },
+    {
+      "epoch": 1.04,
+      "grad_norm": 1.960877537727356,
+      "learning_rate": 2e-05,
+      "loss": 0.0259,
+      "step": 26
+    },
+    {
+      "epoch": 1.12,
+      "grad_norm": 0.009839626960456371,
+      "learning_rate": 2e-05,
+      "loss": 0.015,
+      "step": 28
+    },
+    {
+      "epoch": 1.2,
+      "grad_norm": 0.08140977472066879,
+      "learning_rate": 2e-05,
+      "loss": 0.0953,
+      "step": 30
+    },
+    {
+      "epoch": 1.28,
+      "grad_norm": 0.023913130164146423,
+      "learning_rate": 2e-05,
+      "loss": 0.0145,
+      "step": 32
+    },
+    {
+      "epoch": 1.36,
+      "grad_norm": 3.580852746963501,
+      "learning_rate": 2e-05,
+      "loss": 0.1049,
+      "step": 34
+    },
+    {
+      "epoch": 1.44,
+      "grad_norm": 0.009584111161530018,
+      "learning_rate": 2e-05,
+      "loss": 0.0209,
+      "step": 36
+    },
+    {
+      "epoch": 1.52,
+      "grad_norm": 0.00926352571696043,
+      "learning_rate": 2e-05,
+      "loss": 0.0158,
+      "step": 38
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 0.022018805146217346,
+      "learning_rate": 2e-05,
+      "loss": 0.0144,
+      "step": 40
+    },
+    {
+      "epoch": 1.68,
+      "grad_norm": 0.022947989404201508,
+      "learning_rate": 2e-05,
+      "loss": 0.0272,
+      "step": 42
+    },
+    {
+      "epoch": 1.76,
+      "grad_norm": 0.031829629093408585,
+      "learning_rate": 2e-05,
+      "loss": 0.0144,
+      "step": 44
+    },
+    {
+      "epoch": 1.84,
+      "grad_norm": 0.00818221177905798,
+      "learning_rate": 2e-05,
+      "loss": 0.0142,
+      "step": 46
+    },
+    {
+      "epoch": 1.92,
+      "grad_norm": 0.017826130613684654,
+      "learning_rate": 2e-05,
+      "loss": 0.1101,
+      "step": 48
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 0.02396584488451481,
+      "learning_rate": 2e-05,
+      "loss": 0.0145,
+      "step": 50
+    },
+    {
+      "epoch": 2.0,
+      "step": 50,
+      "total_flos": 5308165734268928.0,
+      "train_loss": 0.042700646072626115,
+      "train_runtime": 188.7069,
+      "train_samples_per_second": 1.06,
+      "train_steps_per_second": 0.265
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 50,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5308165734268928.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a678ec3a1eebf6cd19b4a3a86fcfa17a0a3d1bff7e4b323c0e9b39aab849835d
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:002c0fd0d45d95aab8737555c4d1ab0d6d7268708d58af0a97d03cefe871a06a
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:046b63fd84fdf6ddc23d19f4dfe01cc64d7136a420c811c5306034ed8dff2828
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:776b2874adc5a806bfa2f0a2f117b8262c20d7fe6fd49bc20e85d61f785f03a0
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5dc57a934def0e07593f099a111cf66256aa931634f2b19e1d7ab37987939278
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2a554f530ff8c965c942e193a07af99983d5d0c26ef275eff9d868203f414b78
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d095e74a0ace44252b160479986b0e2eee7fa4ca6ca4e8022714bf37b8d5a571
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:709a8cae47012ee03fc01a7f0662490660e0669cdaf3b30fd4faa18163209de5
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/2_trainer_state.json ADDED Viewed

	@@ -0,0 +1,217 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 50,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.08,
+      "grad_norm": 7.620423316955566,
+      "learning_rate": 2e-05,
+      "loss": 0.469,
+      "step": 2
+    },
+    {
+      "epoch": 0.16,
+      "grad_norm": 1.0009398460388184,
+      "learning_rate": 2e-05,
+      "loss": 0.0558,
+      "step": 4
+    },
+    {
+      "epoch": 0.24,
+      "grad_norm": 7.3740949630737305,
+      "learning_rate": 2e-05,
+      "loss": 0.2361,
+      "step": 6
+    },
+    {
+      "epoch": 0.32,
+      "grad_norm": 5.340544700622559,
+      "learning_rate": 2e-05,
+      "loss": 0.375,
+      "step": 8
+    },
+    {
+      "epoch": 0.4,
+      "grad_norm": 3.0642282962799072,
+      "learning_rate": 2e-05,
+      "loss": 0.1286,
+      "step": 10
+    },
+    {
+      "epoch": 0.48,
+      "grad_norm": 8.644904136657715,
+      "learning_rate": 2e-05,
+      "loss": 0.3327,
+      "step": 12
+    },
+    {
+      "epoch": 0.56,
+      "grad_norm": 2.4434633255004883,
+      "learning_rate": 2e-05,
+      "loss": 0.492,
+      "step": 14
+    },
+    {
+      "epoch": 0.64,
+      "grad_norm": 2.4134719371795654,
+      "learning_rate": 2e-05,
+      "loss": 0.452,
+      "step": 16
+    },
+    {
+      "epoch": 0.72,
+      "grad_norm": 2.4050092697143555,
+      "learning_rate": 2e-05,
+      "loss": 0.2468,
+      "step": 18
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 2.544926643371582,
+      "learning_rate": 2e-05,
+      "loss": 0.2707,
+      "step": 20
+    },
+    {
+      "epoch": 0.88,
+      "grad_norm": 0.4770296514034271,
+      "learning_rate": 2e-05,
+      "loss": 0.094,
+      "step": 22
+    },
+    {
+      "epoch": 0.96,
+      "grad_norm": 4.732265949249268,
+      "learning_rate": 2e-05,
+      "loss": 0.2453,
+      "step": 24
+    },
+    {
+      "epoch": 1.04,
+      "grad_norm": 8.252790451049805,
+      "learning_rate": 2e-05,
+      "loss": 0.363,
+      "step": 26
+    },
+    {
+      "epoch": 1.12,
+      "grad_norm": 0.9622191786766052,
+      "learning_rate": 2e-05,
+      "loss": 0.1234,
+      "step": 28
+    },
+    {
+      "epoch": 1.2,
+      "grad_norm": 4.3495564460754395,
+      "learning_rate": 2e-05,
+      "loss": 0.1236,
+      "step": 30
+    },
+    {
+      "epoch": 1.28,
+      "grad_norm": 6.503274440765381,
+      "learning_rate": 2e-05,
+      "loss": 0.7048,
+      "step": 32
+    },
+    {
+      "epoch": 1.36,
+      "grad_norm": 3.046657085418701,
+      "learning_rate": 2e-05,
+      "loss": 0.2559,
+      "step": 34
+    },
+    {
+      "epoch": 1.44,
+      "grad_norm": 6.2532219886779785,
+      "learning_rate": 2e-05,
+      "loss": 0.4904,
+      "step": 36
+    },
+    {
+      "epoch": 1.52,
+      "grad_norm": 5.003266334533691,
+      "learning_rate": 2e-05,
+      "loss": 0.1991,
+      "step": 38
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 7.434990406036377,
+      "learning_rate": 2e-05,
+      "loss": 0.4284,
+      "step": 40
+    },
+    {
+      "epoch": 1.68,
+      "grad_norm": 11.749560356140137,
+      "learning_rate": 2e-05,
+      "loss": 0.7576,
+      "step": 42
+    },
+    {
+      "epoch": 1.76,
+      "grad_norm": 0.8847981095314026,
+      "learning_rate": 2e-05,
+      "loss": 0.0488,
+      "step": 44
+    },
+    {
+      "epoch": 1.84,
+      "grad_norm": 3.2899725437164307,
+      "learning_rate": 2e-05,
+      "loss": 0.2683,
+      "step": 46
+    },
+    {
+      "epoch": 1.92,
+      "grad_norm": 10.162389755249023,
+      "learning_rate": 2e-05,
+      "loss": 0.3719,
+      "step": 48
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 3.9631645679473877,
+      "learning_rate": 2e-05,
+      "loss": 0.2006,
+      "step": 50
+    },
+    {
+      "epoch": 2.0,
+      "step": 50,
+      "total_flos": 5203228526379008.0,
+      "train_loss": 0.30934857606887817,
+      "train_runtime": 194.6247,
+      "train_samples_per_second": 1.028,
+      "train_steps_per_second": 0.257
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 50,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5203228526379008.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2fbb9b3083f4adea56fa40d73ef2d276d34dd1141a1e0b879214fa5297f2a67e
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c2d2bbd2320db1c97e9b8c19641cc4013bd3bdbcb441849f2f5b71259205ef67
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5cf9bee6f3298e1ddf6509dc4d30689d7f14c53515c656a5938157a99ce5038
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:847972a0a4cc0969f6079db8ca3e297823e60fdf891791df893b8be17a649f6d
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5b735d618d85e4fcdf832aa2fa46fc1704052fa38a48cfffefe5432589d28adf
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:668b35e725756d711bf9548304118bdff091fc57487f08deec840e08de74ef0a
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9ff73fbd2d92a8f6232c87ae094040bfb7e7ca7e47656fdcd9bce8f5823f4092
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8bbb12f3d11eb2d3337fc2eddfec53dc06daec64b872efa8fc71743ee8239c95
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/3_trainer_state.json ADDED Viewed

	@@ -0,0 +1,217 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 50,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.08,
+      "grad_norm": 12.495404243469238,
+      "learning_rate": 2e-05,
+      "loss": 0.779,
+      "step": 2
+    },
+    {
+      "epoch": 0.16,
+      "grad_norm": 6.629724502563477,
+      "learning_rate": 2e-05,
+      "loss": 0.5,
+      "step": 4
+    },
+    {
+      "epoch": 0.24,
+      "grad_norm": 7.101356029510498,
+      "learning_rate": 2e-05,
+      "loss": 0.7022,
+      "step": 6
+    },
+    {
+      "epoch": 0.32,
+      "grad_norm": 7.535829067230225,
+      "learning_rate": 2e-05,
+      "loss": 0.9247,
+      "step": 8
+    },
+    {
+      "epoch": 0.4,
+      "grad_norm": 2.729475259780884,
+      "learning_rate": 2e-05,
+      "loss": 0.4091,
+      "step": 10
+    },
+    {
+      "epoch": 0.48,
+      "grad_norm": 8.636240005493164,
+      "learning_rate": 2e-05,
+      "loss": 0.8681,
+      "step": 12
+    },
+    {
+      "epoch": 0.56,
+      "grad_norm": 8.66524600982666,
+      "learning_rate": 2e-05,
+      "loss": 0.7492,
+      "step": 14
+    },
+    {
+      "epoch": 0.64,
+      "grad_norm": 3.2647829055786133,
+      "learning_rate": 2e-05,
+      "loss": 0.4108,
+      "step": 16
+    },
+    {
+      "epoch": 0.72,
+      "grad_norm": 5.925101280212402,
+      "learning_rate": 2e-05,
+      "loss": 0.6516,
+      "step": 18
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 3.2308082580566406,
+      "learning_rate": 2e-05,
+      "loss": 0.4492,
+      "step": 20
+    },
+    {
+      "epoch": 0.88,
+      "grad_norm": 4.235790729522705,
+      "learning_rate": 2e-05,
+      "loss": 0.6326,
+      "step": 22
+    },
+    {
+      "epoch": 0.96,
+      "grad_norm": 4.701728343963623,
+      "learning_rate": 2e-05,
+      "loss": 0.3093,
+      "step": 24
+    },
+    {
+      "epoch": 1.04,
+      "grad_norm": 8.327908515930176,
+      "learning_rate": 2e-05,
+      "loss": 0.5139,
+      "step": 26
+    },
+    {
+      "epoch": 1.12,
+      "grad_norm": 4.828310966491699,
+      "learning_rate": 2e-05,
+      "loss": 0.6246,
+      "step": 28
+    },
+    {
+      "epoch": 1.2,
+      "grad_norm": 7.388039588928223,
+      "learning_rate": 2e-05,
+      "loss": 0.8027,
+      "step": 30
+    },
+    {
+      "epoch": 1.28,
+      "grad_norm": 6.946700096130371,
+      "learning_rate": 2e-05,
+      "loss": 0.5852,
+      "step": 32
+    },
+    {
+      "epoch": 1.36,
+      "grad_norm": 0.9494185447692871,
+      "learning_rate": 2e-05,
+      "loss": 0.3423,
+      "step": 34
+    },
+    {
+      "epoch": 1.44,
+      "grad_norm": 4.723056316375732,
+      "learning_rate": 2e-05,
+      "loss": 0.6249,
+      "step": 36
+    },
+    {
+      "epoch": 1.52,
+      "grad_norm": 3.943333148956299,
+      "learning_rate": 2e-05,
+      "loss": 0.2556,
+      "step": 38
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 2.8990371227264404,
+      "learning_rate": 2e-05,
+      "loss": 0.3113,
+      "step": 40
+    },
+    {
+      "epoch": 1.68,
+      "grad_norm": 5.895607948303223,
+      "learning_rate": 2e-05,
+      "loss": 0.687,
+      "step": 42
+    },
+    {
+      "epoch": 1.76,
+      "grad_norm": 2.503542184829712,
+      "learning_rate": 2e-05,
+      "loss": 0.5024,
+      "step": 44
+    },
+    {
+      "epoch": 1.84,
+      "grad_norm": 6.042721748352051,
+      "learning_rate": 2e-05,
+      "loss": 0.4905,
+      "step": 46
+    },
+    {
+      "epoch": 1.92,
+      "grad_norm": 1.758901834487915,
+      "learning_rate": 2e-05,
+      "loss": 0.7268,
+      "step": 48
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 4.603387355804443,
+      "learning_rate": 2e-05,
+      "loss": 0.2878,
+      "step": 50
+    },
+    {
+      "epoch": 2.0,
+      "step": 50,
+      "total_flos": 5379871421235200.0,
+      "train_loss": 0.5656331896781921,
+      "train_runtime": 188.8767,
+      "train_samples_per_second": 1.059,
+      "train_steps_per_second": 0.265
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 50,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5379871421235200.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eb08e16fa47f8165cdd04de2f96bf67351d5afb5e26d3062daaca4add4cacb6e
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d2c7a3ebf6b75ad8d563055649dd9a3c67c241c89d20f465d03c9cea0290283e
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:93c7d386f0503d5012cab1569ee8733707f70dba8032da855daf25e67911039b
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a4e4be141eba949984993e2c890086131a2d212ae51629882e4cb2e8a7ed944d
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b853c0ef95591cbd7c88b47800c735ac8c4fda60dfd5924f47714cf9d0b9f334
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f0114a706b3459ce20699f3ed2de459d76ff071595681598c417000763c3845c
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6038955452646355952c1af52aa0938ec96a5155c97e81eeebbf3385676f6e3d
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9dce5d8b262c68011e3e8b47d0940963239afc7c98986a7b48601fd1f7483f41
+size 778341034

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/4_trainer_state.json ADDED Viewed

	@@ -0,0 +1,217 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 50,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.08,
+      "grad_norm": 0.3974245488643646,
+      "learning_rate": 2e-05,
+      "loss": 0.319,
+      "step": 2
+    },
+    {
+      "epoch": 0.16,
+      "grad_norm": 0.6956784725189209,
+      "learning_rate": 2e-05,
+      "loss": 0.0874,
+      "step": 4
+    },
+    {
+      "epoch": 0.24,
+      "grad_norm": 4.481583118438721,
+      "learning_rate": 2e-05,
+      "loss": 0.3417,
+      "step": 6
+    },
+    {
+      "epoch": 0.32,
+      "grad_norm": 2.996901512145996,
+      "learning_rate": 2e-05,
+      "loss": 0.4057,
+      "step": 8
+    },
+    {
+      "epoch": 0.4,
+      "grad_norm": 3.626215696334839,
+      "learning_rate": 2e-05,
+      "loss": 0.1893,
+      "step": 10
+    },
+    {
+      "epoch": 0.48,
+      "grad_norm": 3.7142386436462402,
+      "learning_rate": 2e-05,
+      "loss": 0.3213,
+      "step": 12
+    },
+    {
+      "epoch": 0.56,
+      "grad_norm": 3.844820737838745,
+      "learning_rate": 2e-05,
+      "loss": 0.252,
+      "step": 14
+    },
+    {
+      "epoch": 0.64,
+      "grad_norm": 0.8332847952842712,
+      "learning_rate": 2e-05,
+      "loss": 0.4195,
+      "step": 16
+    },
+    {
+      "epoch": 0.72,
+      "grad_norm": 2.419525623321533,
+      "learning_rate": 2e-05,
+      "loss": 0.1124,
+      "step": 18
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 4.048295497894287,
+      "learning_rate": 2e-05,
+      "loss": 0.4657,
+      "step": 20
+    },
+    {
+      "epoch": 0.88,
+      "grad_norm": 1.1390035152435303,
+      "learning_rate": 2e-05,
+      "loss": 0.2091,
+      "step": 22
+    },
+    {
+      "epoch": 0.96,
+      "grad_norm": 9.533462524414062,
+      "learning_rate": 2e-05,
+      "loss": 0.5139,
+      "step": 24
+    },
+    {
+      "epoch": 1.04,
+      "grad_norm": 8.884787559509277,
+      "learning_rate": 2e-05,
+      "loss": 0.72,
+      "step": 26
+    },
+    {
+      "epoch": 1.12,
+      "grad_norm": 11.820172309875488,
+      "learning_rate": 2e-05,
+      "loss": 0.7309,
+      "step": 28
+    },
+    {
+      "epoch": 1.2,
+      "grad_norm": 3.786125421524048,
+      "learning_rate": 2e-05,
+      "loss": 0.2382,
+      "step": 30
+    },
+    {
+      "epoch": 1.28,
+      "grad_norm": 4.292237758636475,
+      "learning_rate": 2e-05,
+      "loss": 0.516,
+      "step": 32
+    },
+    {
+      "epoch": 1.36,
+      "grad_norm": 4.905089378356934,
+      "learning_rate": 2e-05,
+      "loss": 0.4936,
+      "step": 34
+    },
+    {
+      "epoch": 1.44,
+      "grad_norm": 4.8835859298706055,
+      "learning_rate": 2e-05,
+      "loss": 0.425,
+      "step": 36
+    },
+    {
+      "epoch": 1.52,
+      "grad_norm": 5.083212375640869,
+      "learning_rate": 2e-05,
+      "loss": 0.3309,
+      "step": 38
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 3.6019129753112793,
+      "learning_rate": 2e-05,
+      "loss": 0.4558,
+      "step": 40
+    },
+    {
+      "epoch": 1.68,
+      "grad_norm": 2.5178937911987305,
+      "learning_rate": 2e-05,
+      "loss": 0.3123,
+      "step": 42
+    },
+    {
+      "epoch": 1.76,
+      "grad_norm": 3.1368069648742676,
+      "learning_rate": 2e-05,
+      "loss": 0.2818,
+      "step": 44
+    },
+    {
+      "epoch": 1.84,
+      "grad_norm": 2.9503908157348633,
+      "learning_rate": 2e-05,
+      "loss": 0.2565,
+      "step": 46
+    },
+    {
+      "epoch": 1.92,
+      "grad_norm": 3.0946178436279297,
+      "learning_rate": 2e-05,
+      "loss": 0.4001,
+      "step": 48
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 7.015686988830566,
+      "learning_rate": 2e-05,
+      "loss": 0.3228,
+      "step": 50
+    },
+    {
+      "epoch": 2.0,
+      "step": 50,
+      "total_flos": 6019810878029824.0,
+      "train_loss": 0.36482719421386717,
+      "train_runtime": 190.5862,
+      "train_samples_per_second": 1.049,
+      "train_steps_per_second": 0.262
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 50,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 6019810878029824.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/5_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4632c0a7954ad392899f25b025e91ff1a12fb835b79f8cc033da3d88b2763a89
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/5_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af08c046b78b082c9a7a6c1b948e2ffa1b866fcde980f8adbe1e06e2b3e767bb
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/5_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ae2b9cf0d05969ee3ed4f5adde29f1d459afe52b86afd14e56335252e22841e
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/5_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6afa1969e53cc2e368fc21263bc63819b02f23c15ed64631e61c910144d2eae9
+size 778341886

client_states_ditto_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixit50_T0125_decay099_SEED2/5_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:787b721dcc19ec1b987482642be00562f9b7c59cce7f7870cd1d113cab978fc0
+size 778341034