thkim0305
/

feddat_baselines

Model card Files Files and versions Community

thkim0305 committed on about 1 month ago

Commit

54b6f9d

verified ·

1 Parent(s): ee2b77a

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round10.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round12.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round15.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round17.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round2.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round20.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round5.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round7.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_trainer_state.json +126 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round10.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round12.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round15.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round17.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round2.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round20.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round5.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round7.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_trainer_state.json +126 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round10.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round12.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round15.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round17.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round2.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round20.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round5.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round7.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_trainer_state.json +126 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round10.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round12.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round15.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round17.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round2.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round20.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round5.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round7.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_trainer_state.json +126 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round10.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round12.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round15.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round17.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round2.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round20.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round5.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round7.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_trainer_state.json +126 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/5_client_model_round10.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/5_client_model_round12.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/5_client_model_round15.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/5_client_model_round17.pth +3 -0
client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/5_client_model_round2.pth +3 -0

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b9c8b688e7142618dcaf75b8821e014cceda3e8979fdce5093a9069a4a1a4ec9
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff1a052e82f4eec62a35dd8764b6aad1cbebfe9014a124bb5ba10ef4da7d8f00
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:81e8decf5dcc4fb57f4b87504e65019c233bee4c47314f4ea16cb985e230fa53
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2f1d5afb7dd124ccb5cc85da7598e84be573f582e7f939d1d62706208f509aba
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:45586c6182565a1259c385222e9e0ce6254e0caf263527bc1e7d5a4329d199ca
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e284ece48ddd1a8a3b8dd541af6aa3681f6ea653d2297d78c229020ce04ee233
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3651434d61d8d6f5b342f17dbdf811e02b3e075489657fd6da20fbe7c30e969d
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d59111607207bd02602038a0e259bd8995126bbf701addb0c29168eb26291efb
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/0_trainer_state.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 25,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.16,
+      "grad_norm": 2.21482253074646,
+      "learning_rate": 2e-05,
+      "loss": 0.254,
+      "step": 2
+    },
+    {
+      "epoch": 0.32,
+      "grad_norm": 4.312131881713867,
+      "learning_rate": 2e-05,
+      "loss": 0.1656,
+      "step": 4
+    },
+    {
+      "epoch": 0.48,
+      "grad_norm": 1.3984471559524536,
+      "learning_rate": 2e-05,
+      "loss": 0.046,
+      "step": 6
+    },
+    {
+      "epoch": 0.64,
+      "grad_norm": 1.9168689250946045,
+      "learning_rate": 2e-05,
+      "loss": 0.0957,
+      "step": 8
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 2.0672812461853027,
+      "learning_rate": 2e-05,
+      "loss": 0.281,
+      "step": 10
+    },
+    {
+      "epoch": 0.96,
+      "grad_norm": 0.5915671586990356,
+      "learning_rate": 2e-05,
+      "loss": 0.0233,
+      "step": 12
+    },
+    {
+      "epoch": 1.12,
+      "grad_norm": 2.9408771991729736,
+      "learning_rate": 2e-05,
+      "loss": 0.4947,
+      "step": 14
+    },
+    {
+      "epoch": 1.28,
+      "grad_norm": 2.808587074279785,
+      "learning_rate": 2e-05,
+      "loss": 0.1121,
+      "step": 16
+    },
+    {
+      "epoch": 1.44,
+      "grad_norm": 0.9880923628807068,
+      "learning_rate": 2e-05,
+      "loss": 0.0909,
+      "step": 18
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 0.9719083905220032,
+      "learning_rate": 2e-05,
+      "loss": 0.0377,
+      "step": 20
+    },
+    {
+      "epoch": 1.76,
+      "grad_norm": 3.7146573066711426,
+      "learning_rate": 2e-05,
+      "loss": 0.1087,
+      "step": 22
+    },
+    {
+      "epoch": 1.92,
+      "grad_norm": 1.7789965867996216,
+      "learning_rate": 2e-05,
+      "loss": 0.2933,
+      "step": 24
+    },
+    {
+      "epoch": 2.0,
+      "step": 25,
+      "total_flos": 2776472045486080.0,
+      "train_loss": 0.16410446166992188,
+      "train_runtime": 127.3475,
+      "train_samples_per_second": 0.785,
+      "train_steps_per_second": 0.196
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 25,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2776472045486080.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5d734864daeeef65eb7021dea9335af29f9eb355c5c24bd18f1f4c800053454
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:84fb2ded09a75d5375a6580465a16635b5647ea5747b60010cf13c0ff84aad83
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:100f1537486f1307e3311d9dff294c4f3f7ea4855d42a169a52b0478a17f20dc
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:499d6a2dc853680f34ad981ad4ebcc92ade1be79e80bae61d9e21313f4749473
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bbdfaa7ec410f0e21e4be7406985d711d6442247f71b2940a42598fede71a62a
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e599b8fca50af010e1b7f3b36515b2d844e07af4e70c799597761b47654e3f7d
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc518d42a7836ec09008231870f9f4a7ed123eaeeeb09ddeaa7890249744b85e
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:717b1af67a9b2cf721e2297314d6294216f3aacd81c35d45554c3b7af1d22e52
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/1_trainer_state.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 25,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.16,
+      "grad_norm": 0.9727327823638916,
+      "learning_rate": 2e-05,
+      "loss": 0.1592,
+      "step": 2
+    },
+    {
+      "epoch": 0.32,
+      "grad_norm": 0.6119529008865356,
+      "learning_rate": 2e-05,
+      "loss": 0.0155,
+      "step": 4
+    },
+    {
+      "epoch": 0.48,
+      "grad_norm": 0.3699932098388672,
+      "learning_rate": 2e-05,
+      "loss": 0.1359,
+      "step": 6
+    },
+    {
+      "epoch": 0.64,
+      "grad_norm": 0.8428669571876526,
+      "learning_rate": 2e-05,
+      "loss": 0.0421,
+      "step": 8
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 0.8032307028770447,
+      "learning_rate": 2e-05,
+      "loss": 0.0221,
+      "step": 10
+    },
+    {
+      "epoch": 0.96,
+      "grad_norm": 3.484509229660034,
+      "learning_rate": 2e-05,
+      "loss": 0.0962,
+      "step": 12
+    },
+    {
+      "epoch": 1.12,
+      "grad_norm": 0.48723894357681274,
+      "learning_rate": 2e-05,
+      "loss": 0.0181,
+      "step": 14
+    },
+    {
+      "epoch": 1.28,
+      "grad_norm": 1.0781177282333374,
+      "learning_rate": 2e-05,
+      "loss": 0.0448,
+      "step": 16
+    },
+    {
+      "epoch": 1.44,
+      "grad_norm": 2.618180513381958,
+      "learning_rate": 2e-05,
+      "loss": 0.0524,
+      "step": 18
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 1.0576213598251343,
+      "learning_rate": 2e-05,
+      "loss": 0.0496,
+      "step": 20
+    },
+    {
+      "epoch": 1.76,
+      "grad_norm": 0.34326815605163574,
+      "learning_rate": 2e-05,
+      "loss": 0.0519,
+      "step": 22
+    },
+    {
+      "epoch": 1.92,
+      "grad_norm": 0.4327654540538788,
+      "learning_rate": 2e-05,
+      "loss": 0.0183,
+      "step": 24
+    },
+    {
+      "epoch": 2.0,
+      "step": 25,
+      "total_flos": 2795254289793024.0,
+      "train_loss": 0.056924142837524415,
+      "train_runtime": 128.058,
+      "train_samples_per_second": 0.781,
+      "train_steps_per_second": 0.195
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 25,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2795254289793024.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:04fecbc85501e3f0cbafe9f13108201d8d0cc03eee280d106fab39629624a568
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:900c97291ffa7ede12bdecdf80234c6c599d18f68c242a39b512946e6c2f8cf8
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:13ca03010d565b6648c1c2de72ac1971fc3ee336ef441ce2e2aed880590d3b3a
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3a1389dff1c58aca0343be04ac4ada1f12834b18b9ba70342bcb3bb424deb3eb
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:53b54b947a97e393bb76780d4174ca2bbe266b6d5e26d162c4f4a73a0797ac57
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:adb0272b9ee55de14b7c86ea70901588d1a894e126974d841e223f610b306e7a
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c44442470cf3659d87e0e4d6a63a497b9fbf71c54dce14abe746671e4579c02e
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e9064a8ac3feffdefe6bf934222792abbcf01e91958439277a311697049e0fd
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/2_trainer_state.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 25,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.16,
+      "grad_norm": 3.542206287384033,
+      "learning_rate": 2e-05,
+      "loss": 0.3763,
+      "step": 2
+    },
+    {
+      "epoch": 0.32,
+      "grad_norm": 0.5754655003547668,
+      "learning_rate": 2e-05,
+      "loss": 0.0481,
+      "step": 4
+    },
+    {
+      "epoch": 0.48,
+      "grad_norm": 2.7304298877716064,
+      "learning_rate": 2e-05,
+      "loss": 0.3178,
+      "step": 6
+    },
+    {
+      "epoch": 0.64,
+      "grad_norm": 0.6067225337028503,
+      "learning_rate": 2e-05,
+      "loss": 0.1304,
+      "step": 8
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 2.869699478149414,
+      "learning_rate": 2e-05,
+      "loss": 0.3075,
+      "step": 10
+    },
+    {
+      "epoch": 0.96,
+      "grad_norm": 0.8252665400505066,
+      "learning_rate": 2e-05,
+      "loss": 0.052,
+      "step": 12
+    },
+    {
+      "epoch": 1.12,
+      "grad_norm": 0.7447052001953125,
+      "learning_rate": 2e-05,
+      "loss": 0.1314,
+      "step": 14
+    },
+    {
+      "epoch": 1.28,
+      "grad_norm": 1.8536393642425537,
+      "learning_rate": 2e-05,
+      "loss": 0.156,
+      "step": 16
+    },
+    {
+      "epoch": 1.44,
+      "grad_norm": 2.449882984161377,
+      "learning_rate": 2e-05,
+      "loss": 0.4599,
+      "step": 18
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 2.2815041542053223,
+      "learning_rate": 2e-05,
+      "loss": 0.1967,
+      "step": 20
+    },
+    {
+      "epoch": 1.76,
+      "grad_norm": 1.0439902544021606,
+      "learning_rate": 2e-05,
+      "loss": 0.0865,
+      "step": 22
+    },
+    {
+      "epoch": 1.92,
+      "grad_norm": 0.8892500400543213,
+      "learning_rate": 2e-05,
+      "loss": 0.1329,
+      "step": 24
+    },
+    {
+      "epoch": 2.0,
+      "step": 25,
+      "total_flos": 2742967366320128.0,
+      "train_loss": 0.20229598999023438,
+      "train_runtime": 129.0449,
+      "train_samples_per_second": 0.775,
+      "train_steps_per_second": 0.194
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 25,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2742967366320128.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:62a56161ae4aea304a7df9a9a113695fb5847d8c18e181bc080678fcc6fb4875
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0b4398903d3135bc4481596590877e68395fdc308315b96f238f1c15f0d16e57
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:970b453869a990122c0c8f00dc95e9ff5ad81f43dfaa9885da5faf1fb482cc8d
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b858ad0106605ad21b9dd5c0180ee9eeed29295087cc8068531e7f9819399952
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4057d89e942597802e900271f93eb3596ee5ffd6f4e859a52c304255d17b01d8
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:90afaea929330aaaa94280ce0cd71eefce98e1860fc5097ccd03750f0ae8c2b3
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:064b3b483d035f11c9129805ff0c111cf83b048c71e2b9e14c46ba3da0f819da
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:66ed624f357ad2a852d69c1eadc605ac44e8b42f8db87c045ce8b8d10a5057c2
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/3_trainer_state.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 25,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.16,
+      "grad_norm": 2.5665788650512695,
+      "learning_rate": 2e-05,
+      "loss": 0.6774,
+      "step": 2
+    },
+    {
+      "epoch": 0.32,
+      "grad_norm": 3.874232053756714,
+      "learning_rate": 2e-05,
+      "loss": 0.4658,
+      "step": 4
+    },
+    {
+      "epoch": 0.48,
+      "grad_norm": 2.8483521938323975,
+      "learning_rate": 2e-05,
+      "loss": 0.2574,
+      "step": 6
+    },
+    {
+      "epoch": 0.64,
+      "grad_norm": 2.191157579421997,
+      "learning_rate": 2e-05,
+      "loss": 0.1927,
+      "step": 8
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 3.0909106731414795,
+      "learning_rate": 2e-05,
+      "loss": 0.311,
+      "step": 10
+    },
+    {
+      "epoch": 0.96,
+      "grad_norm": 2.030684232711792,
+      "learning_rate": 2e-05,
+      "loss": 0.2952,
+      "step": 12
+    },
+    {
+      "epoch": 1.12,
+      "grad_norm": 2.7925920486450195,
+      "learning_rate": 2e-05,
+      "loss": 0.3441,
+      "step": 14
+    },
+    {
+      "epoch": 1.28,
+      "grad_norm": 3.240939140319824,
+      "learning_rate": 2e-05,
+      "loss": 0.3284,
+      "step": 16
+    },
+    {
+      "epoch": 1.44,
+      "grad_norm": 2.8805136680603027,
+      "learning_rate": 2e-05,
+      "loss": 0.351,
+      "step": 18
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 2.0048928260803223,
+      "learning_rate": 2e-05,
+      "loss": 0.4163,
+      "step": 20
+    },
+    {
+      "epoch": 1.76,
+      "grad_norm": 1.862860918045044,
+      "learning_rate": 2e-05,
+      "loss": 0.2851,
+      "step": 22
+    },
+    {
+      "epoch": 1.92,
+      "grad_norm": 3.4276328086853027,
+      "learning_rate": 2e-05,
+      "loss": 0.3383,
+      "step": 24
+    },
+    {
+      "epoch": 2.0,
+      "step": 25,
+      "total_flos": 2838752368001024.0,
+      "train_loss": 0.3459229278564453,
+      "train_runtime": 127.6119,
+      "train_samples_per_second": 0.784,
+      "train_steps_per_second": 0.196
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 25,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2838752368001024.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eaa403e2cab3dc6a153a854eafe26b8c044eace3fd625339aaa2f842064ce6fc
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6ac8eadce9154f4ccc978ff304d55ad47849b685fa2a8d507d9412b4da249b5b
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc05bcb183cd20f96a0281e831fa50420f07adbcbaca8a204d153a639ea32559
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f444a8ed2f532a74b9e774e41a3f3738217f0c5956d255d807db6847712ae547
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6d0f1358c23df3d76db42b1a746bb4bccaefd9f82304f58330fd74aff529339
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9dab3512773e75eaf70c2cc65274792a114aaf002f765de81df59c5ef3ee2cac
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e75fd605342d2ef9e69fe71a7a48af89c32d5940c0b1e0c7fe6ae1cda4426e9
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_client_model_round7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e15e9678154d5ba223b7e407839330af436f55e9d8a70e19ebd34091df309eb2
+size 1167511866

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/4_trainer_state.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 25,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.16,
+      "grad_norm": 4.487705230712891,
+      "learning_rate": 2e-05,
+      "loss": 0.4972,
+      "step": 2
+    },
+    {
+      "epoch": 0.32,
+      "grad_norm": 0.9496861100196838,
+      "learning_rate": 2e-05,
+      "loss": 0.1444,
+      "step": 4
+    },
+    {
+      "epoch": 0.48,
+      "grad_norm": 3.0709917545318604,
+      "learning_rate": 2e-05,
+      "loss": 0.4052,
+      "step": 6
+    },
+    {
+      "epoch": 0.64,
+      "grad_norm": 1.8949023485183716,
+      "learning_rate": 2e-05,
+      "loss": 0.2446,
+      "step": 8
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 1.549836277961731,
+      "learning_rate": 2e-05,
+      "loss": 0.1589,
+      "step": 10
+    },
+    {
+      "epoch": 0.96,
+      "grad_norm": 2.86405611038208,
+      "learning_rate": 2e-05,
+      "loss": 0.1817,
+      "step": 12
+    },
+    {
+      "epoch": 1.12,
+      "grad_norm": 2.9263083934783936,
+      "learning_rate": 2e-05,
+      "loss": 0.2236,
+      "step": 14
+    },
+    {
+      "epoch": 1.28,
+      "grad_norm": 3.8913233280181885,
+      "learning_rate": 2e-05,
+      "loss": 0.4171,
+      "step": 16
+    },
+    {
+      "epoch": 1.44,
+      "grad_norm": 1.5427923202514648,
+      "learning_rate": 2e-05,
+      "loss": 0.2518,
+      "step": 18
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 0.7112218141555786,
+      "learning_rate": 2e-05,
+      "loss": 0.1182,
+      "step": 20
+    },
+    {
+      "epoch": 1.76,
+      "grad_norm": 2.249495267868042,
+      "learning_rate": 2e-05,
+      "loss": 0.2611,
+      "step": 22
+    },
+    {
+      "epoch": 1.92,
+      "grad_norm": 0.6617293357849121,
+      "learning_rate": 2e-05,
+      "loss": 0.0596,
+      "step": 24
+    },
+    {
+      "epoch": 2.0,
+      "step": 25,
+      "total_flos": 3177992868069376.0,
+      "train_loss": 0.24374237060546874,
+      "train_runtime": 129.5612,
+      "train_samples_per_second": 0.772,
+      "train_steps_per_second": 0.193
+    }
+  ],
+  "logging_steps": 2,
+  "max_steps": 25,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": false,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3177992868069376.0,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/5_client_model_round10.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cbfc914d9fb77a9a27937b96bae1f4c35e85707f3dc2bca9f39e234f6b15da6c
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/5_client_model_round12.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5f71948f039dbd0c495f3488ae535041a78add0a84677408ae64140352e50b7a
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/5_client_model_round15.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bcfc5d301bcfcf1205745180936f62723fae2c47eef4b29122357a98aa6459c7
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/5_client_model_round17.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e0a1d7b998b28a6967c389f2f77276745d8a966dd0fed0fdc88c44477f0b59c2
+size 1167513110

client_states_feddat_bs4_saveoptim_lr2e-5_sc310_4tasks_5rounds_fixitr25_T0125_decay099/5_client_model_round2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c56f66437b479eac7767ffb1c7468ce29eb22eefe6042a309c694a7ccfe53099
+size 1167511866