thkim0305 commited on
Commit
466415b
·
verified ·
1 Parent(s): 6372514

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round10.pth +3 -0
  2. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round12.pth +3 -0
  3. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round15.pth +3 -0
  4. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round17.pth +3 -0
  5. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round2.pth +3 -0
  6. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round20.pth +3 -0
  7. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round5.pth +3 -0
  8. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round7.pth +3 -0
  9. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_trainer_state.json +217 -0
  10. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round10.pth +3 -0
  11. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round12.pth +3 -0
  12. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round15.pth +3 -0
  13. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round17.pth +3 -0
  14. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round2.pth +3 -0
  15. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round20.pth +3 -0
  16. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round5.pth +3 -0
  17. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round7.pth +3 -0
  18. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_trainer_state.json +217 -0
  19. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round10.pth +3 -0
  20. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round12.pth +3 -0
  21. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round15.pth +3 -0
  22. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round17.pth +3 -0
  23. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round2.pth +3 -0
  24. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round20.pth +3 -0
  25. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round5.pth +3 -0
  26. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round7.pth +3 -0
  27. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_trainer_state.json +217 -0
  28. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round10.pth +3 -0
  29. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round12.pth +3 -0
  30. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round15.pth +3 -0
  31. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round17.pth +3 -0
  32. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round2.pth +3 -0
  33. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round20.pth +3 -0
  34. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round5.pth +3 -0
  35. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round7.pth +3 -0
  36. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_trainer_state.json +217 -0
  37. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round10.pth +3 -0
  38. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round12.pth +3 -0
  39. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round15.pth +3 -0
  40. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round17.pth +3 -0
  41. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round2.pth +3 -0
  42. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round20.pth +3 -0
  43. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round5.pth +3 -0
  44. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round7.pth +3 -0
  45. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_trainer_state.json +217 -0
  46. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/5_client_model_round10.pth +3 -0
  47. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/5_client_model_round12.pth +3 -0
  48. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/5_client_model_round15.pth +3 -0
  49. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/5_client_model_round17.pth +3 -0
  50. client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/5_client_model_round2.pth +3 -0
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round10.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:baac5c7fa34f7abbe70a9da273a82920695c3701cd55ab77f909e37a1d5f981b
3
+ size 552665798
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round12.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51ab1440183e159defe4b19c41f9616ce88b8fd601ab70bc16fd402c11836bc2
3
+ size 552665798
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round15.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e43bf4412ef4c452ee595f310fa274a05dda02620848265ef888e6babebd168
3
+ size 552665798
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round17.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9b2ae12f7fa3263983913d324347a7b8b95b167b8365d44988d0635ca1ff711
3
+ size 552665798
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57ce84cb92420647782926637a39060335b94fb366ad3ee969f27b8db17e0924
3
+ size 552664386
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round20.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78e18d1749cfd317a4280abff888be0428df7e2ca560740a9fc4532992594528
3
+ size 552665798
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0251bd78c66dade13402bc0c1dcab5cb5bfaecff500c3e179b9819f7d8e7471d
3
+ size 552664386
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_client_model_round7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aaa3d9af1c7c73a11b97dd6719cc38e2e5c6198a599f7a594b00deae218ce39
3
+ size 552664386
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/0_trainer_state.json ADDED
@@ -0,0 +1,217 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 2.0,
5
+ "eval_steps": 500,
6
+ "global_step": 50,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.08,
13
+ "grad_norm": 2.932952880859375,
14
+ "learning_rate": 2e-05,
15
+ "loss": 0.5314,
16
+ "step": 2
17
+ },
18
+ {
19
+ "epoch": 0.16,
20
+ "grad_norm": 3.822000741958618,
21
+ "learning_rate": 2e-05,
22
+ "loss": 0.3525,
23
+ "step": 4
24
+ },
25
+ {
26
+ "epoch": 0.24,
27
+ "grad_norm": 5.802279472351074,
28
+ "learning_rate": 2e-05,
29
+ "loss": 0.3069,
30
+ "step": 6
31
+ },
32
+ {
33
+ "epoch": 0.32,
34
+ "grad_norm": 3.4869275093078613,
35
+ "learning_rate": 2e-05,
36
+ "loss": 0.4767,
37
+ "step": 8
38
+ },
39
+ {
40
+ "epoch": 0.4,
41
+ "grad_norm": 2.567089796066284,
42
+ "learning_rate": 2e-05,
43
+ "loss": 0.3478,
44
+ "step": 10
45
+ },
46
+ {
47
+ "epoch": 0.48,
48
+ "grad_norm": 3.539039134979248,
49
+ "learning_rate": 2e-05,
50
+ "loss": 0.283,
51
+ "step": 12
52
+ },
53
+ {
54
+ "epoch": 0.56,
55
+ "grad_norm": 4.298175811767578,
56
+ "learning_rate": 2e-05,
57
+ "loss": 0.5666,
58
+ "step": 14
59
+ },
60
+ {
61
+ "epoch": 0.64,
62
+ "grad_norm": 1.6652226448059082,
63
+ "learning_rate": 2e-05,
64
+ "loss": 0.3015,
65
+ "step": 16
66
+ },
67
+ {
68
+ "epoch": 0.72,
69
+ "grad_norm": 2.662271022796631,
70
+ "learning_rate": 2e-05,
71
+ "loss": 0.3835,
72
+ "step": 18
73
+ },
74
+ {
75
+ "epoch": 0.8,
76
+ "grad_norm": 2.015277147293091,
77
+ "learning_rate": 2e-05,
78
+ "loss": 0.3641,
79
+ "step": 20
80
+ },
81
+ {
82
+ "epoch": 0.88,
83
+ "grad_norm": 5.836124420166016,
84
+ "learning_rate": 2e-05,
85
+ "loss": 0.3512,
86
+ "step": 22
87
+ },
88
+ {
89
+ "epoch": 0.96,
90
+ "grad_norm": 3.8210253715515137,
91
+ "learning_rate": 2e-05,
92
+ "loss": 0.543,
93
+ "step": 24
94
+ },
95
+ {
96
+ "epoch": 1.04,
97
+ "grad_norm": 2.18196177482605,
98
+ "learning_rate": 2e-05,
99
+ "loss": 0.3859,
100
+ "step": 26
101
+ },
102
+ {
103
+ "epoch": 1.12,
104
+ "grad_norm": 4.2598490715026855,
105
+ "learning_rate": 2e-05,
106
+ "loss": 0.513,
107
+ "step": 28
108
+ },
109
+ {
110
+ "epoch": 1.2,
111
+ "grad_norm": 4.595355033874512,
112
+ "learning_rate": 2e-05,
113
+ "loss": 0.499,
114
+ "step": 30
115
+ },
116
+ {
117
+ "epoch": 1.28,
118
+ "grad_norm": 1.4477527141571045,
119
+ "learning_rate": 2e-05,
120
+ "loss": 0.2842,
121
+ "step": 32
122
+ },
123
+ {
124
+ "epoch": 1.36,
125
+ "grad_norm": 1.8463199138641357,
126
+ "learning_rate": 2e-05,
127
+ "loss": 0.3556,
128
+ "step": 34
129
+ },
130
+ {
131
+ "epoch": 1.44,
132
+ "grad_norm": 2.7618906497955322,
133
+ "learning_rate": 2e-05,
134
+ "loss": 0.3364,
135
+ "step": 36
136
+ },
137
+ {
138
+ "epoch": 1.52,
139
+ "grad_norm": 1.7495309114456177,
140
+ "learning_rate": 2e-05,
141
+ "loss": 0.4357,
142
+ "step": 38
143
+ },
144
+ {
145
+ "epoch": 1.6,
146
+ "grad_norm": 1.9298914670944214,
147
+ "learning_rate": 2e-05,
148
+ "loss": 0.3546,
149
+ "step": 40
150
+ },
151
+ {
152
+ "epoch": 1.68,
153
+ "grad_norm": 1.783296823501587,
154
+ "learning_rate": 2e-05,
155
+ "loss": 0.3618,
156
+ "step": 42
157
+ },
158
+ {
159
+ "epoch": 1.76,
160
+ "grad_norm": 2.6802752017974854,
161
+ "learning_rate": 2e-05,
162
+ "loss": 0.2909,
163
+ "step": 44
164
+ },
165
+ {
166
+ "epoch": 1.84,
167
+ "grad_norm": 4.639962196350098,
168
+ "learning_rate": 2e-05,
169
+ "loss": 0.4994,
170
+ "step": 46
171
+ },
172
+ {
173
+ "epoch": 1.92,
174
+ "grad_norm": 2.44413423538208,
175
+ "learning_rate": 2e-05,
176
+ "loss": 0.2855,
177
+ "step": 48
178
+ },
179
+ {
180
+ "epoch": 2.0,
181
+ "grad_norm": 2.5618817806243896,
182
+ "learning_rate": 2e-05,
183
+ "loss": 0.4125,
184
+ "step": 50
185
+ },
186
+ {
187
+ "epoch": 2.0,
188
+ "step": 50,
189
+ "total_flos": 6495660656295936.0,
190
+ "train_loss": 0.39289794921875,
191
+ "train_runtime": 218.0875,
192
+ "train_samples_per_second": 0.917,
193
+ "train_steps_per_second": 0.229
194
+ }
195
+ ],
196
+ "logging_steps": 2,
197
+ "max_steps": 50,
198
+ "num_input_tokens_seen": 0,
199
+ "num_train_epochs": 1,
200
+ "save_steps": 500,
201
+ "stateful_callbacks": {
202
+ "TrainerControl": {
203
+ "args": {
204
+ "should_epoch_stop": false,
205
+ "should_evaluate": false,
206
+ "should_log": false,
207
+ "should_save": false,
208
+ "should_training_stop": false
209
+ },
210
+ "attributes": {}
211
+ }
212
+ },
213
+ "total_flos": 6495660656295936.0,
214
+ "train_batch_size": 1,
215
+ "trial_name": null,
216
+ "trial_params": null
217
+ }
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round10.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1e2f51e5c4b4ce8b50dd156885f154dc9a1835600722644b602927c82464181
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round12.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a0d19843aa4cde7bd0328aeeb235d0b580643798f5c0b5382401f2a2147fca7
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round15.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1befb229ebaa2464096851934340eb02dc86e6153da3ec998204e22b1a9f948
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round17.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d9383d3115a5d5416d2074ea72f9e096ac05d26b65fb44322a6ab774a600ce8
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:615b867e4d61e590ab06abc5774b2193679d80500b822238575ff2d14a50c2bc
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round20.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dd8314b48d43020977fba59192e7bb5ae9c69fac55ddc2a1f08a7bb0432d4ea
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd58cc9991de32e09b77a096799786646b7239b8ac77d50ed4db19bf6eed3809
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_client_model_round7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:379e9901e0f0b82e410228552fe224862cdd4ef747b71f1e4061368040fd9f1f
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/1_trainer_state.json ADDED
@@ -0,0 +1,217 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 2.0,
5
+ "eval_steps": 500,
6
+ "global_step": 50,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.08,
13
+ "grad_norm": 2.749955177307129,
14
+ "learning_rate": 2e-05,
15
+ "loss": 0.2649,
16
+ "step": 2
17
+ },
18
+ {
19
+ "epoch": 0.16,
20
+ "grad_norm": 1.4382448196411133,
21
+ "learning_rate": 2e-05,
22
+ "loss": 0.2711,
23
+ "step": 4
24
+ },
25
+ {
26
+ "epoch": 0.24,
27
+ "grad_norm": 4.895969867706299,
28
+ "learning_rate": 2e-05,
29
+ "loss": 0.2815,
30
+ "step": 6
31
+ },
32
+ {
33
+ "epoch": 0.32,
34
+ "grad_norm": 5.649667263031006,
35
+ "learning_rate": 2e-05,
36
+ "loss": 0.3085,
37
+ "step": 8
38
+ },
39
+ {
40
+ "epoch": 0.4,
41
+ "grad_norm": 0.716244101524353,
42
+ "learning_rate": 2e-05,
43
+ "loss": 0.24,
44
+ "step": 10
45
+ },
46
+ {
47
+ "epoch": 0.48,
48
+ "grad_norm": 1.6991527080535889,
49
+ "learning_rate": 2e-05,
50
+ "loss": 0.3214,
51
+ "step": 12
52
+ },
53
+ {
54
+ "epoch": 0.56,
55
+ "grad_norm": 1.6699107885360718,
56
+ "learning_rate": 2e-05,
57
+ "loss": 0.2465,
58
+ "step": 14
59
+ },
60
+ {
61
+ "epoch": 0.64,
62
+ "grad_norm": 2.105787754058838,
63
+ "learning_rate": 2e-05,
64
+ "loss": 0.3417,
65
+ "step": 16
66
+ },
67
+ {
68
+ "epoch": 0.72,
69
+ "grad_norm": 4.364802837371826,
70
+ "learning_rate": 2e-05,
71
+ "loss": 0.3676,
72
+ "step": 18
73
+ },
74
+ {
75
+ "epoch": 0.8,
76
+ "grad_norm": 2.29569935798645,
77
+ "learning_rate": 2e-05,
78
+ "loss": 0.281,
79
+ "step": 20
80
+ },
81
+ {
82
+ "epoch": 0.88,
83
+ "grad_norm": 1.7581946849822998,
84
+ "learning_rate": 2e-05,
85
+ "loss": 0.3416,
86
+ "step": 22
87
+ },
88
+ {
89
+ "epoch": 0.96,
90
+ "grad_norm": 3.826268434524536,
91
+ "learning_rate": 2e-05,
92
+ "loss": 0.2493,
93
+ "step": 24
94
+ },
95
+ {
96
+ "epoch": 1.04,
97
+ "grad_norm": 3.0750234127044678,
98
+ "learning_rate": 2e-05,
99
+ "loss": 0.2869,
100
+ "step": 26
101
+ },
102
+ {
103
+ "epoch": 1.12,
104
+ "grad_norm": 1.9488271474838257,
105
+ "learning_rate": 2e-05,
106
+ "loss": 0.1758,
107
+ "step": 28
108
+ },
109
+ {
110
+ "epoch": 1.2,
111
+ "grad_norm": 4.114802360534668,
112
+ "learning_rate": 2e-05,
113
+ "loss": 0.2838,
114
+ "step": 30
115
+ },
116
+ {
117
+ "epoch": 1.28,
118
+ "grad_norm": 0.724159300327301,
119
+ "learning_rate": 2e-05,
120
+ "loss": 0.2123,
121
+ "step": 32
122
+ },
123
+ {
124
+ "epoch": 1.36,
125
+ "grad_norm": 1.6088128089904785,
126
+ "learning_rate": 2e-05,
127
+ "loss": 0.3138,
128
+ "step": 34
129
+ },
130
+ {
131
+ "epoch": 1.44,
132
+ "grad_norm": 0.7843464612960815,
133
+ "learning_rate": 2e-05,
134
+ "loss": 0.1969,
135
+ "step": 36
136
+ },
137
+ {
138
+ "epoch": 1.52,
139
+ "grad_norm": 3.61417555809021,
140
+ "learning_rate": 2e-05,
141
+ "loss": 0.2673,
142
+ "step": 38
143
+ },
144
+ {
145
+ "epoch": 1.6,
146
+ "grad_norm": 1.9792591333389282,
147
+ "learning_rate": 2e-05,
148
+ "loss": 0.4543,
149
+ "step": 40
150
+ },
151
+ {
152
+ "epoch": 1.68,
153
+ "grad_norm": 0.7923887968063354,
154
+ "learning_rate": 2e-05,
155
+ "loss": 0.1804,
156
+ "step": 42
157
+ },
158
+ {
159
+ "epoch": 1.76,
160
+ "grad_norm": 1.6938939094543457,
161
+ "learning_rate": 2e-05,
162
+ "loss": 0.3715,
163
+ "step": 44
164
+ },
165
+ {
166
+ "epoch": 1.84,
167
+ "grad_norm": 6.056423664093018,
168
+ "learning_rate": 2e-05,
169
+ "loss": 0.4008,
170
+ "step": 46
171
+ },
172
+ {
173
+ "epoch": 1.92,
174
+ "grad_norm": 4.530152797698975,
175
+ "learning_rate": 2e-05,
176
+ "loss": 0.2846,
177
+ "step": 48
178
+ },
179
+ {
180
+ "epoch": 2.0,
181
+ "grad_norm": 2.6243064403533936,
182
+ "learning_rate": 2e-05,
183
+ "loss": 0.3465,
184
+ "step": 50
185
+ },
186
+ {
187
+ "epoch": 2.0,
188
+ "step": 50,
189
+ "total_flos": 1.4215755016962048e+16,
190
+ "train_loss": 0.2916001892089844,
191
+ "train_runtime": 387.8399,
192
+ "train_samples_per_second": 0.516,
193
+ "train_steps_per_second": 0.129
194
+ }
195
+ ],
196
+ "logging_steps": 2,
197
+ "max_steps": 50,
198
+ "num_input_tokens_seen": 0,
199
+ "num_train_epochs": 1,
200
+ "save_steps": 500,
201
+ "stateful_callbacks": {
202
+ "TrainerControl": {
203
+ "args": {
204
+ "should_epoch_stop": false,
205
+ "should_evaluate": false,
206
+ "should_log": false,
207
+ "should_save": false,
208
+ "should_training_stop": false
209
+ },
210
+ "attributes": {}
211
+ }
212
+ },
213
+ "total_flos": 1.4215755016962048e+16,
214
+ "train_batch_size": 1,
215
+ "trial_name": null,
216
+ "trial_params": null
217
+ }
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round10.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a21c2139a4174460f7c0d04af2be4e3042d81f2cc8eb01c396770c000ffe2be
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round12.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6572415c32ad9dfa2917fea3c74c68394140361dc0e3973c7f7bd40a70e3b49
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round15.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:688bcb956c0d91fb7205f6b81d6ad5cd0aee3e9693d8771d0a398c01faaafa1c
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round17.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07432c3da93d004c13b7dbbd7c3201ccd2dc6ab4db4657c2de1579c488c50948
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d194f859ed4b51668bd52e6eee922b7d8221d87668c547ae273c6530534fda7a
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round20.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2ae74fd22bff8e1c43217046417eb3104afa95be6b8197439601360dcf330f9
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1af0d169f1995278d2e4566cdb320da339e9bc22c08c9328a1dd7fac5ad03959
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_client_model_round7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:699af45d647dd93265f825382f017c41e17cf0f528760ab997a1438e7779e2e0
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/2_trainer_state.json ADDED
@@ -0,0 +1,217 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 2.0,
5
+ "eval_steps": 500,
6
+ "global_step": 50,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.08,
13
+ "grad_norm": 1.0149972438812256,
14
+ "learning_rate": 2e-05,
15
+ "loss": 0.2957,
16
+ "step": 2
17
+ },
18
+ {
19
+ "epoch": 0.16,
20
+ "grad_norm": 3.677619218826294,
21
+ "learning_rate": 2e-05,
22
+ "loss": 0.1877,
23
+ "step": 4
24
+ },
25
+ {
26
+ "epoch": 0.24,
27
+ "grad_norm": 1.4091416597366333,
28
+ "learning_rate": 2e-05,
29
+ "loss": 0.5256,
30
+ "step": 6
31
+ },
32
+ {
33
+ "epoch": 0.32,
34
+ "grad_norm": 5.1624979972839355,
35
+ "learning_rate": 2e-05,
36
+ "loss": 0.3192,
37
+ "step": 8
38
+ },
39
+ {
40
+ "epoch": 0.4,
41
+ "grad_norm": 3.683704376220703,
42
+ "learning_rate": 2e-05,
43
+ "loss": 0.2963,
44
+ "step": 10
45
+ },
46
+ {
47
+ "epoch": 0.48,
48
+ "grad_norm": 4.079484939575195,
49
+ "learning_rate": 2e-05,
50
+ "loss": 0.2549,
51
+ "step": 12
52
+ },
53
+ {
54
+ "epoch": 0.56,
55
+ "grad_norm": 1.7549387216567993,
56
+ "learning_rate": 2e-05,
57
+ "loss": 0.2847,
58
+ "step": 14
59
+ },
60
+ {
61
+ "epoch": 0.64,
62
+ "grad_norm": 3.3598456382751465,
63
+ "learning_rate": 2e-05,
64
+ "loss": 0.2677,
65
+ "step": 16
66
+ },
67
+ {
68
+ "epoch": 0.72,
69
+ "grad_norm": 2.487851619720459,
70
+ "learning_rate": 2e-05,
71
+ "loss": 0.1727,
72
+ "step": 18
73
+ },
74
+ {
75
+ "epoch": 0.8,
76
+ "grad_norm": 4.575611114501953,
77
+ "learning_rate": 2e-05,
78
+ "loss": 0.3743,
79
+ "step": 20
80
+ },
81
+ {
82
+ "epoch": 0.88,
83
+ "grad_norm": 3.5113894939422607,
84
+ "learning_rate": 2e-05,
85
+ "loss": 0.1855,
86
+ "step": 22
87
+ },
88
+ {
89
+ "epoch": 0.96,
90
+ "grad_norm": 6.549233913421631,
91
+ "learning_rate": 2e-05,
92
+ "loss": 0.3081,
93
+ "step": 24
94
+ },
95
+ {
96
+ "epoch": 1.04,
97
+ "grad_norm": 3.901048421859741,
98
+ "learning_rate": 2e-05,
99
+ "loss": 0.205,
100
+ "step": 26
101
+ },
102
+ {
103
+ "epoch": 1.12,
104
+ "grad_norm": 3.9782521724700928,
105
+ "learning_rate": 2e-05,
106
+ "loss": 0.4042,
107
+ "step": 28
108
+ },
109
+ {
110
+ "epoch": 1.2,
111
+ "grad_norm": 4.073624134063721,
112
+ "learning_rate": 2e-05,
113
+ "loss": 0.2591,
114
+ "step": 30
115
+ },
116
+ {
117
+ "epoch": 1.28,
118
+ "grad_norm": 3.9109604358673096,
119
+ "learning_rate": 2e-05,
120
+ "loss": 0.4173,
121
+ "step": 32
122
+ },
123
+ {
124
+ "epoch": 1.36,
125
+ "grad_norm": 6.071135520935059,
126
+ "learning_rate": 2e-05,
127
+ "loss": 0.3733,
128
+ "step": 34
129
+ },
130
+ {
131
+ "epoch": 1.44,
132
+ "grad_norm": 6.133024215698242,
133
+ "learning_rate": 2e-05,
134
+ "loss": 0.6257,
135
+ "step": 36
136
+ },
137
+ {
138
+ "epoch": 1.52,
139
+ "grad_norm": 2.1732125282287598,
140
+ "learning_rate": 2e-05,
141
+ "loss": 0.2811,
142
+ "step": 38
143
+ },
144
+ {
145
+ "epoch": 1.6,
146
+ "grad_norm": 2.2726752758026123,
147
+ "learning_rate": 2e-05,
148
+ "loss": 0.1669,
149
+ "step": 40
150
+ },
151
+ {
152
+ "epoch": 1.68,
153
+ "grad_norm": 0.8473740816116333,
154
+ "learning_rate": 2e-05,
155
+ "loss": 0.1666,
156
+ "step": 42
157
+ },
158
+ {
159
+ "epoch": 1.76,
160
+ "grad_norm": 2.050222635269165,
161
+ "learning_rate": 2e-05,
162
+ "loss": 0.4076,
163
+ "step": 44
164
+ },
165
+ {
166
+ "epoch": 1.84,
167
+ "grad_norm": 1.9538583755493164,
168
+ "learning_rate": 2e-05,
169
+ "loss": 0.1928,
170
+ "step": 46
171
+ },
172
+ {
173
+ "epoch": 1.92,
174
+ "grad_norm": 1.3469185829162598,
175
+ "learning_rate": 2e-05,
176
+ "loss": 0.1972,
177
+ "step": 48
178
+ },
179
+ {
180
+ "epoch": 2.0,
181
+ "grad_norm": 4.158794403076172,
182
+ "learning_rate": 2e-05,
183
+ "loss": 0.3584,
184
+ "step": 50
185
+ },
186
+ {
187
+ "epoch": 2.0,
188
+ "step": 50,
189
+ "total_flos": 1.8116071156350976e+16,
190
+ "train_loss": 0.3010967254638672,
191
+ "train_runtime": 452.156,
192
+ "train_samples_per_second": 0.442,
193
+ "train_steps_per_second": 0.111
194
+ }
195
+ ],
196
+ "logging_steps": 2,
197
+ "max_steps": 50,
198
+ "num_input_tokens_seen": 0,
199
+ "num_train_epochs": 1,
200
+ "save_steps": 500,
201
+ "stateful_callbacks": {
202
+ "TrainerControl": {
203
+ "args": {
204
+ "should_epoch_stop": false,
205
+ "should_evaluate": false,
206
+ "should_log": false,
207
+ "should_save": false,
208
+ "should_training_stop": false
209
+ },
210
+ "attributes": {}
211
+ }
212
+ },
213
+ "total_flos": 1.8116071156350976e+16,
214
+ "train_batch_size": 1,
215
+ "trial_name": null,
216
+ "trial_params": null
217
+ }
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round10.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d698acd95f40ab3060ac3aa526de719af960b152b0b437a2707477bb865cf0af
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round12.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:942bc7ceef8a14a461573119471404f95f9341e13cf97d4b56b571288891ee94
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round15.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53f66ac08d30899d6a57527753550b5ddd498d5600cc6f6f58ae4b9a6e1ba82b
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round17.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37ea55a67945bca5519f033574b5772fae38b547e467b56849f4c7d585a5945a
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa673f5e88836a15162182ed95bb1798ebcbae0015512daeebb49bc2ea256b86
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round20.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abe1d695e062f17cdaddaef6f9ac69997347fa1ef12a91b6c2cf1cdad0c31056
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98a337b23b0fdf59f688cc3902aac882acb1372212f18790538301fbc3dd4fab
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_client_model_round7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88948bb2670bd770428fd892299e745e45909787d362238d4f975b1c309e513c
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/3_trainer_state.json ADDED
@@ -0,0 +1,217 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 2.0,
5
+ "eval_steps": 500,
6
+ "global_step": 50,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.08,
13
+ "grad_norm": 0.9954308271408081,
14
+ "learning_rate": 2e-05,
15
+ "loss": 0.3463,
16
+ "step": 2
17
+ },
18
+ {
19
+ "epoch": 0.16,
20
+ "grad_norm": 5.380747318267822,
21
+ "learning_rate": 2e-05,
22
+ "loss": 0.402,
23
+ "step": 4
24
+ },
25
+ {
26
+ "epoch": 0.24,
27
+ "grad_norm": 3.027390956878662,
28
+ "learning_rate": 2e-05,
29
+ "loss": 0.3679,
30
+ "step": 6
31
+ },
32
+ {
33
+ "epoch": 0.32,
34
+ "grad_norm": 3.477867364883423,
35
+ "learning_rate": 2e-05,
36
+ "loss": 0.35,
37
+ "step": 8
38
+ },
39
+ {
40
+ "epoch": 0.4,
41
+ "grad_norm": 1.466752529144287,
42
+ "learning_rate": 2e-05,
43
+ "loss": 0.3335,
44
+ "step": 10
45
+ },
46
+ {
47
+ "epoch": 0.48,
48
+ "grad_norm": 2.5924768447875977,
49
+ "learning_rate": 2e-05,
50
+ "loss": 0.3094,
51
+ "step": 12
52
+ },
53
+ {
54
+ "epoch": 0.56,
55
+ "grad_norm": 1.57817542552948,
56
+ "learning_rate": 2e-05,
57
+ "loss": 0.2201,
58
+ "step": 14
59
+ },
60
+ {
61
+ "epoch": 0.64,
62
+ "grad_norm": 2.9312920570373535,
63
+ "learning_rate": 2e-05,
64
+ "loss": 0.4944,
65
+ "step": 16
66
+ },
67
+ {
68
+ "epoch": 0.72,
69
+ "grad_norm": 2.0879368782043457,
70
+ "learning_rate": 2e-05,
71
+ "loss": 0.399,
72
+ "step": 18
73
+ },
74
+ {
75
+ "epoch": 0.8,
76
+ "grad_norm": 1.32192862033844,
77
+ "learning_rate": 2e-05,
78
+ "loss": 0.3558,
79
+ "step": 20
80
+ },
81
+ {
82
+ "epoch": 0.88,
83
+ "grad_norm": 3.584916591644287,
84
+ "learning_rate": 2e-05,
85
+ "loss": 0.3141,
86
+ "step": 22
87
+ },
88
+ {
89
+ "epoch": 0.96,
90
+ "grad_norm": 1.5875033140182495,
91
+ "learning_rate": 2e-05,
92
+ "loss": 0.2867,
93
+ "step": 24
94
+ },
95
+ {
96
+ "epoch": 1.04,
97
+ "grad_norm": 2.598944664001465,
98
+ "learning_rate": 2e-05,
99
+ "loss": 0.3165,
100
+ "step": 26
101
+ },
102
+ {
103
+ "epoch": 1.12,
104
+ "grad_norm": 1.0258618593215942,
105
+ "learning_rate": 2e-05,
106
+ "loss": 0.3818,
107
+ "step": 28
108
+ },
109
+ {
110
+ "epoch": 1.2,
111
+ "grad_norm": 1.5218331813812256,
112
+ "learning_rate": 2e-05,
113
+ "loss": 0.3254,
114
+ "step": 30
115
+ },
116
+ {
117
+ "epoch": 1.28,
118
+ "grad_norm": 1.9529523849487305,
119
+ "learning_rate": 2e-05,
120
+ "loss": 0.2271,
121
+ "step": 32
122
+ },
123
+ {
124
+ "epoch": 1.36,
125
+ "grad_norm": 2.097310781478882,
126
+ "learning_rate": 2e-05,
127
+ "loss": 0.3292,
128
+ "step": 34
129
+ },
130
+ {
131
+ "epoch": 1.44,
132
+ "grad_norm": 1.6695365905761719,
133
+ "learning_rate": 2e-05,
134
+ "loss": 0.3564,
135
+ "step": 36
136
+ },
137
+ {
138
+ "epoch": 1.52,
139
+ "grad_norm": 0.7364570498466492,
140
+ "learning_rate": 2e-05,
141
+ "loss": 0.2943,
142
+ "step": 38
143
+ },
144
+ {
145
+ "epoch": 1.6,
146
+ "grad_norm": 1.299603819847107,
147
+ "learning_rate": 2e-05,
148
+ "loss": 0.2221,
149
+ "step": 40
150
+ },
151
+ {
152
+ "epoch": 1.68,
153
+ "grad_norm": 5.948718070983887,
154
+ "learning_rate": 2e-05,
155
+ "loss": 0.4884,
156
+ "step": 42
157
+ },
158
+ {
159
+ "epoch": 1.76,
160
+ "grad_norm": 2.701298475265503,
161
+ "learning_rate": 2e-05,
162
+ "loss": 0.4201,
163
+ "step": 44
164
+ },
165
+ {
166
+ "epoch": 1.84,
167
+ "grad_norm": 1.4248079061508179,
168
+ "learning_rate": 2e-05,
169
+ "loss": 0.2609,
170
+ "step": 46
171
+ },
172
+ {
173
+ "epoch": 1.92,
174
+ "grad_norm": 3.403484344482422,
175
+ "learning_rate": 2e-05,
176
+ "loss": 0.2597,
177
+ "step": 48
178
+ },
179
+ {
180
+ "epoch": 2.0,
181
+ "grad_norm": 2.023223400115967,
182
+ "learning_rate": 2e-05,
183
+ "loss": 0.2818,
184
+ "step": 50
185
+ },
186
+ {
187
+ "epoch": 2.0,
188
+ "step": 50,
189
+ "total_flos": 2.210405811434291e+16,
190
+ "train_loss": 0.3337188720703125,
191
+ "train_runtime": 509.6408,
192
+ "train_samples_per_second": 0.392,
193
+ "train_steps_per_second": 0.098
194
+ }
195
+ ],
196
+ "logging_steps": 2,
197
+ "max_steps": 50,
198
+ "num_input_tokens_seen": 0,
199
+ "num_train_epochs": 1,
200
+ "save_steps": 500,
201
+ "stateful_callbacks": {
202
+ "TrainerControl": {
203
+ "args": {
204
+ "should_epoch_stop": false,
205
+ "should_evaluate": false,
206
+ "should_log": false,
207
+ "should_save": false,
208
+ "should_training_stop": false
209
+ },
210
+ "attributes": {}
211
+ }
212
+ },
213
+ "total_flos": 2.210405811434291e+16,
214
+ "train_batch_size": 1,
215
+ "trial_name": null,
216
+ "trial_params": null
217
+ }
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round10.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0785c7e8792c7b81d33266f0a9f3a354da96fc572c2ee37aa39c29a3889faee8
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round12.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4c06d0742acb8d276cee5b3a2e41ff603670353d442daf30aae930e3256c0b8
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round15.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:674cdbda888fa8e50d540dd2b7e7f0b16d617669ce3747840f064ceda4d0cbca
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round17.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c005519a8e7fab104d76691c87d9d004be5b458d79fad7df5d8bb3d38f06a4d0
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bd6b783592ba6d572207db0f3640331efbe56eecd2f9560da7ebd0977d11d8d
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round20.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcb8673f4506091039e9157a289ca5d9f459ca79224c2a9c6de4df027d9545e8
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86cd9d1b611eb2911d44ab463974e653cefa3616e51448b1d93cd49fac30503d
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_client_model_round7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daea3e5b2d82cbe980735bb3f4fdefdd490542d0687277f1c35cf06b1b6f090a
3
+ size 1187365746
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/4_trainer_state.json ADDED
@@ -0,0 +1,217 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 2.0,
5
+ "eval_steps": 500,
6
+ "global_step": 50,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.08,
13
+ "grad_norm": 2.1428046226501465,
14
+ "learning_rate": 2e-05,
15
+ "loss": 0.4124,
16
+ "step": 2
17
+ },
18
+ {
19
+ "epoch": 0.16,
20
+ "grad_norm": 2.2636923789978027,
21
+ "learning_rate": 2e-05,
22
+ "loss": 0.3262,
23
+ "step": 4
24
+ },
25
+ {
26
+ "epoch": 0.24,
27
+ "grad_norm": 1.5039873123168945,
28
+ "learning_rate": 2e-05,
29
+ "loss": 0.2659,
30
+ "step": 6
31
+ },
32
+ {
33
+ "epoch": 0.32,
34
+ "grad_norm": 2.798299789428711,
35
+ "learning_rate": 2e-05,
36
+ "loss": 0.473,
37
+ "step": 8
38
+ },
39
+ {
40
+ "epoch": 0.4,
41
+ "grad_norm": 2.685647487640381,
42
+ "learning_rate": 2e-05,
43
+ "loss": 0.4659,
44
+ "step": 10
45
+ },
46
+ {
47
+ "epoch": 0.48,
48
+ "grad_norm": 1.6386606693267822,
49
+ "learning_rate": 2e-05,
50
+ "loss": 0.2308,
51
+ "step": 12
52
+ },
53
+ {
54
+ "epoch": 0.56,
55
+ "grad_norm": 2.34197998046875,
56
+ "learning_rate": 2e-05,
57
+ "loss": 0.304,
58
+ "step": 14
59
+ },
60
+ {
61
+ "epoch": 0.64,
62
+ "grad_norm": 1.686523199081421,
63
+ "learning_rate": 2e-05,
64
+ "loss": 0.4787,
65
+ "step": 16
66
+ },
67
+ {
68
+ "epoch": 0.72,
69
+ "grad_norm": 2.5239813327789307,
70
+ "learning_rate": 2e-05,
71
+ "loss": 0.3822,
72
+ "step": 18
73
+ },
74
+ {
75
+ "epoch": 0.8,
76
+ "grad_norm": 3.2457656860351562,
77
+ "learning_rate": 2e-05,
78
+ "loss": 0.413,
79
+ "step": 20
80
+ },
81
+ {
82
+ "epoch": 0.88,
83
+ "grad_norm": 3.188730478286743,
84
+ "learning_rate": 2e-05,
85
+ "loss": 0.1539,
86
+ "step": 22
87
+ },
88
+ {
89
+ "epoch": 0.96,
90
+ "grad_norm": 2.1818411350250244,
91
+ "learning_rate": 2e-05,
92
+ "loss": 0.4026,
93
+ "step": 24
94
+ },
95
+ {
96
+ "epoch": 1.04,
97
+ "grad_norm": 1.6254708766937256,
98
+ "learning_rate": 2e-05,
99
+ "loss": 0.5243,
100
+ "step": 26
101
+ },
102
+ {
103
+ "epoch": 1.12,
104
+ "grad_norm": 2.542879104614258,
105
+ "learning_rate": 2e-05,
106
+ "loss": 0.4744,
107
+ "step": 28
108
+ },
109
+ {
110
+ "epoch": 1.2,
111
+ "grad_norm": 2.871481418609619,
112
+ "learning_rate": 2e-05,
113
+ "loss": 0.4035,
114
+ "step": 30
115
+ },
116
+ {
117
+ "epoch": 1.28,
118
+ "grad_norm": 4.686084747314453,
119
+ "learning_rate": 2e-05,
120
+ "loss": 0.3615,
121
+ "step": 32
122
+ },
123
+ {
124
+ "epoch": 1.36,
125
+ "grad_norm": 4.072404861450195,
126
+ "learning_rate": 2e-05,
127
+ "loss": 0.5069,
128
+ "step": 34
129
+ },
130
+ {
131
+ "epoch": 1.44,
132
+ "grad_norm": 3.111271381378174,
133
+ "learning_rate": 2e-05,
134
+ "loss": 0.3203,
135
+ "step": 36
136
+ },
137
+ {
138
+ "epoch": 1.52,
139
+ "grad_norm": 5.3058671951293945,
140
+ "learning_rate": 2e-05,
141
+ "loss": 0.4785,
142
+ "step": 38
143
+ },
144
+ {
145
+ "epoch": 1.6,
146
+ "grad_norm": 4.508816719055176,
147
+ "learning_rate": 2e-05,
148
+ "loss": 0.4815,
149
+ "step": 40
150
+ },
151
+ {
152
+ "epoch": 1.68,
153
+ "grad_norm": 2.1121716499328613,
154
+ "learning_rate": 2e-05,
155
+ "loss": 0.2251,
156
+ "step": 42
157
+ },
158
+ {
159
+ "epoch": 1.76,
160
+ "grad_norm": 3.3726918697357178,
161
+ "learning_rate": 2e-05,
162
+ "loss": 0.5956,
163
+ "step": 44
164
+ },
165
+ {
166
+ "epoch": 1.84,
167
+ "grad_norm": 3.3394052982330322,
168
+ "learning_rate": 2e-05,
169
+ "loss": 0.3002,
170
+ "step": 46
171
+ },
172
+ {
173
+ "epoch": 1.92,
174
+ "grad_norm": 2.445279836654663,
175
+ "learning_rate": 2e-05,
176
+ "loss": 0.3145,
177
+ "step": 48
178
+ },
179
+ {
180
+ "epoch": 2.0,
181
+ "grad_norm": 3.0885345935821533,
182
+ "learning_rate": 2e-05,
183
+ "loss": 0.553,
184
+ "step": 50
185
+ },
186
+ {
187
+ "epoch": 2.0,
188
+ "step": 50,
189
+ "total_flos": 2.1678855546732544e+16,
190
+ "train_loss": 0.39391799926757814,
191
+ "train_runtime": 520.6241,
192
+ "train_samples_per_second": 0.384,
193
+ "train_steps_per_second": 0.096
194
+ }
195
+ ],
196
+ "logging_steps": 2,
197
+ "max_steps": 50,
198
+ "num_input_tokens_seen": 0,
199
+ "num_train_epochs": 1,
200
+ "save_steps": 500,
201
+ "stateful_callbacks": {
202
+ "TrainerControl": {
203
+ "args": {
204
+ "should_epoch_stop": false,
205
+ "should_evaluate": false,
206
+ "should_log": false,
207
+ "should_save": false,
208
+ "should_training_stop": false
209
+ },
210
+ "attributes": {}
211
+ }
212
+ },
213
+ "total_flos": 2.1678855546732544e+16,
214
+ "train_batch_size": 1,
215
+ "trial_name": null,
216
+ "trial_params": null
217
+ }
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/5_client_model_round10.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e3e90203db7b2620972f97bc34ec7506e45803bae2b537102b3b22cc7a180fe
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/5_client_model_round12.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:660d3d0e31148c22a3c6c4ca066b26b8e59125ae23e9dee91ec0f6f352b8ceda
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/5_client_model_round15.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01d6c1954d802760dcfc7dc501544800c7bec36ac8ec04f640026ef94943d280
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/5_client_model_round17.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e28e418e02ca25995e7b67903aea1b8982a79845ddb2ffa115dec41741b6a291
3
+ size 1187368166
client_states_feddat_Multipqfullfreeze_pca_bs4_saveoptim_lr2e-5_sc132_4tasks_5rounds_fixiter50_T0125_decay099/5_client_model_round2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f64003175024615b1adfe76b76a261a7aeba14c2a45cfa7953ebc0691968bccf
3
+ size 1187365746