PhoenixB commited on
Commit
0e21d06
·
verified ·
1 Parent(s): 8b6e19f

Training in progress, step 90, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ca2d0789f8cfefc3ae782c9c211e30db8fcfde8211a7aa026f963759ffa596b
3
  size 9450448
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7199f500237808236c7db3d5064a6acab3ac41d5c44eef1255b1e366d37d6ed
3
  size 9450448
last-checkpoint/global_step90/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ba7f7cb199a096c26f7bdb99e92e8e975851dc0e565c7c549a4709721b38d03
3
+ size 28320208
last-checkpoint/global_step90/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ef157cd60fb19d40e37f653a733ec88ca8ab5038fa4193ae672fe035a3ceb8e
3
+ size 28320208
last-checkpoint/global_step90/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8501d3f6f7512e5408b13c6199ae8c726861f2db4a61e1a2f4450273f82c40f
3
+ size 9523692
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step80
 
1
+ global_step90
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cf0b22231e0aa02f53ac9a900d016562c5e7c021c34b5088c73b5a29b90d23d
3
  size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b177fe91b634dee552bfdb8884320c1c49f5f739fd36c0751b428ca7b40e9d3f
3
  size 14512
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f24bb0f430f282c43aa6537fcfce58560e72b7881eb48726030f0bc77debaf2
3
  size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d85625dac880f235f3fb74a29363e92179ac27ae903013848e6f9d0c8f757f8
3
  size 14512
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49b8a1dbbf2c2a0b7fde326d57c34bd6c5e5d17e0aaf8b19016c1f721c049db1
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb97b24f34ff3e53eec5be9cf35c1a7161c58dbc2fed7dda160fb3eb64e5f353
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.1368106028217187,
5
  "eval_steps": 10,
6
- "global_step": 80,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -191,6 +191,28 @@
191
  "eval_samples_per_second": 105.229,
192
  "eval_steps_per_second": 26.467,
193
  "step": 80
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
194
  }
195
  ],
196
  "logging_steps": 5,
@@ -210,7 +232,7 @@
210
  "attributes": {}
211
  }
212
  },
213
- "total_flos": 2044930264399872.0,
214
  "train_batch_size": 2,
215
  "trial_name": null,
216
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.15391192817443353,
5
  "eval_steps": 10,
6
+ "global_step": 90,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
191
  "eval_samples_per_second": 105.229,
192
  "eval_steps_per_second": 26.467,
193
  "step": 80
194
+ },
195
+ {
196
+ "epoch": 0.1453612654980761,
197
+ "grad_norm": 32.74094009399414,
198
+ "learning_rate": 1.339745962155613e-05,
199
+ "loss": 3.1578,
200
+ "step": 85
201
+ },
202
+ {
203
+ "epoch": 0.15391192817443353,
204
+ "grad_norm": 22.851362228393555,
205
+ "learning_rate": 6.030737921409169e-06,
206
+ "loss": 3.1172,
207
+ "step": 90
208
+ },
209
+ {
210
+ "epoch": 0.15391192817443353,
211
+ "eval_loss": 3.1573593616485596,
212
+ "eval_runtime": 4.7749,
213
+ "eval_samples_per_second": 103.249,
214
+ "eval_steps_per_second": 25.969,
215
+ "step": 90
216
  }
217
  ],
218
  "logging_steps": 5,
 
232
  "attributes": {}
233
  }
234
  },
235
+ "total_flos": 2297390790868992.0,
236
  "train_batch_size": 2,
237
  "trial_name": null,
238
  "trial_params": null