Training in progress, step 24, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step24/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step24/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step24/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step24/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step24/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step24/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step24/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step24/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step24/mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +122 -2
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 18516456
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f96ce207444d7a10e17049c94dc5648bd8f200d8da34ca1d6852ec281d5c6819
|
3 |
size 18516456
|
last-checkpoint/global_step24/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:244ee88dc4927c3cc387cc0504876e3bf70c16b3da30d871aae45b9335984618
|
3 |
+
size 13857360
|
last-checkpoint/global_step24/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ee5973f9df1a2c3425c2d40e981adf7555e5dc866dadac45599953a0446fc17
|
3 |
+
size 13856656
|
last-checkpoint/global_step24/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d43ad14e713e7fe6d19c89b75c444eec46894556bcabd66f4266bd3333d925be
|
3 |
+
size 13857360
|
last-checkpoint/global_step24/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d58e93750e65925db51f7fa86bebe5d687534e13726c52348ac1b9614cc7acc
|
3 |
+
size 13856656
|
last-checkpoint/global_step24/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2524a9ac1b47dfbd409cfe9aa79a55f2d1ff7918b1a266628d2f27c79de1ba43
|
3 |
+
size 13857424
|
last-checkpoint/global_step24/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7990927841166cf9ae42c2ef15f4927b86bc2f69fce9b77ab5f9cc9c7f7d1a55
|
3 |
+
size 13856656
|
last-checkpoint/global_step24/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4dc8a45e4c246a95e4729abae09c73ab63c85d55f97f6321e1572bad30c2b485
|
3 |
+
size 13857424
|
last-checkpoint/global_step24/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abf96ffa1e943257b9dd5f06c46f62dde5f4e5e85fdd9fc99bebd897c269a56
|
3 |
+
size 13856656
|
last-checkpoint/global_step24/mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89eec1da451cfc9002f69cf99d7bfb2c41b8702d9e83b19cb9336e55f3d8493c
|
3 |
+
size 485512632
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step24
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9527d2431b9400e39f4784d5d63151434952de4dfec19feb2ab624b5f1922cb0
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -2,9 +2,9 @@
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
-
"epoch": 0.
|
6 |
"eval_steps": 500,
|
7 |
-
"global_step":
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
@@ -248,6 +248,126 @@
|
|
248 |
"rewards/margins": 0.1759033203125,
|
249 |
"rewards/rejected": 0.028123855590820312,
|
250 |
"step": 16
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
251 |
}
|
252 |
],
|
253 |
"logging_steps": 1,
|
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
+
"epoch": 0.08613728129205922,
|
6 |
"eval_steps": 500,
|
7 |
+
"global_step": 24,
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
|
|
248 |
"rewards/margins": 0.1759033203125,
|
249 |
"rewards/rejected": 0.028123855590820312,
|
250 |
"step": 16
|
251 |
+
},
|
252 |
+
{
|
253 |
+
"epoch": 0.06101390758187528,
|
254 |
+
"grad_norm": 0.5971803069114685,
|
255 |
+
"learning_rate": 1.781071971878587e-05,
|
256 |
+
"logits/chosen": -0.8837890625,
|
257 |
+
"logits/rejected": -1.08642578125,
|
258 |
+
"logps/chosen": -505.0,
|
259 |
+
"logps/rejected": -360.375,
|
260 |
+
"loss": 0.597,
|
261 |
+
"rewards/accuracies": 0.703125,
|
262 |
+
"rewards/chosen": 0.2252197265625,
|
263 |
+
"rewards/margins": 0.21142578125,
|
264 |
+
"rewards/rejected": 0.01387786865234375,
|
265 |
+
"step": 17
|
266 |
+
},
|
267 |
+
{
|
268 |
+
"epoch": 0.06460296096904442,
|
269 |
+
"grad_norm": 0.5383909344673157,
|
270 |
+
"learning_rate": 1.5941857792939702e-05,
|
271 |
+
"logits/chosen": -0.90234375,
|
272 |
+
"logits/rejected": -1.18994140625,
|
273 |
+
"logps/chosen": -512.5,
|
274 |
+
"logps/rejected": -353.75,
|
275 |
+
"loss": 0.6096,
|
276 |
+
"rewards/accuracies": 0.65625,
|
277 |
+
"rewards/chosen": 0.218994140625,
|
278 |
+
"rewards/margins": 0.194183349609375,
|
279 |
+
"rewards/rejected": 0.0247955322265625,
|
280 |
+
"step": 18
|
281 |
+
},
|
282 |
+
{
|
283 |
+
"epoch": 0.06819201435621355,
|
284 |
+
"grad_norm": 0.6120373010635376,
|
285 |
+
"learning_rate": 1.40581422070603e-05,
|
286 |
+
"logits/chosen": -0.84521484375,
|
287 |
+
"logits/rejected": -1.1376953125,
|
288 |
+
"logps/chosen": -502.5,
|
289 |
+
"logps/rejected": -361.75,
|
290 |
+
"loss": 0.591,
|
291 |
+
"rewards/accuracies": 0.71875,
|
292 |
+
"rewards/chosen": 0.2548828125,
|
293 |
+
"rewards/margins": 0.229736328125,
|
294 |
+
"rewards/rejected": 0.025396347045898438,
|
295 |
+
"step": 19
|
296 |
+
},
|
297 |
+
{
|
298 |
+
"epoch": 0.07178106774338268,
|
299 |
+
"grad_norm": 0.5964956283569336,
|
300 |
+
"learning_rate": 1.2189280281214128e-05,
|
301 |
+
"logits/chosen": -0.84326171875,
|
302 |
+
"logits/rejected": -1.17236328125,
|
303 |
+
"logps/chosen": -515.75,
|
304 |
+
"logps/rejected": -360.25,
|
305 |
+
"loss": 0.5997,
|
306 |
+
"rewards/accuracies": 0.703125,
|
307 |
+
"rewards/chosen": 0.276123046875,
|
308 |
+
"rewards/margins": 0.2108154296875,
|
309 |
+
"rewards/rejected": 0.06536865234375,
|
310 |
+
"step": 20
|
311 |
+
},
|
312 |
+
{
|
313 |
+
"epoch": 0.07537012113055182,
|
314 |
+
"grad_norm": 0.5623295903205872,
|
315 |
+
"learning_rate": 1.036474508437579e-05,
|
316 |
+
"logits/chosen": -0.87646484375,
|
317 |
+
"logits/rejected": -1.19140625,
|
318 |
+
"logps/chosen": -519.25,
|
319 |
+
"logps/rejected": -348.5,
|
320 |
+
"loss": 0.5757,
|
321 |
+
"rewards/accuracies": 0.7578125,
|
322 |
+
"rewards/chosen": 0.3125,
|
323 |
+
"rewards/margins": 0.262451171875,
|
324 |
+
"rewards/rejected": 0.05007171630859375,
|
325 |
+
"step": 21
|
326 |
+
},
|
327 |
+
{
|
328 |
+
"epoch": 0.07895917451772096,
|
329 |
+
"grad_norm": 0.6346862316131592,
|
330 |
+
"learning_rate": 8.61331062652391e-06,
|
331 |
+
"logits/chosen": -0.84423828125,
|
332 |
+
"logits/rejected": -1.1728515625,
|
333 |
+
"logps/chosen": -509.75,
|
334 |
+
"logps/rejected": -367.5,
|
335 |
+
"loss": 0.59,
|
336 |
+
"rewards/accuracies": 0.734375,
|
337 |
+
"rewards/chosen": 0.30908203125,
|
338 |
+
"rewards/margins": 0.240966796875,
|
339 |
+
"rewards/rejected": 0.0682525634765625,
|
340 |
+
"step": 22
|
341 |
+
},
|
342 |
+
{
|
343 |
+
"epoch": 0.08254822790489008,
|
344 |
+
"grad_norm": 0.5374892354011536,
|
345 |
+
"learning_rate": 6.962598075315047e-06,
|
346 |
+
"logits/chosen": -0.8955078125,
|
347 |
+
"logits/rejected": -1.1728515625,
|
348 |
+
"logps/chosen": -540.0,
|
349 |
+
"logps/rejected": -382.875,
|
350 |
+
"loss": 0.5659,
|
351 |
+
"rewards/accuracies": 0.796875,
|
352 |
+
"rewards/chosen": 0.33544921875,
|
353 |
+
"rewards/margins": 0.2880859375,
|
354 |
+
"rewards/rejected": 0.04767608642578125,
|
355 |
+
"step": 23
|
356 |
+
},
|
357 |
+
{
|
358 |
+
"epoch": 0.08613728129205922,
|
359 |
+
"grad_norm": 0.5729860067367554,
|
360 |
+
"learning_rate": 5.438640153769654e-06,
|
361 |
+
"logits/chosen": -0.8798828125,
|
362 |
+
"logits/rejected": -1.14794921875,
|
363 |
+
"logps/chosen": -523.25,
|
364 |
+
"logps/rejected": -373.75,
|
365 |
+
"loss": 0.5696,
|
366 |
+
"rewards/accuracies": 0.7734375,
|
367 |
+
"rewards/chosen": 0.35205078125,
|
368 |
+
"rewards/margins": 0.2939453125,
|
369 |
+
"rewards/rejected": 0.05828094482421875,
|
370 |
+
"step": 24
|
371 |
}
|
372 |
],
|
373 |
"logging_steps": 1,
|