PhoenixB committed on
Commit
2543e5e
·
verified ·
1 Parent(s): c067cea

Training in progress, step 30, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ef84cca657388b06a9b161e83e1bdc8d561986c2a18a79c148ef4ca586eef69
3
  size 50503544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c33f4768609aac9547259cbea351d0ced9847c0cca0b967b41778fe8732ac39
3
  size 50503544
last-checkpoint/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22613cdf5ec7837b602c185436af06b330ec2d71a2b49ac5df96ca8b6c43993d
3
  size 101199994
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:562f38cbf6b76a45ee62f324c254d16734cda287eceaeafac9ec80fcccec4179
3
  size 101199994
last-checkpoint/pytorch_model_fsdp.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0adf2c337f3fe8ac9fdc291edfdab98d620fd14cbd0dc2712a1573f7734609d2
3
  size 50577394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b54eab572fdff651f14a5c32ce65202b8dac2e6a30bb58178aef3bed97b1d14a
3
  size 50577394
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:015707cb16790250630febca682498cb5d3456d5a13443b953687f19dc7d59ed
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2def2cd24154d8cecbaa07c36ae27e5ebb9b7273a78abfea27aa67c480e4ae2b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.000817594636579184,
5
  "eval_steps": 500,
6
- "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -307,6 +307,156 @@
307
  "rewards/margins": 16.37193489074707,
308
  "rewards/rejected": -60.71843338012695,
309
  "step": 20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
310
  }
311
  ],
312
  "logging_steps": 1,
@@ -321,7 +471,7 @@
321
  "should_evaluate": false,
322
  "should_log": false,
323
  "should_save": true,
324
- "should_training_stop": false
325
  },
326
  "attributes": {}
327
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.0012263919548687761,
5
  "eval_steps": 500,
6
+ "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
307
  "rewards/margins": 16.37193489074707,
308
  "rewards/rejected": -60.71843338012695,
309
  "step": 20
310
+ },
311
+ {
312
+ "epoch": 0.0008584743684081432,
313
+ "grad_norm": 0.08101686835289001,
314
+ "learning_rate": 5.7422070843492734e-05,
315
+ "logits/chosen": -2.6424341201782227,
316
+ "logits/rejected": -2.6488289833068848,
317
+ "logps/chosen": -511.4774169921875,
318
+ "logps/rejected": -789.3146362304688,
319
+ "loss": 0.0003,
320
+ "rewards/accuracies": 1.0,
321
+ "rewards/chosen": -36.327449798583984,
322
+ "rewards/margins": 22.020410537719727,
323
+ "rewards/rejected": -58.34785842895508,
324
+ "step": 21
325
+ },
326
+ {
327
+ "epoch": 0.0008993541002371025,
328
+ "grad_norm": 0.18042296171188354,
329
+ "learning_rate": 4.6417320502100316e-05,
330
+ "logits/chosen": -2.526277780532837,
331
+ "logits/rejected": -2.5323195457458496,
332
+ "logps/chosen": -545.796142578125,
333
+ "logps/rejected": -764.9188232421875,
334
+ "loss": 0.0436,
335
+ "rewards/accuracies": 0.875,
336
+ "rewards/chosen": -36.89508819580078,
337
+ "rewards/margins": 17.9223575592041,
338
+ "rewards/rejected": -54.81744384765625,
339
+ "step": 22
340
+ },
341
+ {
342
+ "epoch": 0.0009402338320660616,
343
+ "grad_norm": 0.29778093099594116,
344
+ "learning_rate": 3.6257601025131026e-05,
345
+ "logits/chosen": -2.4751813411712646,
346
+ "logits/rejected": -2.4851186275482178,
347
+ "logps/chosen": -803.92578125,
348
+ "logps/rejected": -1093.898681640625,
349
+ "loss": 0.0872,
350
+ "rewards/accuracies": 0.875,
351
+ "rewards/chosen": -60.56904602050781,
352
+ "rewards/margins": 24.420740127563477,
353
+ "rewards/rejected": -84.98979187011719,
354
+ "step": 23
355
+ },
356
+ {
357
+ "epoch": 0.0009811135638950208,
358
+ "grad_norm": 0.28798049688339233,
359
+ "learning_rate": 2.7103137257858868e-05,
360
+ "logits/chosen": -2.510077714920044,
361
+ "logits/rejected": -2.5210041999816895,
362
+ "logps/chosen": -463.0649108886719,
363
+ "logps/rejected": -694.3960571289062,
364
+ "loss": 0.0867,
365
+ "rewards/accuracies": 1.0,
366
+ "rewards/chosen": -33.42449951171875,
367
+ "rewards/margins": 18.504003524780273,
368
+ "rewards/rejected": -51.928504943847656,
369
+ "step": 24
370
+ },
371
+ {
372
+ "epoch": 0.0010219932957239801,
373
+ "grad_norm": 0.11364051699638367,
374
+ "learning_rate": 1.9098300562505266e-05,
375
+ "logits/chosen": -2.475249767303467,
376
+ "logits/rejected": -2.4904561042785645,
377
+ "logps/chosen": -859.90673828125,
378
+ "logps/rejected": -1117.36083984375,
379
+ "loss": 0.0006,
380
+ "rewards/accuracies": 1.0,
381
+ "rewards/chosen": -65.81514739990234,
382
+ "rewards/margins": 20.766559600830078,
383
+ "rewards/rejected": -86.58171081542969,
384
+ "step": 25
385
+ },
386
+ {
387
+ "epoch": 0.0010628730275529393,
388
+ "grad_norm": 0.009049988351762295,
389
+ "learning_rate": 1.2369331995613665e-05,
390
+ "logits/chosen": -2.4331583976745605,
391
+ "logits/rejected": -2.4311211109161377,
392
+ "logps/chosen": -680.937744140625,
393
+ "logps/rejected": -1024.9010009765625,
394
+ "loss": 0.0,
395
+ "rewards/accuracies": 1.0,
396
+ "rewards/chosen": -50.20663070678711,
397
+ "rewards/margins": 28.409120559692383,
398
+ "rewards/rejected": -78.61575317382812,
399
+ "step": 26
400
+ },
401
+ {
402
+ "epoch": 0.0011037527593818985,
403
+ "grad_norm": 0.16239921748638153,
404
+ "learning_rate": 7.022351411174866e-06,
405
+ "logits/chosen": -2.6356656551361084,
406
+ "logits/rejected": -2.6563143730163574,
407
+ "logps/chosen": -620.882080078125,
408
+ "logps/rejected": -835.9634399414062,
409
+ "loss": 0.0434,
410
+ "rewards/accuracies": 1.0,
411
+ "rewards/chosen": -41.628211975097656,
412
+ "rewards/margins": 17.292217254638672,
413
+ "rewards/rejected": -58.92042541503906,
414
+ "step": 27
415
+ },
416
+ {
417
+ "epoch": 0.0011446324912108576,
418
+ "grad_norm": 0.29876795411109924,
419
+ "learning_rate": 3.1416838871368924e-06,
420
+ "logits/chosen": -2.490878105163574,
421
+ "logits/rejected": -2.5129659175872803,
422
+ "logps/chosen": -658.1712646484375,
423
+ "logps/rejected": -935.3577880859375,
424
+ "loss": 0.0448,
425
+ "rewards/accuracies": 0.875,
426
+ "rewards/chosen": -48.216346740722656,
427
+ "rewards/margins": 22.68781852722168,
428
+ "rewards/rejected": -70.90415954589844,
429
+ "step": 28
430
+ },
431
+ {
432
+ "epoch": 0.0011855122230398168,
433
+ "grad_norm": 11.254888534545898,
434
+ "learning_rate": 7.885298685522235e-07,
435
+ "logits/chosen": -2.4710259437561035,
436
+ "logits/rejected": -2.4678666591644287,
437
+ "logps/chosen": -565.2833251953125,
438
+ "logps/rejected": -760.4554443359375,
439
+ "loss": 0.0385,
440
+ "rewards/accuracies": 1.0,
441
+ "rewards/chosen": -39.14883041381836,
442
+ "rewards/margins": 15.817726135253906,
443
+ "rewards/rejected": -54.966552734375,
444
+ "step": 29
445
+ },
446
+ {
447
+ "epoch": 0.0012263919548687761,
448
+ "grad_norm": 0.10551604628562927,
449
+ "learning_rate": 0.0,
450
+ "logits/chosen": -2.379762649536133,
451
+ "logits/rejected": -2.398367166519165,
452
+ "logps/chosen": -702.4578857421875,
453
+ "logps/rejected": -948.1409301757812,
454
+ "loss": 0.0434,
455
+ "rewards/accuracies": 0.875,
456
+ "rewards/chosen": -48.67387390136719,
457
+ "rewards/margins": 20.345170974731445,
458
+ "rewards/rejected": -69.01904296875,
459
+ "step": 30
460
  }
461
  ],
462
  "logging_steps": 1,
 
471
  "should_evaluate": false,
472
  "should_log": false,
473
  "should_save": true,
474
+ "should_training_stop": true
475
  },
476
  "attributes": {}
477
  }