avsolatorio commited on
Commit
0a91fb4
·
verified ·
1 Parent(s): 8971f88

Training in progress, step 19000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c363a1a59fc93c3321875d7f58013a2f10c3aab12f3af0076dff096e82ffb9c
3
  size 567860028
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1c8f434ea18d3b22fd15254827178bbe3ed96c6503f495dffba91cdd8f6000a
3
  size 567860028
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2f24ddbe795a6b5a789b92a1ca3088daece7124054a836e4ca83341f355e4ec
3
  size 1135783354
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bfe40ca2e2f7716947536cdec78ff3399a93f458d287f2974b9aa308cf568d4
3
  size 1135783354
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:32a2a6418efcb48342a1dc67d0b88b496c3ab628f281d571af1360b4d0af05a5
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7ddd132ae0c177184ed8a4f1a9ac2f3b51a04d85a111aa5717d5124f81bcd9e
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:189a7468f8c95c103f6fc6f9a588f85a4d6a2cdd577f74ddb50948dbca31a23b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9de1891a9bbbac025ea7d704b1888c3c146080478050b5c9e6f8305f0eea645f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.035977210849523544,
3
- "best_model_checkpoint": "doc-topic-model_eval-00_train-01/checkpoint-18000",
4
- "epoch": 8.875739644970414,
5
  "eval_steps": 1000,
6
- "global_step": 18000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -475,6 +475,32 @@
475
  "eval_samples_per_second": 306.709,
476
  "eval_steps_per_second": 19.174,
477
  "step": 18000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
478
  }
479
  ],
480
  "logging_steps": 500,
@@ -494,7 +520,7 @@
494
  "attributes": {}
495
  }
496
  },
497
- "total_flos": 407138463972036.0,
498
  "train_batch_size": 4,
499
  "trial_name": null,
500
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.035947080701589584,
3
+ "best_model_checkpoint": "doc-topic-model_eval-00_train-01/checkpoint-19000",
4
+ "epoch": 9.368836291913215,
5
  "eval_steps": 1000,
6
+ "global_step": 19000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
475
  "eval_samples_per_second": 306.709,
476
  "eval_steps_per_second": 19.174,
477
  "step": 18000
478
+ },
479
+ {
480
+ "epoch": 9.122287968441814,
481
+ "grad_norm": 0.3517369031906128,
482
+ "learning_rate": 1.755424063116371e-06,
483
+ "loss": 0.0238,
484
+ "step": 18500
485
+ },
486
+ {
487
+ "epoch": 9.368836291913215,
488
+ "grad_norm": 0.5258517265319824,
489
+ "learning_rate": 1.2623274161735703e-06,
490
+ "loss": 0.0236,
491
+ "step": 19000
492
+ },
493
+ {
494
+ "epoch": 9.368836291913215,
495
+ "eval_accuracy": 0.9880196153464574,
496
+ "eval_f1": 0.6215357062905753,
497
+ "eval_loss": 0.035947080701589584,
498
+ "eval_precision": 0.7497299632750054,
499
+ "eval_recall": 0.5307792307104076,
500
+ "eval_runtime": 26.2793,
501
+ "eval_samples_per_second": 308.608,
502
+ "eval_steps_per_second": 19.293,
503
+ "step": 19000
504
  }
505
  ],
506
  "logging_steps": 500,
 
520
  "attributes": {}
521
  }
522
  },
523
+ "total_flos": 429748313255712.0,
524
  "train_batch_size": 4,
525
  "trial_name": null,
526
  "trial_params": null