iamnguyen commited on
Commit
fac9f8d
·
verified ·
1 Parent(s): 7f69d09

Training in progress, step 112, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33a5cf1ddf5e24ebda98f15082d6444331484a209797ef29f375faf287b2faa4
3
  size 147770496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a382456c446f34b195fbfd702a439be3a1e58d2a36d956d357f01865a9f79d8
3
  size 147770496
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b2636679b94b781d00a8346afff4ec981364bfdb4a51d2a9b5522d462db1409
3
  size 74440308
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f98750a3e57cc2fc9efbb170ea0c2d4e6e07105ecd32dc2e6b33fd619403c2a
3
  size 74440308
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3004543ff75789c80835e4aaafc7cbfb049f5ef29584c27910625b7aef3b36b6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de022fc7aa1925c72ae7474cead510ec1b0250a1879a157882455c4937721e6f
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:359057d9660fe2d14af7a17c1643f1a9bad16dc0d152f01e09a837e37cbd211e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db8ff398e296fc80d27c81c792fc561b8565bd13d3296779cf24d36d13c2df0f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.04184722312616072,
5
  "eval_steps": 500,
6
- "global_step": 108,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -763,6 +763,34 @@
763
  "learning_rate": 9.98789718527821e-06,
764
  "loss": 1.786,
765
  "step": 108
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
766
  }
767
  ],
768
  "logging_steps": 1.0,
@@ -782,7 +810,7 @@
782
  "attributes": {}
783
  }
784
  },
785
- "total_flos": 1.0647698517059789e+17,
786
  "train_batch_size": 1,
787
  "trial_name": null,
788
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.04339712027898149,
5
  "eval_steps": 500,
6
+ "global_step": 112,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
763
  "learning_rate": 9.98789718527821e-06,
764
  "loss": 1.786,
765
  "step": 108
766
+ },
767
+ {
768
+ "epoch": 0.04223469741436591,
769
+ "grad_norm": 0.13741853833198547,
770
+ "learning_rate": 9.987461264941803e-06,
771
+ "loss": 1.7147,
772
+ "step": 109
773
+ },
774
+ {
775
+ "epoch": 0.042622171702571106,
776
+ "grad_norm": 0.11314312368631363,
777
+ "learning_rate": 9.987017642222821e-06,
778
+ "loss": 1.7257,
779
+ "step": 110
780
+ },
781
+ {
782
+ "epoch": 0.04300964599077629,
783
+ "grad_norm": 0.12022025883197784,
784
+ "learning_rate": 9.986566317806374e-06,
785
+ "loss": 1.7829,
786
+ "step": 111
787
+ },
788
+ {
789
+ "epoch": 0.04339712027898149,
790
+ "grad_norm": 0.11993694305419922,
791
+ "learning_rate": 9.986107292389465e-06,
792
+ "loss": 1.7713,
793
+ "step": 112
794
  }
795
  ],
796
  "logging_steps": 1.0,
 
810
  "attributes": {}
811
  }
812
  },
813
+ "total_flos": 1.1051198111020954e+17,
814
  "train_batch_size": 1,
815
  "trial_name": null,
816
  "trial_params": null