sedrickkeh commited on
Commit
08f65ec
·
verified ·
1 Parent(s): 2824666

Training in progress, epoch 13

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37ca22f04db2fc157fda32fa23257de9d8478f4c59977093764201bbb8e5843c
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a6027a14adbdff1938c8c49c67097b13aa7303263587bd6d5f94262c8743835
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:487c366dc447d9b9bc114e2ef838a7b1857de35d51ba39b3235dd812d0b5041a
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3fa4ad48a96bab25a5e0b2e28b097a33216d84b85b94de0f0252644e180641d
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7175b9b40df2b970bda9435e8e67da47514840c29f6a2334faa4a69bc527dd12
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ad8b56230842e96eed9b77c33bf3a249cbfde38bac90b3301e7701bcdfd63ba
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4256299218b824bbfa9e38de3237ffbf92765e70ef57f2687f9ac972cf4676d9
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa3182a93d0a5860804ddf926aa34f5a5abe2cada77fc957c12ed278c9a0a64a
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -60,3 +60,7 @@
60
  {"current_steps": 60, "total_steps": 65, "loss": 0.2719, "lr": 1.8225003740388546e-07, "epoch": 12.0, "percentage": 92.31, "elapsed_time": "1:20:48", "remaining_time": "0:06:44"}
61
  {"current_steps": 61, "total_steps": 65, "loss": 0.2767, "lr": 1.1689722144956672e-07, "epoch": 12.2, "percentage": 93.85, "elapsed_time": "1:23:10", "remaining_time": "0:05:27"}
62
  {"current_steps": 62, "total_steps": 65, "loss": 0.2726, "lr": 6.58673872923693e-08, "epoch": 12.4, "percentage": 95.38, "elapsed_time": "1:24:08", "remaining_time": "0:04:04"}
 
 
 
 
 
60
  {"current_steps": 60, "total_steps": 65, "loss": 0.2719, "lr": 1.8225003740388546e-07, "epoch": 12.0, "percentage": 92.31, "elapsed_time": "1:20:48", "remaining_time": "0:06:44"}
61
  {"current_steps": 61, "total_steps": 65, "loss": 0.2767, "lr": 1.1689722144956672e-07, "epoch": 12.2, "percentage": 93.85, "elapsed_time": "1:23:10", "remaining_time": "0:05:27"}
62
  {"current_steps": 62, "total_steps": 65, "loss": 0.2726, "lr": 6.58673872923693e-08, "epoch": 12.4, "percentage": 95.38, "elapsed_time": "1:24:08", "remaining_time": "0:04:04"}
63
+ {"current_steps": 63, "total_steps": 65, "loss": 0.2583, "lr": 2.9310214228202016e-08, "epoch": 12.6, "percentage": 96.92, "elapsed_time": "1:25:21", "remaining_time": "0:02:42"}
64
+ {"current_steps": 64, "total_steps": 65, "loss": 0.262, "lr": 7.332930744380906e-09, "epoch": 12.8, "percentage": 98.46, "elapsed_time": "1:26:23", "remaining_time": "0:01:20"}
65
+ {"current_steps": 65, "total_steps": 65, "loss": 0.2516, "lr": 0.0, "epoch": 13.0, "percentage": 100.0, "elapsed_time": "1:27:35", "remaining_time": "0:00:00"}
66
+ {"current_steps": 65, "total_steps": 65, "epoch": 13.0, "percentage": 100.0, "elapsed_time": "1:30:12", "remaining_time": "0:00:00"}