sedrickkeh commited on
Commit
191b52e
·
verified ·
1 Parent(s): a67f9ba

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5b08b4703756c4091fedb1a9e874f38eaa78571a61362b0ad4ce83b497f4233
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4180df440ce5cd18dd6171e2e284ed0aaa2831f88cd375288774c1bf9e60bc93
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0d2f49e69b2dd768c1f9e17feebea2ee931c43c7ba1d7c105caa51bfd8bdc78
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cda9837a8d6899eec86fc86dc8328c7f71dbef26017e41636b038f918b03ed84
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08adbc30b1fe311391019240da30ea085a05597faed7d5da82e1b1b703680c90
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6fa5b55a76bf348f8c06e0c7d4ffad9f20760ee13d12913c11d0c7436155575
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f39885e6def2b2c441905ba3ec981ee712c923596d51a41dec55b88f343faed8
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a899bcd13f961e2731ea151e30259e62b5c6972f2a43128fcab9c638d6f64217
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -10,3 +10,8 @@
10
  {"current_steps": 10, "total_steps": 25, "loss": 0.6852, "lr": 7.703204087277989e-06, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "0:12:27", "remaining_time": "0:18:40"}
11
  {"current_steps": 11, "total_steps": 25, "loss": 0.6784, "lr": 7.0770750650094335e-06, "epoch": 2.2, "percentage": 44.0, "elapsed_time": "0:14:41", "remaining_time": "0:18:41"}
12
  {"current_steps": 12, "total_steps": 25, "loss": 0.6349, "lr": 6.408662784207149e-06, "epoch": 2.4, "percentage": 48.0, "elapsed_time": "0:15:51", "remaining_time": "0:17:10"}
 
 
 
 
 
 
10
  {"current_steps": 10, "total_steps": 25, "loss": 0.6852, "lr": 7.703204087277989e-06, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "0:12:27", "remaining_time": "0:18:40"}
11
  {"current_steps": 11, "total_steps": 25, "loss": 0.6784, "lr": 7.0770750650094335e-06, "epoch": 2.2, "percentage": 44.0, "elapsed_time": "0:14:41", "remaining_time": "0:18:41"}
12
  {"current_steps": 12, "total_steps": 25, "loss": 0.6349, "lr": 6.408662784207149e-06, "epoch": 2.4, "percentage": 48.0, "elapsed_time": "0:15:51", "remaining_time": "0:17:10"}
13
+ {"current_steps": 13, "total_steps": 25, "loss": 0.6179, "lr": 5.711574191366427e-06, "epoch": 2.6, "percentage": 52.0, "elapsed_time": "0:17:11", "remaining_time": "0:15:52"}
14
+ {"current_steps": 14, "total_steps": 25, "loss": 0.6468, "lr": 5e-06, "epoch": 2.8, "percentage": 56.0, "elapsed_time": "0:18:10", "remaining_time": "0:14:16"}
15
+ {"current_steps": 15, "total_steps": 25, "loss": 0.6264, "lr": 4.2884258086335755e-06, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "0:19:20", "remaining_time": "0:12:53"}
16
+ {"current_steps": 16, "total_steps": 25, "loss": 0.5678, "lr": 3.5913372157928515e-06, "epoch": 3.2, "percentage": 64.0, "elapsed_time": "0:21:32", "remaining_time": "0:12:07"}
17
+ {"current_steps": 17, "total_steps": 25, "loss": 0.6467, "lr": 2.9229249349905686e-06, "epoch": 3.4, "percentage": 68.0, "elapsed_time": "0:22:49", "remaining_time": "0:10:44"}