Training in progress, step 822
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc5dcccdfbaf96203a6f97b3697e02999b54c1d2fef673dfc0193588bef5d9e3
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44462f62b24fba70775e207ee41cf9ca89a35f4f991ff0ced9ea2cb74011b796
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b4ad3a705fbfb6d1acbeac821257603fc158bf841b8b0d46ad01c820cb78574
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36c8a97d0e594a7ec96ec13f57adaf646c288d2cfe6cb7b4c90a748cfc9d70a9
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -801,3 +801,25 @@
|
|
801 |
{"current_steps": 799, "total_steps": 822, "loss": 0.5008, "lr": 2.388144091446498e-08, "epoch": 2.91539338654504, "percentage": 97.2, "elapsed_time": "14:59:53", "remaining_time": "0:25:54"}
|
802 |
{"current_steps": 800, "total_steps": 822, "loss": 0.4006, "lr": 2.185141944153979e-08, "epoch": 2.919042189281642, "percentage": 97.32, "elapsed_time": "15:01:03", "remaining_time": "0:24:46"}
|
803 |
{"current_steps": 801, "total_steps": 822, "loss": 0.4227, "lr": 1.9911363897677228e-08, "epoch": 2.922690992018244, "percentage": 97.45, "elapsed_time": "15:04:45", "remaining_time": "0:23:43"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
801 |
{"current_steps": 799, "total_steps": 822, "loss": 0.5008, "lr": 2.388144091446498e-08, "epoch": 2.91539338654504, "percentage": 97.2, "elapsed_time": "14:59:53", "remaining_time": "0:25:54"}
|
802 |
{"current_steps": 800, "total_steps": 822, "loss": 0.4006, "lr": 2.185141944153979e-08, "epoch": 2.919042189281642, "percentage": 97.32, "elapsed_time": "15:01:03", "remaining_time": "0:24:46"}
|
803 |
{"current_steps": 801, "total_steps": 822, "loss": 0.4227, "lr": 1.9911363897677228e-08, "epoch": 2.922690992018244, "percentage": 97.45, "elapsed_time": "15:04:45", "remaining_time": "0:23:43"}
|
804 |
+
{"current_steps": 802, "total_steps": 822, "loss": 0.4486, "lr": 1.8061309343884724e-08, "epoch": 2.926339794754846, "percentage": 97.57, "elapsed_time": "15:05:54", "remaining_time": "0:22:35"}
|
805 |
+
{"current_steps": 803, "total_steps": 822, "loss": 0.3915, "lr": 1.6301289214655236e-08, "epoch": 2.929988597491448, "percentage": 97.69, "elapsed_time": "15:07:07", "remaining_time": "0:21:27"}
|
806 |
+
{"current_steps": 804, "total_steps": 822, "loss": 0.3805, "lr": 1.4631335317365492e-08, "epoch": 2.9336374002280503, "percentage": 97.81, "elapsed_time": "15:08:29", "remaining_time": "0:20:20"}
|
807 |
+
{"current_steps": 805, "total_steps": 822, "loss": 0.3709, "lr": 1.3051477831699798e-08, "epoch": 2.9372862029646525, "percentage": 97.93, "elapsed_time": "15:09:23", "remaining_time": "0:19:12"}
|
808 |
+
{"current_steps": 806, "total_steps": 822, "loss": 0.3601, "lr": 1.1561745309105476e-08, "epoch": 2.940935005701254, "percentage": 98.05, "elapsed_time": "15:10:27", "remaining_time": "0:18:04"}
|
809 |
+
{"current_steps": 807, "total_steps": 822, "loss": 0.4369, "lr": 1.0162164672276598e-08, "epoch": 2.9445838084378564, "percentage": 98.18, "elapsed_time": "15:11:22", "remaining_time": "0:16:56"}
|
810 |
+
{"current_steps": 808, "total_steps": 822, "loss": 0.4896, "lr": 8.852761214666605e-09, "epoch": 2.9482326111744586, "percentage": 98.3, "elapsed_time": "15:12:30", "remaining_time": "0:15:48"}
|
811 |
+
{"current_steps": 809, "total_steps": 822, "loss": 0.4854, "lr": 7.633558600033675e-09, "epoch": 2.9518814139110603, "percentage": 98.42, "elapsed_time": "15:13:31", "remaining_time": "0:14:40"}
|
812 |
+
{"current_steps": 810, "total_steps": 822, "loss": 0.3978, "lr": 6.504578862009392e-09, "epoch": 2.9555302166476625, "percentage": 98.54, "elapsed_time": "15:14:44", "remaining_time": "0:13:33"}
|
813 |
+
{"current_steps": 811, "total_steps": 822, "loss": 0.4639, "lr": 5.4658424037029585e-09, "epoch": 2.9591790193842646, "percentage": 98.66, "elapsed_time": "15:15:41", "remaining_time": "0:12:25"}
|
814 |
+
{"current_steps": 812, "total_steps": 822, "loss": 0.4339, "lr": 4.5173679973337105e-09, "epoch": 2.9628278221208664, "percentage": 98.78, "elapsed_time": "15:16:55", "remaining_time": "0:11:17"}
|
815 |
+
{"current_steps": 813, "total_steps": 822, "loss": 0.4647, "lr": 3.659172783887499e-09, "epoch": 2.9664766248574685, "percentage": 98.91, "elapsed_time": "15:18:03", "remaining_time": "0:10:09"}
|
816 |
+
{"current_steps": 814, "total_steps": 822, "loss": 0.4208, "lr": 2.89127227281194e-09, "epoch": 2.9701254275940707, "percentage": 99.03, "elapsed_time": "15:19:19", "remaining_time": "0:09:02"}
|
817 |
+
{"current_steps": 815, "total_steps": 822, "loss": 0.4713, "lr": 2.213680341732194e-09, "epoch": 2.973774230330673, "percentage": 99.15, "elapsed_time": "15:20:34", "remaining_time": "0:07:54"}
|
818 |
+
{"current_steps": 816, "total_steps": 822, "loss": 0.4896, "lr": 1.6264092362028306e-09, "epoch": 2.977423033067275, "percentage": 99.27, "elapsed_time": "15:21:53", "remaining_time": "0:06:46"}
|
819 |
+
{"current_steps": 817, "total_steps": 822, "loss": 0.4482, "lr": 1.1294695694841207e-09, "epoch": 2.981071835803877, "percentage": 99.39, "elapsed_time": "15:23:04", "remaining_time": "0:05:38"}
|
820 |
+
{"current_steps": 818, "total_steps": 822, "loss": 0.3958, "lr": 7.228703223532974e-10, "epoch": 2.984720638540479, "percentage": 99.51, "elapsed_time": "15:24:20", "remaining_time": "0:04:31"}
|
821 |
+
{"current_steps": 819, "total_steps": 822, "loss": 0.4403, "lr": 4.0661884293913266e-10, "epoch": 2.988369441277081, "percentage": 99.64, "elapsed_time": "15:25:29", "remaining_time": "0:03:23"}
|
822 |
+
{"current_steps": 820, "total_steps": 822, "loss": 0.4366, "lr": 1.8072084659093158e-10, "epoch": 2.992018244013683, "percentage": 99.76, "elapsed_time": "15:26:36", "remaining_time": "0:02:15"}
|
823 |
+
{"current_steps": 821, "total_steps": 822, "loss": 0.5308, "lr": 4.518041577472598e-11, "epoch": 2.995667046750285, "percentage": 99.88, "elapsed_time": "15:27:38", "remaining_time": "0:01:07"}
|
824 |
+
{"current_steps": 822, "total_steps": 822, "loss": 0.3719, "lr": 0.0, "epoch": 2.9993158494868872, "percentage": 100.0, "elapsed_time": "15:28:56", "remaining_time": "0:00:00"}
|
825 |
+
{"current_steps": 822, "total_steps": 822, "epoch": 2.9993158494868872, "percentage": 100.0, "elapsed_time": "15:31:11", "remaining_time": "0:00:00"}
|