pmahdavi commited on
Commit
8f0c6e8
·
verified ·
1 Parent(s): 8e511b4

Upload run root files (non-recursive) - trainer_log.jsonl

Browse files
Files changed (1) hide show
  1. trainer_log.jsonl +122 -0
trainer_log.jsonl ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"current_steps": 10, "total_steps": 1100, "loss": 0.9318, "lr": 5e-06, "epoch": 0.009087552892397694, "percentage": 0.91, "elapsed_time": "0:09:42", "remaining_time": "17:37:46"}
2
+ {"current_steps": 20, "total_steps": 1100, "loss": 0.8765, "lr": 5e-06, "epoch": 0.01817510578479539, "percentage": 1.82, "elapsed_time": "0:19:27", "remaining_time": "17:30:49"}
3
+ {"current_steps": 30, "total_steps": 1100, "loss": 0.8635, "lr": 5e-06, "epoch": 0.02726265867719308, "percentage": 2.73, "elapsed_time": "0:29:17", "remaining_time": "17:24:54"}
4
+ {"current_steps": 40, "total_steps": 1100, "loss": 0.8595, "lr": 5e-06, "epoch": 0.03635021156959078, "percentage": 3.64, "elapsed_time": "0:38:59", "remaining_time": "17:13:23"}
5
+ {"current_steps": 50, "total_steps": 1100, "loss": 0.8754, "lr": 5e-06, "epoch": 0.04543776446198847, "percentage": 4.55, "elapsed_time": "0:48:44", "remaining_time": "17:03:24"}
6
+ {"current_steps": 60, "total_steps": 1100, "loss": 0.886, "lr": 5e-06, "epoch": 0.05452531735438616, "percentage": 5.45, "elapsed_time": "0:58:29", "remaining_time": "16:53:44"}
7
+ {"current_steps": 70, "total_steps": 1100, "loss": 0.8722, "lr": 5e-06, "epoch": 0.06361287024678386, "percentage": 6.36, "elapsed_time": "1:08:22", "remaining_time": "16:46:09"}
8
+ {"current_steps": 80, "total_steps": 1100, "loss": 0.8908, "lr": 5e-06, "epoch": 0.07270042313918156, "percentage": 7.27, "elapsed_time": "1:18:12", "remaining_time": "16:37:14"}
9
+ {"current_steps": 90, "total_steps": 1100, "loss": 0.8608, "lr": 5e-06, "epoch": 0.08178797603157925, "percentage": 8.18, "elapsed_time": "1:27:55", "remaining_time": "16:26:41"}
10
+ {"current_steps": 100, "total_steps": 1100, "loss": 0.8738, "lr": 5e-06, "epoch": 0.09087552892397693, "percentage": 9.09, "elapsed_time": "1:37:40", "remaining_time": "16:16:43"}
11
+ {"current_steps": 100, "total_steps": 1100, "eval_loss": 0.8080399632453918, "epoch": 0.09087552892397693, "percentage": 9.09, "elapsed_time": "1:40:58", "remaining_time": "16:49:45"}
12
+ {"current_steps": 110, "total_steps": 1100, "loss": 0.8853, "lr": 5e-06, "epoch": 0.09996308181637463, "percentage": 10.0, "elapsed_time": "1:50:45", "remaining_time": "16:36:47"}
13
+ {"current_steps": 120, "total_steps": 1100, "loss": 0.8722, "lr": 5e-06, "epoch": 0.10905063470877233, "percentage": 10.91, "elapsed_time": "2:00:28", "remaining_time": "16:23:52"}
14
+ {"current_steps": 130, "total_steps": 1100, "loss": 0.8697, "lr": 5e-06, "epoch": 0.11813818760117002, "percentage": 11.82, "elapsed_time": "2:10:22", "remaining_time": "16:12:48"}
15
+ {"current_steps": 140, "total_steps": 1100, "loss": 0.8732, "lr": 5e-06, "epoch": 0.12722574049356772, "percentage": 12.73, "elapsed_time": "2:20:04", "remaining_time": "16:00:31"}
16
+ {"current_steps": 150, "total_steps": 1100, "loss": 0.881, "lr": 5e-06, "epoch": 0.1363132933859654, "percentage": 13.64, "elapsed_time": "2:30:01", "remaining_time": "15:50:08"}
17
+ {"current_steps": 160, "total_steps": 1100, "loss": 0.8533, "lr": 5e-06, "epoch": 0.1454008462783631, "percentage": 14.55, "elapsed_time": "2:39:56", "remaining_time": "15:39:37"}
18
+ {"current_steps": 170, "total_steps": 1100, "loss": 0.8554, "lr": 5e-06, "epoch": 0.1544883991707608, "percentage": 15.45, "elapsed_time": "2:49:39", "remaining_time": "15:28:05"}
19
+ {"current_steps": 180, "total_steps": 1100, "loss": 0.8666, "lr": 5e-06, "epoch": 0.1635759520631585, "percentage": 16.36, "elapsed_time": "2:59:19", "remaining_time": "15:16:30"}
20
+ {"current_steps": 190, "total_steps": 1100, "loss": 0.8449, "lr": 5e-06, "epoch": 0.17266350495555619, "percentage": 17.27, "elapsed_time": "3:09:03", "remaining_time": "15:05:27"}
21
+ {"current_steps": 200, "total_steps": 1100, "loss": 0.8557, "lr": 5e-06, "epoch": 0.18175105784795387, "percentage": 18.18, "elapsed_time": "3:18:53", "remaining_time": "14:55:02"}
22
+ {"current_steps": 200, "total_steps": 1100, "eval_loss": 0.8015328049659729, "epoch": 0.18175105784795387, "percentage": 18.18, "elapsed_time": "3:22:12", "remaining_time": "15:09:54"}
23
+ {"current_steps": 210, "total_steps": 1100, "loss": 0.8449, "lr": 5e-06, "epoch": 0.19083861074035158, "percentage": 19.09, "elapsed_time": "3:31:54", "remaining_time": "14:58:05"}
24
+ {"current_steps": 220, "total_steps": 1100, "loss": 0.8607, "lr": 5e-06, "epoch": 0.19992616363274926, "percentage": 20.0, "elapsed_time": "3:41:46", "remaining_time": "14:47:06"}
25
+ {"current_steps": 230, "total_steps": 1100, "loss": 0.8364, "lr": 5e-06, "epoch": 0.20901371652514697, "percentage": 20.91, "elapsed_time": "3:51:44", "remaining_time": "14:36:36"}
26
+ {"current_steps": 240, "total_steps": 1100, "loss": 0.8666, "lr": 5e-06, "epoch": 0.21810126941754465, "percentage": 21.82, "elapsed_time": "4:01:31", "remaining_time": "14:25:27"}
27
+ {"current_steps": 250, "total_steps": 1100, "loss": 0.8468, "lr": 5e-06, "epoch": 0.22718882230994236, "percentage": 22.73, "elapsed_time": "4:11:20", "remaining_time": "14:14:35"}
28
+ {"current_steps": 260, "total_steps": 1100, "loss": 0.8519, "lr": 5e-06, "epoch": 0.23627637520234004, "percentage": 23.64, "elapsed_time": "4:21:08", "remaining_time": "14:03:39"}
29
+ {"current_steps": 270, "total_steps": 1100, "loss": 0.8681, "lr": 5e-06, "epoch": 0.24536392809473773, "percentage": 24.55, "elapsed_time": "4:30:55", "remaining_time": "13:52:51"}
30
+ {"current_steps": 280, "total_steps": 1100, "loss": 0.8804, "lr": 5e-06, "epoch": 0.25445148098713544, "percentage": 25.45, "elapsed_time": "4:40:41", "remaining_time": "13:42:00"}
31
+ {"current_steps": 290, "total_steps": 1100, "loss": 0.8385, "lr": 5e-06, "epoch": 0.26353903387953315, "percentage": 26.36, "elapsed_time": "4:50:33", "remaining_time": "13:31:32"}
32
+ {"current_steps": 300, "total_steps": 1100, "loss": 0.8619, "lr": 5e-06, "epoch": 0.2726265867719308, "percentage": 27.27, "elapsed_time": "5:00:25", "remaining_time": "13:21:09"}
33
+ {"current_steps": 300, "total_steps": 1100, "eval_loss": 0.7971594333648682, "epoch": 0.2726265867719308, "percentage": 27.27, "elapsed_time": "5:03:44", "remaining_time": "13:29:57"}
34
+ {"current_steps": 310, "total_steps": 1100, "loss": 0.8621, "lr": 5e-06, "epoch": 0.2817141396643285, "percentage": 28.18, "elapsed_time": "5:13:28", "remaining_time": "13:18:51"}
35
+ {"current_steps": 320, "total_steps": 1100, "loss": 0.8369, "lr": 5e-06, "epoch": 0.2908016925567262, "percentage": 29.09, "elapsed_time": "5:23:11", "remaining_time": "13:07:46"}
36
+ {"current_steps": 330, "total_steps": 1100, "loss": 0.8748, "lr": 5e-06, "epoch": 0.2998892454491239, "percentage": 30.0, "elapsed_time": "5:32:58", "remaining_time": "12:56:56"}
37
+ {"current_steps": 340, "total_steps": 1100, "loss": 0.8158, "lr": 5e-06, "epoch": 0.3089767983415216, "percentage": 30.91, "elapsed_time": "5:42:44", "remaining_time": "12:46:08"}
38
+ {"current_steps": 350, "total_steps": 1100, "loss": 0.8522, "lr": 5e-06, "epoch": 0.3180643512339193, "percentage": 31.82, "elapsed_time": "5:52:27", "remaining_time": "12:35:15"}
39
+ {"current_steps": 360, "total_steps": 1100, "loss": 0.8465, "lr": 5e-06, "epoch": 0.327151904126317, "percentage": 32.73, "elapsed_time": "6:02:23", "remaining_time": "12:24:54"}
40
+ {"current_steps": 370, "total_steps": 1100, "loss": 0.8528, "lr": 5e-06, "epoch": 0.33623945701871466, "percentage": 33.64, "elapsed_time": "6:12:10", "remaining_time": "12:14:17"}
41
+ {"current_steps": 380, "total_steps": 1100, "loss": 0.8838, "lr": 5e-06, "epoch": 0.34532700991111237, "percentage": 34.55, "elapsed_time": "6:21:52", "remaining_time": "12:03:32"}
42
+ {"current_steps": 390, "total_steps": 1100, "loss": 0.8318, "lr": 5e-06, "epoch": 0.3544145628035101, "percentage": 35.45, "elapsed_time": "6:31:55", "remaining_time": "11:53:30"}
43
+ {"current_steps": 400, "total_steps": 1100, "loss": 0.8201, "lr": 5e-06, "epoch": 0.36350211569590773, "percentage": 36.36, "elapsed_time": "6:41:43", "remaining_time": "11:43:00"}
44
+ {"current_steps": 400, "total_steps": 1100, "eval_loss": 0.7944772839546204, "epoch": 0.36350211569590773, "percentage": 36.36, "elapsed_time": "6:45:01", "remaining_time": "11:48:47"}
45
+ {"current_steps": 410, "total_steps": 1100, "loss": 0.8416, "lr": 5e-06, "epoch": 0.37258966858830544, "percentage": 37.27, "elapsed_time": "6:54:43", "remaining_time": "11:37:56"}
46
+ {"current_steps": 420, "total_steps": 1100, "loss": 0.8544, "lr": 5e-06, "epoch": 0.38167722148070315, "percentage": 38.18, "elapsed_time": "7:04:34", "remaining_time": "11:27:23"}
47
+ {"current_steps": 430, "total_steps": 1100, "loss": 0.8676, "lr": 5e-06, "epoch": 0.39076477437310086, "percentage": 39.09, "elapsed_time": "7:14:20", "remaining_time": "11:16:45"}
48
+ {"current_steps": 440, "total_steps": 1100, "loss": 0.8436, "lr": 5e-06, "epoch": 0.3998523272654985, "percentage": 40.0, "elapsed_time": "7:24:07", "remaining_time": "11:06:11"}
49
+ {"current_steps": 450, "total_steps": 1100, "loss": 0.8385, "lr": 5e-06, "epoch": 0.40893988015789623, "percentage": 40.91, "elapsed_time": "7:34:09", "remaining_time": "10:56:00"}
50
+ {"current_steps": 460, "total_steps": 1100, "loss": 0.8473, "lr": 5e-06, "epoch": 0.41802743305029394, "percentage": 41.82, "elapsed_time": "7:44:07", "remaining_time": "10:45:43"}
51
+ {"current_steps": 470, "total_steps": 1100, "loss": 0.8213, "lr": 5e-06, "epoch": 0.4271149859426916, "percentage": 42.73, "elapsed_time": "7:54:04", "remaining_time": "10:35:27"}
52
+ {"current_steps": 480, "total_steps": 1100, "loss": 0.8613, "lr": 5e-06, "epoch": 0.4362025388350893, "percentage": 43.64, "elapsed_time": "8:03:43", "remaining_time": "10:24:48"}
53
+ {"current_steps": 490, "total_steps": 1100, "loss": 0.8602, "lr": 5e-06, "epoch": 0.445290091727487, "percentage": 44.55, "elapsed_time": "8:13:33", "remaining_time": "10:14:25"}
54
+ {"current_steps": 500, "total_steps": 1100, "loss": 0.8609, "lr": 5e-06, "epoch": 0.4543776446198847, "percentage": 45.45, "elapsed_time": "8:23:16", "remaining_time": "10:03:56"}
55
+ {"current_steps": 500, "total_steps": 1100, "eval_loss": 0.7920035123825073, "epoch": 0.4543776446198847, "percentage": 45.45, "elapsed_time": "8:26:35", "remaining_time": "10:07:54"}
56
+ {"current_steps": 510, "total_steps": 1100, "loss": 0.8516, "lr": 5e-06, "epoch": 0.4634651975122824, "percentage": 46.36, "elapsed_time": "8:36:16", "remaining_time": "9:57:15"}
57
+ {"current_steps": 520, "total_steps": 1100, "loss": 0.8239, "lr": 5e-06, "epoch": 0.4725527504046801, "percentage": 47.27, "elapsed_time": "8:46:06", "remaining_time": "9:46:49"}
58
+ {"current_steps": 530, "total_steps": 1100, "loss": 0.8421, "lr": 5e-06, "epoch": 0.4816403032970778, "percentage": 48.18, "elapsed_time": "8:55:46", "remaining_time": "9:36:12"}
59
+ {"current_steps": 540, "total_steps": 1100, "loss": 0.8498, "lr": 5e-06, "epoch": 0.49072785618947545, "percentage": 49.09, "elapsed_time": "9:05:28", "remaining_time": "9:25:40"}
60
+ {"current_steps": 550, "total_steps": 1100, "loss": 0.8472, "lr": 5e-06, "epoch": 0.49981540908187316, "percentage": 50.0, "elapsed_time": "9:15:08", "remaining_time": "9:15:08"}
61
+ {"current_steps": 560, "total_steps": 1100, "loss": 0.8166, "lr": 5e-06, "epoch": 0.5089029619742709, "percentage": 50.91, "elapsed_time": "9:24:58", "remaining_time": "9:04:47"}
62
+ {"current_steps": 570, "total_steps": 1100, "loss": 0.8717, "lr": 5e-06, "epoch": 0.5179905148666686, "percentage": 51.82, "elapsed_time": "9:34:48", "remaining_time": "8:54:28"}
63
+ {"current_steps": 580, "total_steps": 1100, "loss": 0.8406, "lr": 5e-06, "epoch": 0.5270780677590663, "percentage": 52.73, "elapsed_time": "9:44:43", "remaining_time": "8:44:14"}
64
+ {"current_steps": 590, "total_steps": 1100, "loss": 0.822, "lr": 5e-06, "epoch": 0.536165620651464, "percentage": 53.64, "elapsed_time": "9:54:28", "remaining_time": "8:33:51"}
65
+ {"current_steps": 600, "total_steps": 1100, "loss": 0.8175, "lr": 5e-06, "epoch": 0.5452531735438616, "percentage": 54.55, "elapsed_time": "10:04:21", "remaining_time": "8:23:38"}
66
+ {"current_steps": 600, "total_steps": 1100, "eval_loss": 0.7903430461883545, "epoch": 0.5452531735438616, "percentage": 54.55, "elapsed_time": "10:07:40", "remaining_time": "8:26:23"}
67
+ {"current_steps": 610, "total_steps": 1100, "loss": 0.8378, "lr": 5e-06, "epoch": 0.5543407264362593, "percentage": 55.45, "elapsed_time": "10:17:29", "remaining_time": "8:16:01"}
68
+ {"current_steps": 620, "total_steps": 1100, "loss": 0.8346, "lr": 5e-06, "epoch": 0.563428279328657, "percentage": 56.36, "elapsed_time": "10:27:08", "remaining_time": "8:05:31"}
69
+ {"current_steps": 630, "total_steps": 1100, "loss": 0.854, "lr": 5e-06, "epoch": 0.5725158322210547, "percentage": 57.27, "elapsed_time": "10:36:47", "remaining_time": "7:55:03"}
70
+ {"current_steps": 640, "total_steps": 1100, "loss": 0.842, "lr": 5e-06, "epoch": 0.5816033851134524, "percentage": 58.18, "elapsed_time": "10:46:29", "remaining_time": "7:44:40"}
71
+ {"current_steps": 650, "total_steps": 1100, "loss": 0.8503, "lr": 5e-06, "epoch": 0.5906909380058502, "percentage": 59.09, "elapsed_time": "10:56:17", "remaining_time": "7:34:21"}
72
+ {"current_steps": 660, "total_steps": 1100, "loss": 0.856, "lr": 5e-06, "epoch": 0.5997784908982478, "percentage": 60.0, "elapsed_time": "11:06:00", "remaining_time": "7:24:00"}
73
+ {"current_steps": 670, "total_steps": 1100, "loss": 0.844, "lr": 4.994840115578491e-06, "epoch": 0.6088660437906455, "percentage": 60.91, "elapsed_time": "11:15:54", "remaining_time": "7:13:47"}
74
+ {"current_steps": 680, "total_steps": 1100, "loss": 0.863, "lr": 4.977030821727762e-06, "epoch": 0.6179535966830432, "percentage": 61.82, "elapsed_time": "11:25:49", "remaining_time": "7:03:35"}
75
+ {"current_steps": 690, "total_steps": 1100, "loss": 0.8577, "lr": 4.946599146595769e-06, "epoch": 0.6270411495754409, "percentage": 62.73, "elapsed_time": "11:35:36", "remaining_time": "6:53:19"}
76
+ {"current_steps": 700, "total_steps": 1100, "loss": 0.8462, "lr": 4.903700163023421e-06, "epoch": 0.6361287024678386, "percentage": 63.64, "elapsed_time": "11:45:28", "remaining_time": "6:43:07"}
77
+ {"current_steps": 700, "total_steps": 1100, "eval_loss": 0.7885037660598755, "epoch": 0.6361287024678386, "percentage": 63.64, "elapsed_time": "11:48:46", "remaining_time": "6:45:00"}
78
+ {"current_steps": 710, "total_steps": 1100, "loss": 0.8692, "lr": 4.848552474397677e-06, "epoch": 0.6452162553602363, "percentage": 64.55, "elapsed_time": "11:58:39", "remaining_time": "6:34:45"}
79
+ {"current_steps": 720, "total_steps": 1100, "loss": 0.8427, "lr": 4.78143710069879e-06, "epoch": 0.654303808252634, "percentage": 65.45, "elapsed_time": "12:08:23", "remaining_time": "6:24:25"}
80
+ {"current_steps": 730, "total_steps": 1100, "loss": 0.8471, "lr": 4.702696046486912e-06, "epoch": 0.6633913611450316, "percentage": 66.36, "elapsed_time": "12:18:17", "remaining_time": "6:14:12"}
81
+ {"current_steps": 740, "total_steps": 1100, "loss": 0.8529, "lr": 4.6127305581252414e-06, "epoch": 0.6724789140374293, "percentage": 67.27, "elapsed_time": "12:28:00", "remaining_time": "6:03:53"}
82
+ {"current_steps": 750, "total_steps": 1100, "loss": 0.8312, "lr": 4.5119990791205335e-06, "epoch": 0.681566466929827, "percentage": 68.18, "elapsed_time": "12:37:37", "remaining_time": "5:53:33"}
83
+ {"current_steps": 760, "total_steps": 1100, "loss": 0.8278, "lr": 4.401014914000078e-06, "epoch": 0.6906540198222247, "percentage": 69.09, "elapsed_time": "12:47:28", "remaining_time": "5:43:20"}
84
+ {"current_steps": 770, "total_steps": 1100, "loss": 0.852, "lr": 4.28034361262948e-06, "epoch": 0.6997415727146225, "percentage": 70.0, "elapsed_time": "12:57:28", "remaining_time": "5:33:12"}
85
+ {"current_steps": 780, "total_steps": 1100, "loss": 0.8625, "lr": 4.150600088300188e-06, "epoch": 0.7088291256070202, "percentage": 70.91, "elapsed_time": "13:07:14", "remaining_time": "5:22:58"}
86
+ {"current_steps": 790, "total_steps": 1100, "loss": 0.881, "lr": 4.012445484272307e-06, "epoch": 0.7179166784994179, "percentage": 71.82, "elapsed_time": "13:17:03", "remaining_time": "5:12:46"}
87
+ {"current_steps": 800, "total_steps": 1100, "loss": 0.8307, "lr": 3.866583804740095e-06, "epoch": 0.7270042313918155, "percentage": 72.73, "elapsed_time": "13:26:54", "remaining_time": "5:02:35"}
88
+ {"current_steps": 800, "total_steps": 1100, "eval_loss": 0.7850208878517151, "epoch": 0.7270042313918155, "percentage": 72.73, "elapsed_time": "13:30:12", "remaining_time": "5:03:49"}
89
+ {"current_steps": 810, "total_steps": 1100, "loss": 0.7981, "lr": 3.7137583273879606e-06, "epoch": 0.7360917842842132, "percentage": 73.64, "elapsed_time": "13:40:04", "remaining_time": "4:53:36"}
90
+ {"current_steps": 820, "total_steps": 1100, "loss": 0.8711, "lr": 3.554747815817756e-06, "epoch": 0.7451793371766109, "percentage": 74.55, "elapsed_time": "13:49:50", "remaining_time": "4:43:21"}
91
+ {"current_steps": 830, "total_steps": 1100, "loss": 0.8472, "lr": 3.3903625511479745e-06, "epoch": 0.7542668900690086, "percentage": 75.45, "elapsed_time": "13:59:28", "remaining_time": "4:33:04"}
92
+ {"current_steps": 840, "total_steps": 1100, "loss": 0.8438, "lr": 3.2214402030068974e-06, "epoch": 0.7633544429614063, "percentage": 76.36, "elapsed_time": "14:09:06", "remaining_time": "4:22:49"}
93
+ {"current_steps": 850, "total_steps": 1100, "loss": 0.8275, "lr": 3.0488415609601863e-06, "epoch": 0.772441995853804, "percentage": 77.27, "elapsed_time": "14:18:59", "remaining_time": "4:12:38"}
94
+ {"current_steps": 860, "total_steps": 1100, "loss": 0.838, "lr": 2.873446148124563e-06, "epoch": 0.7815295487462017, "percentage": 78.18, "elapsed_time": "14:28:39", "remaining_time": "4:02:25"}
95
+ {"current_steps": 870, "total_steps": 1100, "loss": 0.8276, "lr": 2.696147739319613e-06, "epoch": 0.7906171016385993, "percentage": 79.09, "elapsed_time": "14:38:30", "remaining_time": "3:52:14"}
96
+ {"current_steps": 880, "total_steps": 1100, "loss": 0.8335, "lr": 2.517849806596174e-06, "epoch": 0.799704654530997, "percentage": 80.0, "elapsed_time": "14:48:16", "remaining_time": "3:42:04"}
97
+ {"current_steps": 890, "total_steps": 1100, "loss": 0.8423, "lr": 2.339460915349862e-06, "epoch": 0.8087922074233947, "percentage": 80.91, "elapsed_time": "14:58:00", "remaining_time": "3:31:53"}
98
+ {"current_steps": 900, "total_steps": 1100, "loss": 0.8595, "lr": 2.161890094480078e-06, "epoch": 0.8178797603157925, "percentage": 81.82, "elapsed_time": "15:07:55", "remaining_time": "3:21:45"}
99
+ {"current_steps": 900, "total_steps": 1100, "eval_loss": 0.7791374325752258, "epoch": 0.8178797603157925, "percentage": 81.82, "elapsed_time": "15:11:13", "remaining_time": "3:22:29"}
100
+ {"current_steps": 910, "total_steps": 1100, "loss": 0.844, "lr": 1.986042204187099e-06, "epoch": 0.8269673132081902, "percentage": 82.73, "elapsed_time": "15:21:01", "remaining_time": "3:12:18"}
101
+ {"current_steps": 920, "total_steps": 1100, "loss": 0.8302, "lr": 1.8128133250119156e-06, "epoch": 0.8360548661005879, "percentage": 83.64, "elapsed_time": "15:30:41", "remaining_time": "3:02:05"}
102
+ {"current_steps": 930, "total_steps": 1100, "loss": 0.8163, "lr": 1.643086191615194e-06, "epoch": 0.8451424189929856, "percentage": 84.55, "elapsed_time": "15:40:29", "remaining_time": "2:51:55"}
103
+ {"current_steps": 940, "total_steps": 1100, "loss": 0.8225, "lr": 1.4777256945637835e-06, "epoch": 0.8542299718853832, "percentage": 85.45, "elapsed_time": "15:50:12", "remaining_time": "2:41:44"}
104
+ {"current_steps": 950, "total_steps": 1100, "loss": 0.8363, "lr": 1.3175744730466407e-06, "epoch": 0.8633175247777809, "percentage": 86.36, "elapsed_time": "15:59:52", "remaining_time": "2:31:33"}
105
+ {"current_steps": 960, "total_steps": 1100, "loss": 0.8279, "lr": 1.163448620978674e-06, "epoch": 0.8724050776701786, "percentage": 87.27, "elapsed_time": "16:09:29", "remaining_time": "2:21:23"}
106
+ {"current_steps": 970, "total_steps": 1100, "loss": 0.8295, "lr": 1.0161335283732152e-06, "epoch": 0.8814926305625763, "percentage": 88.18, "elapsed_time": "16:19:12", "remaining_time": "2:11:14"}
107
+ {"current_steps": 980, "total_steps": 1100, "loss": 0.8335, "lr": 8.763798791745413e-07, "epoch": 0.890580183454974, "percentage": 89.09, "elapsed_time": "16:28:58", "remaining_time": "2:01:05"}
108
+ {"current_steps": 990, "total_steps": 1100, "loss": 0.8221, "lr": 7.448998259445664e-07, "epoch": 0.8996677363473717, "percentage": 90.0, "elapsed_time": "16:38:42", "remaining_time": "1:50:58"}
109
+ {"current_steps": 1000, "total_steps": 1100, "loss": 0.8116, "lr": 6.223633608966254e-07, "epoch": 0.9087552892397694, "percentage": 90.91, "elapsed_time": "16:48:24", "remaining_time": "1:40:50"}
110
+ {"current_steps": 1000, "total_steps": 1100, "eval_loss": 0.7747718691825867, "epoch": 0.9087552892397694, "percentage": 90.91, "elapsed_time": "16:51:42", "remaining_time": "1:41:10"}
111
+ {"current_steps": 1010, "total_steps": 1100, "loss": 0.7986, "lr": 5.093949017687341e-07, "epoch": 0.917842842132167, "percentage": 91.82, "elapsed_time": "17:01:36", "remaining_time": "1:31:02"}
112
+ {"current_steps": 1020, "total_steps": 1100, "loss": 0.8213, "lr": 4.0657010993391867e-07, "epoch": 0.9269303950245648, "percentage": 92.73, "elapsed_time": "17:11:21", "remaining_time": "1:20:53"}
113
+ {"current_steps": 1030, "total_steps": 1100, "loss": 0.7957, "lr": 3.14412956961819e-07, "epoch": 0.9360179479169625, "percentage": 93.64, "elapsed_time": "17:21:20", "remaining_time": "1:10:46"}
114
+ {"current_steps": 1040, "total_steps": 1100, "loss": 0.8283, "lr": 2.333930545796717e-07, "epoch": 0.9451055008093602, "percentage": 94.55, "elapsed_time": "17:30:59", "remaining_time": "1:00:38"}
115
+ {"current_steps": 1050, "total_steps": 1100, "loss": 0.8226, "lr": 1.6392326163859272e-07, "epoch": 0.9541930537017579, "percentage": 95.45, "elapsed_time": "17:40:42", "remaining_time": "0:50:30"}
116
+ {"current_steps": 1060, "total_steps": 1100, "loss": 0.835, "lr": 1.0635758027950887e-07, "epoch": 0.9632806065941556, "percentage": 96.36, "elapsed_time": "17:50:24", "remaining_time": "0:40:23"}
117
+ {"current_steps": 1070, "total_steps": 1100, "loss": 0.8229, "lr": 6.098935201939188e-08, "epoch": 0.9723681594865533, "percentage": 97.27, "elapsed_time": "18:00:24", "remaining_time": "0:30:17"}
118
+ {"current_steps": 1080, "total_steps": 1100, "loss": 0.8353, "lr": 2.8049762950126125e-08, "epoch": 0.9814557123789509, "percentage": 98.18, "elapsed_time": "18:10:13", "remaining_time": "0:20:11"}
119
+ {"current_steps": 1090, "total_steps": 1100, "loss": 0.8146, "lr": 7.70666566718009e-09, "epoch": 0.9905432652713486, "percentage": 99.09, "elapsed_time": "18:20:04", "remaining_time": "0:10:05"}
120
+ {"current_steps": 1100, "total_steps": 1100, "loss": 0.8221, "lr": 6.372393125203546e-11, "epoch": 0.9996308181637463, "percentage": 100.0, "elapsed_time": "18:29:47", "remaining_time": "0:00:00"}
121
+ {"current_steps": 1100, "total_steps": 1100, "eval_loss": 0.7736018896102905, "epoch": 0.9996308181637463, "percentage": 100.0, "elapsed_time": "18:33:05", "remaining_time": "0:00:00"}
122
+ {"current_steps": 1100, "total_steps": 1100, "epoch": 0.9996308181637463, "percentage": 100.0, "elapsed_time": "18:34:28", "remaining_time": "0:00:00"}