Training in progress, step 100
Browse files- model-00001-of-00006.safetensors +1 -1
- model-00002-of-00006.safetensors +1 -1
- model-00003-of-00006.safetensors +1 -1
- model-00004-of-00006.safetensors +1 -1
- model-00005-of-00006.safetensors +1 -1
- model-00006-of-00006.safetensors +1 -1
- trainer_log.jsonl +104 -303
- training_args.bin +1 -1
model-00001-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4986211280
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d82dd7f90f7f6c9b70f0e7753819c3fa71bccd9aa74dd03ae6672bd38484966d
|
3 |
size 4986211280
|
model-00002-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847344
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c78e4538a333365c98ceb93cc85f5c78fa42efd4089a5b2242868e8b9d952e6b
|
3 |
size 4954847344
|
model-00003-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17b85702e46976fdf1c77cc95b1987e9f64fc0df7340c4ac31e409fd1e51ddfb
|
3 |
size 4954847392
|
model-00004-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f6663530eff6728d9312e7308fadb1c66e593990eebdafb12bbf01942223887
|
3 |
size 4954847392
|
model-00005-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1bbcffbbe2f8665513e52e82a2f425b0177393343e1237064577f9b7fa65bc1
|
3 |
size 4954847392
|
model-00006-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4734533160
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae19f1c4e691285c93fbb028c1b3c542852f5312b5878af32f74b3833d9de97e
|
3 |
size 4734533160
|
trainer_log.jsonl
CHANGED
@@ -1,303 +1,104 @@
|
|
1 |
-
{"current_steps": 1, "total_steps": 459, "loss": 0.9033, "lr": 0.0, "epoch": 0.006528835690968444, "percentage": 0.22, "elapsed_time": "0:01:30", "remaining_time": "11:
|
2 |
-
{"current_steps": 2, "total_steps": 459, "loss": 0.8778, "lr": 2.173913043478261e-07, "epoch": 0.013057671381936888, "percentage": 0.44, "elapsed_time": "0:02:47", "remaining_time": "10:
|
3 |
-
{"current_steps": 3, "total_steps": 459, "loss": 0.
|
4 |
-
{"current_steps": 4, "total_steps": 459, "loss": 0.
|
5 |
-
{"current_steps": 5, "total_steps": 459, "loss": 0.9429, "lr": 8.695652173913044e-07, "epoch": 0.03264417845484222, "percentage": 1.09, "elapsed_time": "0:06:
|
6 |
-
{"current_steps": 6, "total_steps": 459, "loss": 0.
|
7 |
-
{"current_steps": 7, "total_steps": 459, "loss": 0.8914, "lr": 1.3043478260869566e-06, "epoch": 0.04570184983677911, "percentage": 1.53, "elapsed_time": "0:08:
|
8 |
-
{"current_steps": 8, "total_steps": 459, "loss": 0.
|
9 |
-
{"current_steps": 9, "total_steps": 459, "loss": 0.
|
10 |
-
{"current_steps": 10, "total_steps": 459, "loss": 0.
|
11 |
-
{"current_steps": 11, "total_steps": 459, "loss": 0.
|
12 |
-
{"current_steps": 12, "total_steps": 459, "loss": 0.
|
13 |
-
{"current_steps": 13, "total_steps": 459, "loss": 0.
|
14 |
-
{"current_steps": 14, "total_steps": 459, "loss": 0.
|
15 |
-
{"current_steps": 15, "total_steps": 459, "loss": 0.
|
16 |
-
{"current_steps": 16, "total_steps": 459, "loss": 0.
|
17 |
-
{"current_steps": 17, "total_steps": 459, "loss": 0.
|
18 |
-
{"current_steps": 18, "total_steps": 459, "loss": 0.
|
19 |
-
{"current_steps": 19, "total_steps": 459, "loss": 0.
|
20 |
-
{"current_steps": 20, "total_steps": 459, "loss": 0.
|
21 |
-
{"current_steps": 21, "total_steps": 459, "loss": 0.5785, "lr": 4.347826086956522e-06, "epoch": 0.13710554951033732, "percentage": 4.58, "elapsed_time": "0:24:
|
22 |
-
{"current_steps": 22, "total_steps": 459, "loss": 0.
|
23 |
-
{"current_steps": 23, "total_steps": 459, "loss": 0.
|
24 |
-
{"current_steps": 24, "total_steps": 459, "loss": 0.
|
25 |
-
{"current_steps": 25, "total_steps": 459, "loss": 0.
|
26 |
-
{"current_steps": 26, "total_steps": 459, "loss": 0.
|
27 |
-
{"current_steps": 27, "total_steps": 459, "loss": 0.
|
28 |
-
{"current_steps": 28, "total_steps": 459, "loss": 0.
|
29 |
-
{"current_steps": 29, "total_steps": 459, "loss": 0.
|
30 |
-
{"current_steps": 30, "total_steps": 459, "loss": 0.
|
31 |
-
{"current_steps": 31, "total_steps": 459, "loss": 0.
|
32 |
-
{"current_steps": 32, "total_steps": 459, "loss": 0.
|
33 |
-
{"current_steps": 33, "total_steps": 459, "loss": 0.
|
34 |
-
{"current_steps": 34, "total_steps": 459, "loss": 0.
|
35 |
-
{"current_steps": 35, "total_steps": 459, "loss": 0.
|
36 |
-
{"current_steps": 36, "total_steps": 459, "loss": 0.
|
37 |
-
{"current_steps": 37, "total_steps": 459, "loss": 0.
|
38 |
-
{"current_steps": 38, "total_steps": 459, "loss": 0.
|
39 |
-
{"current_steps": 39, "total_steps": 459, "loss": 0.
|
40 |
-
{"current_steps": 40, "total_steps": 459, "loss": 0.
|
41 |
-
{"current_steps": 41, "total_steps": 459, "loss": 0.
|
42 |
-
{"current_steps": 42, "total_steps": 459, "loss": 0.
|
43 |
-
{"current_steps": 43, "total_steps": 459, "loss": 0.
|
44 |
-
{"current_steps": 44, "total_steps": 459, "loss": 0.
|
45 |
-
{"current_steps": 45, "total_steps": 459, "loss": 0.
|
46 |
-
{"current_steps": 46, "total_steps": 459, "loss": 0.
|
47 |
-
{"current_steps": 47, "total_steps": 459, "loss": 0.
|
48 |
-
{"current_steps": 48, "total_steps": 459, "loss": 0.
|
49 |
-
{"current_steps": 49, "total_steps": 459, "loss": 0.
|
50 |
-
{"current_steps": 50, "total_steps": 459, "loss": 0.
|
51 |
-
{"current_steps": 51, "total_steps": 459, "loss": 0.
|
52 |
-
{"current_steps": 52, "total_steps": 459, "loss": 0.
|
53 |
-
{"current_steps": 53, "total_steps": 459, "loss": 0.
|
54 |
-
{"current_steps": 54, "total_steps": 459, "loss": 0.
|
55 |
-
{"current_steps": 55, "total_steps": 459, "loss": 0.
|
56 |
-
{"current_steps": 56, "total_steps": 459, "loss": 0.
|
57 |
-
{"current_steps": 57, "total_steps": 459, "loss": 0.
|
58 |
-
{"current_steps": 58, "total_steps": 459, "loss": 0.
|
59 |
-
{"current_steps": 59, "total_steps": 459, "loss": 0.
|
60 |
-
{"current_steps": 60, "total_steps": 459, "loss": 0.
|
61 |
-
{"current_steps": 61, "total_steps": 459, "loss": 0.
|
62 |
-
{"current_steps": 62, "total_steps": 459, "loss": 0.
|
63 |
-
{"current_steps": 63, "total_steps": 459, "loss": 0.
|
64 |
-
{"current_steps": 64, "total_steps": 459, "loss": 0.
|
65 |
-
{"current_steps": 65, "total_steps": 459, "loss": 0.
|
66 |
-
{"current_steps": 66, "total_steps": 459, "loss": 0.
|
67 |
-
{"current_steps": 67, "total_steps": 459, "loss": 0.
|
68 |
-
{"current_steps": 68, "total_steps": 459, "loss": 0.
|
69 |
-
{"current_steps": 69, "total_steps": 459, "loss": 0.
|
70 |
-
{"current_steps": 70, "total_steps": 459, "loss": 0.
|
71 |
-
{"current_steps": 71, "total_steps": 459, "loss": 0.
|
72 |
-
{"current_steps": 72, "total_steps": 459, "loss": 0.
|
73 |
-
{"current_steps": 73, "total_steps": 459, "loss": 0.
|
74 |
-
{"current_steps": 74, "total_steps": 459, "loss": 0.
|
75 |
-
{"current_steps": 75, "total_steps": 459, "loss": 0.
|
76 |
-
{"current_steps": 76, "total_steps": 459, "loss": 0.4522, "lr": 9.878835952587559e-06, "epoch": 0.4961915125136017, "percentage": 16.56, "elapsed_time": "1:27:
|
77 |
-
{"current_steps": 77, "total_steps": 459, "loss": 0.
|
78 |
-
{"current_steps": 78, "total_steps": 459, "loss": 0.
|
79 |
-
{"current_steps": 79, "total_steps": 459, "loss": 0.
|
80 |
-
{"current_steps": 80, "total_steps": 459, "loss": 0.
|
81 |
-
{"current_steps": 81, "total_steps": 459, "loss": 0.
|
82 |
-
{"current_steps": 82, "total_steps": 459, "loss": 0.
|
83 |
-
{"current_steps": 83, "total_steps": 459, "loss": 0.
|
84 |
-
{"current_steps": 84, "total_steps": 459, "loss": 0.
|
85 |
-
{"current_steps": 85, "total_steps": 459, "loss": 0.
|
86 |
-
{"current_steps": 86, "total_steps": 459, "loss": 0.
|
87 |
-
{"current_steps": 87, "total_steps": 459, "loss": 0.
|
88 |
-
{"current_steps": 88, "total_steps": 459, "loss": 0.
|
89 |
-
{"current_steps": 89, "total_steps": 459, "loss": 0.
|
90 |
-
{"current_steps": 90, "total_steps": 459, "loss": 0.
|
91 |
-
{"current_steps": 91, "total_steps": 459, "loss": 0.
|
92 |
-
{"current_steps": 92, "total_steps": 459, "loss": 0.
|
93 |
-
{"current_steps": 93, "total_steps": 459, "loss": 0.
|
94 |
-
{"current_steps": 94, "total_steps": 459, "loss": 0.
|
95 |
-
{"current_steps": 95, "total_steps": 459, "loss": 0.
|
96 |
-
{"current_steps": 96, "total_steps": 459, "loss": 0.
|
97 |
-
{"current_steps": 97, "total_steps": 459, "loss": 0.3667, "lr": 9.64269588322561e-06, "epoch": 0.6332970620239391, "percentage": 21.13, "elapsed_time": "1:50:
|
98 |
-
{"current_steps": 98, "total_steps": 459, "loss": 0.
|
99 |
-
{"current_steps": 99, "total_steps": 459, "loss": 0.
|
100 |
-
{"current_steps": 100, "total_steps": 459, "loss": 0.
|
101 |
-
{"current_steps": 101, "total_steps": 459, "loss": 0.
|
102 |
-
{"current_steps": 102, "total_steps": 459, "loss": 0.
|
103 |
-
{"current_steps": 103, "total_steps": 459, "loss": 0.
|
104 |
-
{"current_steps": 104, "total_steps": 459, "loss": 0.4406, "lr": 9.537326253216685e-06, "epoch": 0.6789989118607181, "percentage": 22.66, "elapsed_time": "2:01:
|
105 |
-
{"current_steps": 105, "total_steps": 459, "loss": 0.3913, "lr": 9.521216100904379e-06, "epoch": 0.6855277475516867, "percentage": 22.88, "elapsed_time": "2:02:45", "remaining_time": "6:53:52"}
|
106 |
-
{"current_steps": 106, "total_steps": 459, "loss": 0.3939, "lr": 9.504844339512096e-06, "epoch": 0.6920565832426551, "percentage": 23.09, "elapsed_time": "2:03:57", "remaining_time": "6:52:47"}
|
107 |
-
{"current_steps": 107, "total_steps": 459, "loss": 0.4215, "lr": 9.488211916351656e-06, "epoch": 0.6985854189336235, "percentage": 23.31, "elapsed_time": "2:05:03", "remaining_time": "6:51:24"}
|
108 |
-
{"current_steps": 108, "total_steps": 459, "loss": 0.4018, "lr": 9.471319793817427e-06, "epoch": 0.705114254624592, "percentage": 23.53, "elapsed_time": "2:06:20", "remaining_time": "6:50:37"}
|
109 |
-
{"current_steps": 109, "total_steps": 459, "loss": 0.4137, "lr": 9.454168949330644e-06, "epoch": 0.7116430903155604, "percentage": 23.75, "elapsed_time": "2:07:33", "remaining_time": "6:49:35"}
|
110 |
-
{"current_steps": 110, "total_steps": 459, "loss": 0.41, "lr": 9.436760375282858e-06, "epoch": 0.7181719260065288, "percentage": 23.97, "elapsed_time": "2:08:39", "remaining_time": "6:48:12"}
|
111 |
-
{"current_steps": 111, "total_steps": 459, "loss": 0.4062, "lr": 9.419095078978506e-06, "epoch": 0.7247007616974973, "percentage": 24.18, "elapsed_time": "2:09:42", "remaining_time": "6:46:39"}
|
112 |
-
{"current_steps": 112, "total_steps": 459, "loss": 0.4438, "lr": 9.40117408257663e-06, "epoch": 0.7312295973884657, "percentage": 24.4, "elapsed_time": "2:10:24", "remaining_time": "6:44:02"}
|
113 |
-
{"current_steps": 113, "total_steps": 459, "loss": 0.4084, "lr": 9.382998423031728e-06, "epoch": 0.7377584330794341, "percentage": 24.62, "elapsed_time": "2:11:30", "remaining_time": "6:42:41"}
|
114 |
-
{"current_steps": 114, "total_steps": 459, "loss": 0.4159, "lr": 9.364569152033756e-06, "epoch": 0.7442872687704026, "percentage": 24.84, "elapsed_time": "2:12:21", "remaining_time": "6:40:33"}
|
115 |
-
{"current_steps": 115, "total_steps": 459, "loss": 0.4249, "lr": 9.345887335947281e-06, "epoch": 0.750816104461371, "percentage": 25.05, "elapsed_time": "2:13:58", "remaining_time": "6:40:46"}
|
116 |
-
{"current_steps": 116, "total_steps": 459, "loss": 0.4266, "lr": 9.326954055749767e-06, "epoch": 0.7573449401523396, "percentage": 25.27, "elapsed_time": "2:15:10", "remaining_time": "6:39:42"}
|
117 |
-
{"current_steps": 117, "total_steps": 459, "loss": 0.391, "lr": 9.307770406969032e-06, "epoch": 0.763873775843308, "percentage": 25.49, "elapsed_time": "2:16:18", "remaining_time": "6:38:27"}
|
118 |
-
{"current_steps": 118, "total_steps": 459, "loss": 0.4132, "lr": 9.288337499619856e-06, "epoch": 0.7704026115342764, "percentage": 25.71, "elapsed_time": "2:17:33", "remaining_time": "6:37:31"}
|
119 |
-
{"current_steps": 119, "total_steps": 459, "loss": 0.4122, "lr": 9.268656458139763e-06, "epoch": 0.7769314472252449, "percentage": 25.93, "elapsed_time": "2:18:36", "remaining_time": "6:36:02"}
|
120 |
-
{"current_steps": 120, "total_steps": 459, "loss": 0.4441, "lr": 9.24872842132394e-06, "epoch": 0.7834602829162133, "percentage": 26.14, "elapsed_time": "2:19:40", "remaining_time": "6:34:35"}
|
121 |
-
{"current_steps": 121, "total_steps": 459, "loss": 0.3968, "lr": 9.22855454225936e-06, "epoch": 0.7899891186071817, "percentage": 26.36, "elapsed_time": "2:20:54", "remaining_time": "6:33:36"}
|
122 |
-
{"current_steps": 122, "total_steps": 459, "loss": 0.427, "lr": 9.20813598825805e-06, "epoch": 0.7965179542981502, "percentage": 26.58, "elapsed_time": "2:21:53", "remaining_time": "6:31:56"}
|
123 |
-
{"current_steps": 123, "total_steps": 459, "loss": 0.3624, "lr": 9.187473940789558e-06, "epoch": 0.8030467899891186, "percentage": 26.8, "elapsed_time": "2:22:56", "remaining_time": "6:30:28"}
|
124 |
-
{"current_steps": 124, "total_steps": 459, "loss": 0.4224, "lr": 9.166569595412576e-06, "epoch": 0.809575625680087, "percentage": 27.02, "elapsed_time": "2:23:58", "remaining_time": "6:28:56"}
|
125 |
-
{"current_steps": 125, "total_steps": 459, "loss": 0.4247, "lr": 9.145424161705777e-06, "epoch": 0.8161044613710555, "percentage": 27.23, "elapsed_time": "2:25:04", "remaining_time": "6:27:38"}
|
126 |
-
{"current_steps": 126, "total_steps": 459, "loss": 0.3671, "lr": 9.124038863197817e-06, "epoch": 0.8226332970620239, "percentage": 27.45, "elapsed_time": "2:25:57", "remaining_time": "6:25:46"}
|
127 |
-
{"current_steps": 127, "total_steps": 459, "loss": 0.388, "lr": 9.102414937296542e-06, "epoch": 0.8291621327529923, "percentage": 27.67, "elapsed_time": "2:27:04", "remaining_time": "6:24:29"}
|
128 |
-
{"current_steps": 128, "total_steps": 459, "loss": 0.406, "lr": 9.080553635217379e-06, "epoch": 0.8356909684439608, "percentage": 27.89, "elapsed_time": "2:28:06", "remaining_time": "6:23:00"}
|
129 |
-
{"current_steps": 129, "total_steps": 459, "loss": 0.3815, "lr": 9.058456221910956e-06, "epoch": 0.8422198041349293, "percentage": 28.1, "elapsed_time": "2:29:34", "remaining_time": "6:22:37"}
|
130 |
-
{"current_steps": 130, "total_steps": 459, "loss": 0.4293, "lr": 9.036123975989893e-06, "epoch": 0.8487486398258978, "percentage": 28.32, "elapsed_time": "2:30:38", "remaining_time": "6:21:15"}
|
131 |
-
{"current_steps": 131, "total_steps": 459, "loss": 0.4018, "lr": 9.013558189654819e-06, "epoch": 0.8552774755168662, "percentage": 28.54, "elapsed_time": "2:31:53", "remaining_time": "6:20:17"}
|
132 |
-
{"current_steps": 132, "total_steps": 459, "loss": 0.4431, "lr": 8.990760168619616e-06, "epoch": 0.8618063112078346, "percentage": 28.76, "elapsed_time": "2:32:58", "remaining_time": "6:18:57"}
|
133 |
-
{"current_steps": 133, "total_steps": 459, "loss": 0.3856, "lr": 8.967731232035848e-06, "epoch": 0.8683351468988031, "percentage": 28.98, "elapsed_time": "2:34:07", "remaining_time": "6:17:45"}
|
134 |
-
{"current_steps": 134, "total_steps": 459, "loss": 0.3938, "lr": 8.944472712416448e-06, "epoch": 0.8748639825897715, "percentage": 29.19, "elapsed_time": "2:35:06", "remaining_time": "6:16:11"}
|
135 |
-
{"current_steps": 135, "total_steps": 459, "loss": 0.4076, "lr": 8.9209859555586e-06, "epoch": 0.8813928182807399, "percentage": 29.41, "elapsed_time": "2:36:09", "remaining_time": "6:14:46"}
|
136 |
-
{"current_steps": 136, "total_steps": 459, "loss": 0.4226, "lr": 8.897272320465887e-06, "epoch": 0.8879216539717084, "percentage": 29.63, "elapsed_time": "2:37:32", "remaining_time": "6:14:09"}
|
137 |
-
{"current_steps": 137, "total_steps": 459, "loss": 0.3976, "lr": 8.873333179269635e-06, "epoch": 0.8944504896626768, "percentage": 29.85, "elapsed_time": "2:38:34", "remaining_time": "6:12:43"}
|
138 |
-
{"current_steps": 138, "total_steps": 459, "loss": 0.4357, "lr": 8.849169917149532e-06, "epoch": 0.9009793253536452, "percentage": 30.07, "elapsed_time": "2:40:10", "remaining_time": "6:12:34"}
|
139 |
-
{"current_steps": 139, "total_steps": 459, "loss": 0.4299, "lr": 8.824783932253472e-06, "epoch": 0.9075081610446137, "percentage": 30.28, "elapsed_time": "2:41:38", "remaining_time": "6:12:06"}
|
140 |
-
{"current_steps": 140, "total_steps": 459, "loss": 0.4206, "lr": 8.800176635616658e-06, "epoch": 0.9140369967355821, "percentage": 30.5, "elapsed_time": "2:42:39", "remaining_time": "6:10:37"}
|
141 |
-
{"current_steps": 141, "total_steps": 459, "loss": 0.3624, "lr": 8.775349451079948e-06, "epoch": 0.9205658324265505, "percentage": 30.72, "elapsed_time": "2:43:53", "remaining_time": "6:09:38"}
|
142 |
-
{"current_steps": 142, "total_steps": 459, "loss": 0.3737, "lr": 8.750303815207487e-06, "epoch": 0.9270946681175191, "percentage": 30.94, "elapsed_time": "2:44:45", "remaining_time": "6:07:48"}
|
143 |
-
{"current_steps": 143, "total_steps": 459, "loss": 0.3924, "lr": 8.725041177203556e-06, "epoch": 0.9336235038084875, "percentage": 31.15, "elapsed_time": "2:45:44", "remaining_time": "6:06:15"}
|
144 |
-
{"current_steps": 144, "total_steps": 459, "loss": 0.3654, "lr": 8.699562998828739e-06, "epoch": 0.940152339499456, "percentage": 31.37, "elapsed_time": "2:46:45", "remaining_time": "6:04:45"}
|
145 |
-
{"current_steps": 145, "total_steps": 459, "loss": 0.3814, "lr": 8.673870754315336e-06, "epoch": 0.9466811751904244, "percentage": 31.59, "elapsed_time": "2:47:40", "remaining_time": "6:03:06"}
|
146 |
-
{"current_steps": 146, "total_steps": 459, "loss": 0.3905, "lr": 8.64796593028206e-06, "epoch": 0.9532100108813928, "percentage": 31.81, "elapsed_time": "2:48:41", "remaining_time": "6:01:39"}
|
147 |
-
{"current_steps": 147, "total_steps": 459, "loss": 0.3746, "lr": 8.621850025648008e-06, "epoch": 0.9597388465723613, "percentage": 32.03, "elapsed_time": "2:49:57", "remaining_time": "6:00:43"}
|
148 |
-
{"current_steps": 148, "total_steps": 459, "loss": 0.4056, "lr": 8.59552455154595e-06, "epoch": 0.9662676822633297, "percentage": 32.24, "elapsed_time": "2:51:00", "remaining_time": "5:59:20"}
|
149 |
-
{"current_steps": 149, "total_steps": 459, "loss": 0.3741, "lr": 8.56899103123487e-06, "epoch": 0.9727965179542981, "percentage": 32.46, "elapsed_time": "2:51:59", "remaining_time": "5:57:49"}
|
150 |
-
{"current_steps": 150, "total_steps": 459, "loss": 0.3942, "lr": 8.54225100001184e-06, "epoch": 0.9793253536452666, "percentage": 32.68, "elapsed_time": "2:53:05", "remaining_time": "5:56:34"}
|
151 |
-
{"current_steps": 151, "total_steps": 459, "loss": 0.3977, "lr": 8.51530600512318e-06, "epoch": 0.985854189336235, "percentage": 32.9, "elapsed_time": "2:53:55", "remaining_time": "5:54:45"}
|
152 |
-
{"current_steps": 152, "total_steps": 459, "loss": 0.411, "lr": 8.488157605674924e-06, "epoch": 0.9923830250272034, "percentage": 33.12, "elapsed_time": "2:54:53", "remaining_time": "5:53:13"}
|
153 |
-
{"current_steps": 153, "total_steps": 459, "loss": 0.416, "lr": 8.460807372542618e-06, "epoch": 0.998911860718172, "percentage": 33.33, "elapsed_time": "2:56:03", "remaining_time": "5:52:07"}
|
154 |
-
{"current_steps": 154, "total_steps": 459, "loss": 0.3556, "lr": 8.433256888280422e-06, "epoch": 1.0, "percentage": 33.55, "elapsed_time": "2:56:14", "remaining_time": "5:49:03"}
|
155 |
-
{"current_steps": 155, "total_steps": 459, "loss": 0.2629, "lr": 8.405507747029524e-06, "epoch": 1.0065288356909685, "percentage": 33.77, "elapsed_time": "2:57:12", "remaining_time": "5:47:33"}
|
156 |
-
{"current_steps": 156, "total_steps": 459, "loss": 0.2586, "lr": 8.377561554425923e-06, "epoch": 1.0130576713819368, "percentage": 33.99, "elapsed_time": "2:58:30", "remaining_time": "5:46:43"}
|
157 |
-
{"current_steps": 157, "total_steps": 459, "loss": 0.2697, "lr": 8.349419927507505e-06, "epoch": 1.0195865070729053, "percentage": 34.2, "elapsed_time": "2:59:33", "remaining_time": "5:45:23"}
|
158 |
-
{"current_steps": 158, "total_steps": 459, "loss": 0.2862, "lr": 8.321084494620489e-06, "epoch": 1.0261153427638738, "percentage": 34.42, "elapsed_time": "3:00:17", "remaining_time": "5:43:27"}
|
159 |
-
{"current_steps": 159, "total_steps": 459, "loss": 0.2616, "lr": 8.292556895325195e-06, "epoch": 1.0326441784548421, "percentage": 34.64, "elapsed_time": "3:01:03", "remaining_time": "5:41:37"}
|
160 |
-
{"current_steps": 160, "total_steps": 459, "loss": 0.2327, "lr": 8.263838780301182e-06, "epoch": 1.0391730141458106, "percentage": 34.86, "elapsed_time": "3:01:50", "remaining_time": "5:39:48"}
|
161 |
-
{"current_steps": 161, "total_steps": 459, "loss": 0.2552, "lr": 8.234931811251739e-06, "epoch": 1.0457018498367792, "percentage": 35.08, "elapsed_time": "3:02:55", "remaining_time": "5:38:35"}
|
162 |
-
{"current_steps": 162, "total_steps": 459, "loss": 0.2209, "lr": 8.205837660807726e-06, "epoch": 1.0522306855277475, "percentage": 35.29, "elapsed_time": "3:04:12", "remaining_time": "5:37:43"}
|
163 |
-
{"current_steps": 163, "total_steps": 459, "loss": 0.2481, "lr": 8.176558012430792e-06, "epoch": 1.058759521218716, "percentage": 35.51, "elapsed_time": "3:05:27", "remaining_time": "5:36:47"}
|
164 |
-
{"current_steps": 164, "total_steps": 459, "loss": 0.2416, "lr": 8.147094560315978e-06, "epoch": 1.0652883569096845, "percentage": 35.73, "elapsed_time": "3:06:28", "remaining_time": "5:35:26"}
|
165 |
-
{"current_steps": 165, "total_steps": 459, "loss": 0.2242, "lr": 8.117449009293668e-06, "epoch": 1.071817192600653, "percentage": 35.95, "elapsed_time": "3:07:19", "remaining_time": "5:33:47"}
|
166 |
-
{"current_steps": 166, "total_steps": 459, "loss": 0.2067, "lr": 8.08762307473096e-06, "epoch": 1.0783460282916213, "percentage": 36.17, "elapsed_time": "3:08:26", "remaining_time": "5:32:36"}
|
167 |
-
{"current_steps": 167, "total_steps": 459, "loss": 0.2331, "lr": 8.057618482432399e-06, "epoch": 1.0848748639825898, "percentage": 36.38, "elapsed_time": "3:09:30", "remaining_time": "5:31:22"}
|
168 |
-
{"current_steps": 168, "total_steps": 459, "loss": 0.2306, "lr": 8.027436968540124e-06, "epoch": 1.0914036996735583, "percentage": 36.6, "elapsed_time": "3:10:32", "remaining_time": "5:30:02"}
|
169 |
-
{"current_steps": 169, "total_steps": 459, "loss": 0.2367, "lr": 7.997080279433402e-06, "epoch": 1.0979325353645266, "percentage": 36.82, "elapsed_time": "3:11:26", "remaining_time": "5:28:31"}
|
170 |
-
{"current_steps": 170, "total_steps": 459, "loss": 0.2326, "lr": 7.966550171627592e-06, "epoch": 1.1044613710554951, "percentage": 37.04, "elapsed_time": "3:12:47", "remaining_time": "5:27:45"}
|
171 |
-
{"current_steps": 171, "total_steps": 459, "loss": 0.2341, "lr": 7.935848411672499e-06, "epoch": 1.1109902067464636, "percentage": 37.25, "elapsed_time": "3:13:55", "remaining_time": "5:26:36"}
|
172 |
-
{"current_steps": 172, "total_steps": 459, "loss": 0.2124, "lr": 7.904976776050156e-06, "epoch": 1.117519042437432, "percentage": 37.47, "elapsed_time": "3:14:57", "remaining_time": "5:25:18"}
|
173 |
-
{"current_steps": 173, "total_steps": 459, "loss": 0.2319, "lr": 7.873937051072037e-06, "epoch": 1.1240478781284005, "percentage": 37.69, "elapsed_time": "3:16:17", "remaining_time": "5:24:29"}
|
174 |
-
{"current_steps": 174, "total_steps": 459, "loss": 0.2132, "lr": 7.842731032775688e-06, "epoch": 1.130576713819369, "percentage": 37.91, "elapsed_time": "3:17:15", "remaining_time": "5:23:06"}
|
175 |
-
{"current_steps": 175, "total_steps": 459, "loss": 0.2129, "lr": 7.81136052682082e-06, "epoch": 1.1371055495103373, "percentage": 38.13, "elapsed_time": "3:18:00", "remaining_time": "5:21:20"}
|
176 |
-
{"current_steps": 176, "total_steps": 459, "loss": 0.2435, "lr": 7.779827348384814e-06, "epoch": 1.1436343852013058, "percentage": 38.34, "elapsed_time": "3:19:08", "remaining_time": "5:20:12"}
|
177 |
-
{"current_steps": 177, "total_steps": 459, "loss": 0.2242, "lr": 7.748133322057693e-06, "epoch": 1.1501632208922743, "percentage": 38.56, "elapsed_time": "3:20:14", "remaining_time": "5:19:01"}
|
178 |
-
{"current_steps": 178, "total_steps": 459, "loss": 0.226, "lr": 7.716280281736553e-06, "epoch": 1.1566920565832426, "percentage": 38.78, "elapsed_time": "3:21:10", "remaining_time": "5:17:35"}
|
179 |
-
{"current_steps": 179, "total_steps": 459, "loss": 0.2564, "lr": 7.68427007051944e-06, "epoch": 1.163220892274211, "percentage": 39.0, "elapsed_time": "3:22:27", "remaining_time": "5:16:42"}
|
180 |
-
{"current_steps": 180, "total_steps": 459, "loss": 0.2273, "lr": 7.652104540598712e-06, "epoch": 1.1697497279651796, "percentage": 39.22, "elapsed_time": "3:23:20", "remaining_time": "5:15:10"}
|
181 |
-
{"current_steps": 181, "total_steps": 459, "loss": 0.2425, "lr": 7.619785553153864e-06, "epoch": 1.176278563656148, "percentage": 39.43, "elapsed_time": "3:24:28", "remaining_time": "5:14:03"}
|
182 |
-
{"current_steps": 182, "total_steps": 459, "loss": 0.2365, "lr": 7.5873149782438295e-06, "epoch": 1.1828073993471164, "percentage": 39.65, "elapsed_time": "3:25:33", "remaining_time": "5:12:51"}
|
183 |
-
{"current_steps": 183, "total_steps": 459, "loss": 0.2224, "lr": 7.554694694698783e-06, "epoch": 1.189336235038085, "percentage": 39.87, "elapsed_time": "3:26:40", "remaining_time": "5:11:42"}
|
184 |
-
{"current_steps": 184, "total_steps": 459, "loss": 0.2155, "lr": 7.521926590011419e-06, "epoch": 1.1958650707290532, "percentage": 40.09, "elapsed_time": "3:27:35", "remaining_time": "5:10:16"}
|
185 |
-
{"current_steps": 185, "total_steps": 459, "loss": 0.2278, "lr": 7.489012560227742e-06, "epoch": 1.2023939064200218, "percentage": 40.31, "elapsed_time": "3:28:26", "remaining_time": "5:08:42"}
|
186 |
-
{"current_steps": 186, "total_steps": 459, "loss": 0.2062, "lr": 7.455954509837352e-06, "epoch": 1.2089227421109903, "percentage": 40.52, "elapsed_time": "3:29:21", "remaining_time": "5:07:16"}
|
187 |
-
{"current_steps": 187, "total_steps": 459, "loss": 0.2225, "lr": 7.422754351663252e-06, "epoch": 1.2154515778019586, "percentage": 40.74, "elapsed_time": "3:30:18", "remaining_time": "5:05:53"}
|
188 |
-
{"current_steps": 188, "total_steps": 459, "loss": 0.2277, "lr": 7.389414006751159e-06, "epoch": 1.221980413492927, "percentage": 40.96, "elapsed_time": "3:31:22", "remaining_time": "5:04:41"}
|
189 |
-
{"current_steps": 189, "total_steps": 459, "loss": 0.2145, "lr": 7.355935404258354e-06, "epoch": 1.2285092491838956, "percentage": 41.18, "elapsed_time": "3:32:41", "remaining_time": "5:03:50"}
|
190 |
-
{"current_steps": 190, "total_steps": 459, "loss": 0.2266, "lr": 7.322320481342053e-06, "epoch": 1.2350380848748639, "percentage": 41.39, "elapsed_time": "3:33:43", "remaining_time": "5:02:35"}
|
191 |
-
{"current_steps": 191, "total_steps": 459, "loss": 0.2164, "lr": 7.288571183047321e-06, "epoch": 1.2415669205658324, "percentage": 41.61, "elapsed_time": "3:34:51", "remaining_time": "5:01:28"}
|
192 |
-
{"current_steps": 192, "total_steps": 459, "loss": 0.2059, "lr": 7.254689462194522e-06, "epoch": 1.248095756256801, "percentage": 41.83, "elapsed_time": "3:36:09", "remaining_time": "5:00:36"}
|
193 |
-
{"current_steps": 193, "total_steps": 459, "loss": 0.2232, "lr": 7.220677279266327e-06, "epoch": 1.2546245919477692, "percentage": 42.05, "elapsed_time": "3:37:35", "remaining_time": "4:59:53"}
|
194 |
-
{"current_steps": 194, "total_steps": 459, "loss": 0.2084, "lr": 7.186536602294278e-06, "epoch": 1.2611534276387377, "percentage": 42.27, "elapsed_time": "3:39:05", "remaining_time": "4:59:17"}
|
195 |
-
{"current_steps": 195, "total_steps": 459, "loss": 0.234, "lr": 7.152269406744904e-06, "epoch": 1.2676822633297062, "percentage": 42.48, "elapsed_time": "3:40:17", "remaining_time": "4:58:13"}
|
196 |
-
{"current_steps": 196, "total_steps": 459, "loss": 0.2084, "lr": 7.117877675405427e-06, "epoch": 1.2742110990206745, "percentage": 42.7, "elapsed_time": "3:41:34", "remaining_time": "4:57:18"}
|
197 |
-
{"current_steps": 197, "total_steps": 459, "loss": 0.2317, "lr": 7.083363398269022e-06, "epoch": 1.280739934711643, "percentage": 42.92, "elapsed_time": "3:42:42", "remaining_time": "4:56:11"}
|
198 |
-
{"current_steps": 198, "total_steps": 459, "loss": 0.2487, "lr": 7.048728572419681e-06, "epoch": 1.2872687704026116, "percentage": 43.14, "elapsed_time": "3:43:50", "remaining_time": "4:55:03"}
|
199 |
-
{"current_steps": 199, "total_steps": 459, "loss": 0.2421, "lr": 7.0139752019166474e-06, "epoch": 1.2937976060935799, "percentage": 43.36, "elapsed_time": "3:45:05", "remaining_time": "4:54:05"}
|
200 |
-
{"current_steps": 200, "total_steps": 459, "loss": 0.2244, "lr": 6.979105297678462e-06, "epoch": 1.3003264417845484, "percentage": 43.57, "elapsed_time": "3:46:03", "remaining_time": "4:52:45"}
|
201 |
-
{"current_steps": 201, "total_steps": 459, "loss": 0.2394, "lr": 6.944120877366605e-06, "epoch": 1.3068552774755169, "percentage": 43.79, "elapsed_time": "3:50:42", "remaining_time": "4:56:08"}
|
202 |
-
{"current_steps": 202, "total_steps": 459, "loss": 0.2167, "lr": 6.909023965268746e-06, "epoch": 1.3133841131664852, "percentage": 44.01, "elapsed_time": "3:51:54", "remaining_time": "4:55:03"}
|
203 |
-
{"current_steps": 203, "total_steps": 459, "loss": 0.2505, "lr": 6.873816592181617e-06, "epoch": 1.3199129488574537, "percentage": 44.23, "elapsed_time": "3:53:17", "remaining_time": "4:54:12"}
|
204 |
-
{"current_steps": 204, "total_steps": 459, "loss": 0.251, "lr": 6.838500795293506e-06, "epoch": 1.3264417845484222, "percentage": 44.44, "elapsed_time": "3:54:24", "remaining_time": "4:53:00"}
|
205 |
-
{"current_steps": 205, "total_steps": 459, "loss": 0.222, "lr": 6.803078618066378e-06, "epoch": 1.3329706202393907, "percentage": 44.66, "elapsed_time": "3:55:22", "remaining_time": "4:51:37"}
|
206 |
-
{"current_steps": 206, "total_steps": 459, "loss": 0.2264, "lr": 6.767552110117631e-06, "epoch": 1.339499455930359, "percentage": 44.88, "elapsed_time": "3:56:46", "remaining_time": "4:50:47"}
|
207 |
-
{"current_steps": 207, "total_steps": 459, "loss": 0.2501, "lr": 6.7319233271015104e-06, "epoch": 1.3460282916213275, "percentage": 45.1, "elapsed_time": "3:58:01", "remaining_time": "4:49:45"}
|
208 |
-
{"current_steps": 208, "total_steps": 459, "loss": 0.2351, "lr": 6.6961943305901515e-06, "epoch": 1.352557127312296, "percentage": 45.32, "elapsed_time": "3:58:55", "remaining_time": "4:48:19"}
|
209 |
-
{"current_steps": 209, "total_steps": 459, "loss": 0.2136, "lr": 6.660367187954304e-06, "epoch": 1.3590859630032643, "percentage": 45.53, "elapsed_time": "3:59:54", "remaining_time": "4:46:57"}
|
210 |
-
{"current_steps": 210, "total_steps": 459, "loss": 0.1964, "lr": 6.6244439722436985e-06, "epoch": 1.3656147986942329, "percentage": 45.75, "elapsed_time": "4:00:56", "remaining_time": "4:45:40"}
|
211 |
-
{"current_steps": 211, "total_steps": 459, "loss": 0.2181, "lr": 6.588426762067099e-06, "epoch": 1.3721436343852014, "percentage": 45.97, "elapsed_time": "4:01:50", "remaining_time": "4:44:14"}
|
212 |
-
{"current_steps": 212, "total_steps": 459, "loss": 0.2542, "lr": 6.552317641472027e-06, "epoch": 1.3786724700761699, "percentage": 46.19, "elapsed_time": "4:03:04", "remaining_time": "4:43:12"}
|
213 |
-
{"current_steps": 213, "total_steps": 459, "loss": 0.2228, "lr": 6.516118699824179e-06, "epoch": 1.3852013057671382, "percentage": 46.41, "elapsed_time": "4:04:07", "remaining_time": "4:41:57"}
|
214 |
-
{"current_steps": 214, "total_steps": 459, "loss": 0.2146, "lr": 6.479832031686522e-06, "epoch": 1.3917301414581067, "percentage": 46.62, "elapsed_time": "4:05:06", "remaining_time": "4:40:36"}
|
215 |
-
{"current_steps": 215, "total_steps": 459, "loss": 0.1831, "lr": 6.443459736698106e-06, "epoch": 1.3982589771490752, "percentage": 46.84, "elapsed_time": "4:06:05", "remaining_time": "4:39:16"}
|
216 |
-
{"current_steps": 216, "total_steps": 459, "loss": 0.2096, "lr": 6.407003919452565e-06, "epoch": 1.4047878128400435, "percentage": 47.06, "elapsed_time": "4:07:44", "remaining_time": "4:38:42"}
|
217 |
-
{"current_steps": 217, "total_steps": 459, "loss": 0.2558, "lr": 6.370466689376343e-06, "epoch": 1.411316648531012, "percentage": 47.28, "elapsed_time": "4:08:50", "remaining_time": "4:37:30"}
|
218 |
-
{"current_steps": 218, "total_steps": 459, "loss": 0.2302, "lr": 6.333850160606641e-06, "epoch": 1.4178454842219805, "percentage": 47.49, "elapsed_time": "4:10:21", "remaining_time": "4:36:45"}
|
219 |
-
{"current_steps": 219, "total_steps": 459, "loss": 0.2063, "lr": 6.297156451869082e-06, "epoch": 1.4243743199129488, "percentage": 47.71, "elapsed_time": "4:11:32", "remaining_time": "4:35:39"}
|
220 |
-
{"current_steps": 220, "total_steps": 459, "loss": 0.2393, "lr": 6.260387686355121e-06, "epoch": 1.4309031556039173, "percentage": 47.93, "elapsed_time": "4:12:42", "remaining_time": "4:34:32"}
|
221 |
-
{"current_steps": 221, "total_steps": 459, "loss": 0.2343, "lr": 6.223545991599184e-06, "epoch": 1.4374319912948859, "percentage": 48.15, "elapsed_time": "4:14:08", "remaining_time": "4:33:40"}
|
222 |
-
{"current_steps": 222, "total_steps": 459, "loss": 0.2372, "lr": 6.186633499355576e-06, "epoch": 1.4439608269858542, "percentage": 48.37, "elapsed_time": "4:15:24", "remaining_time": "4:32:39"}
|
223 |
-
{"current_steps": 223, "total_steps": 459, "loss": 0.2165, "lr": 6.149652345475118e-06, "epoch": 1.4504896626768227, "percentage": 48.58, "elapsed_time": "4:16:31", "remaining_time": "4:31:29"}
|
224 |
-
{"current_steps": 224, "total_steps": 459, "loss": 0.2251, "lr": 6.112604669781572e-06, "epoch": 1.4570184983677912, "percentage": 48.8, "elapsed_time": "4:17:33", "remaining_time": "4:30:12"}
|
225 |
-
{"current_steps": 225, "total_steps": 459, "loss": 0.2428, "lr": 6.075492615947824e-06, "epoch": 1.4635473340587595, "percentage": 49.02, "elapsed_time": "4:18:40", "remaining_time": "4:29:01"}
|
226 |
-
{"current_steps": 226, "total_steps": 459, "loss": 0.2233, "lr": 6.038318331371836e-06, "epoch": 1.470076169749728, "percentage": 49.24, "elapsed_time": "4:19:44", "remaining_time": "4:27:47"}
|
227 |
-
{"current_steps": 227, "total_steps": 459, "loss": 0.2521, "lr": 6.001083967052408e-06, "epoch": 1.4766050054406965, "percentage": 49.46, "elapsed_time": "4:20:41", "remaining_time": "4:26:26"}
|
228 |
-
{"current_steps": 228, "total_steps": 459, "loss": 0.2164, "lr": 5.963791677464696e-06, "epoch": 1.4831338411316648, "percentage": 49.67, "elapsed_time": "4:21:41", "remaining_time": "4:25:08"}
|
229 |
-
{"current_steps": 229, "total_steps": 459, "loss": 0.2429, "lr": 5.926443620435572e-06, "epoch": 1.4896626768226333, "percentage": 49.89, "elapsed_time": "4:23:05", "remaining_time": "4:24:14"}
|
230 |
-
{"current_steps": 230, "total_steps": 459, "loss": 0.2468, "lr": 5.889041957018745e-06, "epoch": 1.4961915125136018, "percentage": 50.11, "elapsed_time": "4:24:13", "remaining_time": "4:23:04"}
|
231 |
-
{"current_steps": 231, "total_steps": 459, "loss": 0.2496, "lr": 5.85158885136973e-06, "epoch": 1.5027203482045701, "percentage": 50.33, "elapsed_time": "4:25:12", "remaining_time": "4:21:45"}
|
232 |
-
{"current_steps": 232, "total_steps": 459, "loss": 0.2163, "lr": 5.81408647062062e-06, "epoch": 1.5092491838955386, "percentage": 50.54, "elapsed_time": "4:26:37", "remaining_time": "4:20:52"}
|
233 |
-
{"current_steps": 233, "total_steps": 459, "loss": 0.2084, "lr": 5.776536984754691e-06, "epoch": 1.5157780195865072, "percentage": 50.76, "elapsed_time": "4:27:46", "remaining_time": "4:19:44"}
|
234 |
-
{"current_steps": 234, "total_steps": 459, "loss": 0.2521, "lr": 5.738942566480839e-06, "epoch": 1.5223068552774754, "percentage": 50.98, "elapsed_time": "4:28:51", "remaining_time": "4:18:31"}
|
235 |
-
{"current_steps": 235, "total_steps": 459, "loss": 0.2324, "lr": 5.701305391107868e-06, "epoch": 1.528835690968444, "percentage": 51.2, "elapsed_time": "4:29:52", "remaining_time": "4:17:14"}
|
236 |
-
{"current_steps": 236, "total_steps": 459, "loss": 0.2323, "lr": 5.663627636418611e-06, "epoch": 1.5353645266594125, "percentage": 51.42, "elapsed_time": "4:31:06", "remaining_time": "4:16:10"}
|
237 |
-
{"current_steps": 237, "total_steps": 459, "loss": 0.2225, "lr": 5.625911482543928e-06, "epoch": 1.5418933623503808, "percentage": 51.63, "elapsed_time": "4:32:16", "remaining_time": "4:15:02"}
|
238 |
-
{"current_steps": 238, "total_steps": 459, "loss": 0.2364, "lr": 5.588159111836553e-06, "epoch": 1.5484221980413493, "percentage": 51.85, "elapsed_time": "4:33:27", "remaining_time": "4:13:55"}
|
239 |
-
{"current_steps": 239, "total_steps": 459, "loss": 0.2292, "lr": 5.5503727087448155e-06, "epoch": 1.5549510337323178, "percentage": 52.07, "elapsed_time": "4:34:30", "remaining_time": "4:12:41"}
|
240 |
-
{"current_steps": 240, "total_steps": 459, "loss": 0.2346, "lr": 5.5125544596862505e-06, "epoch": 1.561479869423286, "percentage": 52.29, "elapsed_time": "4:35:39", "remaining_time": "4:11:32"}
|
241 |
-
{"current_steps": 241, "total_steps": 459, "loss": 0.2435, "lr": 5.474706552921074e-06, "epoch": 1.5680087051142546, "percentage": 52.51, "elapsed_time": "4:36:51", "remaining_time": "4:10:26"}
|
242 |
-
{"current_steps": 242, "total_steps": 459, "loss": 0.2172, "lr": 5.436831178425582e-06, "epoch": 1.5745375408052231, "percentage": 52.72, "elapsed_time": "4:38:22", "remaining_time": "4:09:37"}
|
243 |
-
{"current_steps": 243, "total_steps": 459, "loss": 0.2201, "lr": 5.398930527765416e-06, "epoch": 1.5810663764961914, "percentage": 52.94, "elapsed_time": "4:39:16", "remaining_time": "4:08:14"}
|
244 |
-
{"current_steps": 244, "total_steps": 459, "loss": 0.2375, "lr": 5.361006793968764e-06, "epoch": 1.58759521218716, "percentage": 53.16, "elapsed_time": "4:40:26", "remaining_time": "4:07:06"}
|
245 |
-
{"current_steps": 245, "total_steps": 459, "loss": 0.2265, "lr": 5.32306217139946e-06, "epoch": 1.5941240478781284, "percentage": 53.38, "elapsed_time": "4:41:23", "remaining_time": "4:05:47"}
|
246 |
-
{"current_steps": 246, "total_steps": 459, "loss": 0.239, "lr": 5.28509885563002e-06, "epoch": 1.6006528835690967, "percentage": 53.59, "elapsed_time": "4:42:27", "remaining_time": "4:04:34"}
|
247 |
-
{"current_steps": 247, "total_steps": 459, "loss": 0.2314, "lr": 5.247119043314592e-06, "epoch": 1.6071817192600653, "percentage": 53.81, "elapsed_time": "4:43:46", "remaining_time": "4:03:33"}
|
248 |
-
{"current_steps": 248, "total_steps": 459, "loss": 0.2525, "lr": 5.209124932061862e-06, "epoch": 1.6137105549510338, "percentage": 54.03, "elapsed_time": "4:45:09", "remaining_time": "4:02:37"}
|
249 |
-
{"current_steps": 249, "total_steps": 459, "loss": 0.2214, "lr": 5.1711187203078826e-06, "epoch": 1.620239390642002, "percentage": 54.25, "elapsed_time": "4:45:56", "remaining_time": "4:01:09"}
|
250 |
-
{"current_steps": 250, "total_steps": 459, "loss": 0.1996, "lr": 5.133102607188875e-06, "epoch": 1.6267682263329706, "percentage": 54.47, "elapsed_time": "4:46:57", "remaining_time": "3:59:53"}
|
251 |
-
{"current_steps": 251, "total_steps": 459, "loss": 0.2345, "lr": 5.095078792413976e-06, "epoch": 1.633297062023939, "percentage": 54.68, "elapsed_time": "4:48:15", "remaining_time": "3:58:52"}
|
252 |
-
{"current_steps": 252, "total_steps": 459, "loss": 0.2248, "lr": 5.057049476137968e-06, "epoch": 1.6398258977149074, "percentage": 54.9, "elapsed_time": "4:49:09", "remaining_time": "3:57:31"}
|
253 |
-
{"current_steps": 253, "total_steps": 459, "loss": 0.2286, "lr": 5.019016858833954e-06, "epoch": 1.646354733405876, "percentage": 55.12, "elapsed_time": "4:49:52", "remaining_time": "3:56:01"}
|
254 |
-
{"current_steps": 254, "total_steps": 459, "loss": 0.2224, "lr": 4.980983141166047e-06, "epoch": 1.6528835690968444, "percentage": 55.34, "elapsed_time": "4:51:07", "remaining_time": "3:54:57"}
|
255 |
-
{"current_steps": 255, "total_steps": 459, "loss": 0.2036, "lr": 4.942950523862033e-06, "epoch": 1.6594124047878127, "percentage": 55.56, "elapsed_time": "4:52:31", "remaining_time": "3:54:00"}
|
256 |
-
{"current_steps": 256, "total_steps": 459, "loss": 0.2028, "lr": 4.904921207586025e-06, "epoch": 1.6659412404787814, "percentage": 55.77, "elapsed_time": "4:54:01", "remaining_time": "3:53:09"}
|
257 |
-
{"current_steps": 257, "total_steps": 459, "loss": 0.1781, "lr": 4.866897392811127e-06, "epoch": 1.6724700761697497, "percentage": 55.99, "elapsed_time": "4:55:20", "remaining_time": "3:52:08"}
|
258 |
-
{"current_steps": 258, "total_steps": 459, "loss": 0.2158, "lr": 4.828881279692118e-06, "epoch": 1.678998911860718, "percentage": 56.21, "elapsed_time": "4:56:32", "remaining_time": "3:51:01"}
|
259 |
-
{"current_steps": 259, "total_steps": 459, "loss": 0.1823, "lr": 4.7908750679381386e-06, "epoch": 1.6855277475516868, "percentage": 56.43, "elapsed_time": "4:57:39", "remaining_time": "3:49:51"}
|
260 |
-
{"current_steps": 260, "total_steps": 459, "loss": 0.234, "lr": 4.752880956685407e-06, "epoch": 1.692056583242655, "percentage": 56.64, "elapsed_time": "4:59:04", "remaining_time": "3:48:54"}
|
261 |
-
{"current_steps": 261, "total_steps": 459, "loss": 0.235, "lr": 4.714901144369982e-06, "epoch": 1.6985854189336234, "percentage": 56.86, "elapsed_time": "5:00:15", "remaining_time": "3:47:47"}
|
262 |
-
{"current_steps": 262, "total_steps": 459, "loss": 0.2225, "lr": 4.676937828600542e-06, "epoch": 1.705114254624592, "percentage": 57.08, "elapsed_time": "5:01:19", "remaining_time": "3:46:34"}
|
263 |
-
{"current_steps": 263, "total_steps": 459, "loss": 0.2081, "lr": 4.638993206031238e-06, "epoch": 1.7116430903155604, "percentage": 57.3, "elapsed_time": "5:02:42", "remaining_time": "3:45:35"}
|
264 |
-
{"current_steps": 264, "total_steps": 459, "loss": 0.2295, "lr": 4.601069472234584e-06, "epoch": 1.7181719260065287, "percentage": 57.52, "elapsed_time": "5:03:45", "remaining_time": "3:44:22"}
|
265 |
-
{"current_steps": 265, "total_steps": 459, "loss": 0.2466, "lr": 4.56316882157442e-06, "epoch": 1.7247007616974974, "percentage": 57.73, "elapsed_time": "5:04:45", "remaining_time": "3:43:06"}
|
266 |
-
{"current_steps": 266, "total_steps": 459, "loss": 0.2273, "lr": 4.525293447078927e-06, "epoch": 1.7312295973884657, "percentage": 57.95, "elapsed_time": "5:06:03", "remaining_time": "3:42:04"}
|
267 |
-
{"current_steps": 267, "total_steps": 459, "loss": 0.208, "lr": 4.487445540313752e-06, "epoch": 1.737758433079434, "percentage": 58.17, "elapsed_time": "5:07:14", "remaining_time": "3:40:56"}
|
268 |
-
{"current_steps": 268, "total_steps": 459, "loss": 0.2209, "lr": 4.4496272912551845e-06, "epoch": 1.7442872687704027, "percentage": 58.39, "elapsed_time": "5:08:35", "remaining_time": "3:39:55"}
|
269 |
-
{"current_steps": 269, "total_steps": 459, "loss": 0.2078, "lr": 4.411840888163449e-06, "epoch": 1.750816104461371, "percentage": 58.61, "elapsed_time": "5:09:37", "remaining_time": "3:38:41"}
|
270 |
-
{"current_steps": 270, "total_steps": 459, "loss": 0.2414, "lr": 4.374088517456074e-06, "epoch": 1.7573449401523396, "percentage": 58.82, "elapsed_time": "5:10:51", "remaining_time": "3:37:36"}
|
271 |
-
{"current_steps": 271, "total_steps": 459, "loss": 0.2282, "lr": 4.336372363581391e-06, "epoch": 1.763873775843308, "percentage": 59.04, "elapsed_time": "5:11:51", "remaining_time": "3:36:20"}
|
272 |
-
{"current_steps": 272, "total_steps": 459, "loss": 0.2262, "lr": 4.298694608892134e-06, "epoch": 1.7704026115342764, "percentage": 59.26, "elapsed_time": "5:13:03", "remaining_time": "3:35:13"}
|
273 |
-
{"current_steps": 273, "total_steps": 459, "loss": 0.2522, "lr": 4.2610574335191615e-06, "epoch": 1.7769314472252449, "percentage": 59.48, "elapsed_time": "5:14:10", "remaining_time": "3:34:02"}
|
274 |
-
{"current_steps": 274, "total_steps": 459, "loss": 0.2475, "lr": 4.223463015245311e-06, "epoch": 1.7834602829162134, "percentage": 59.69, "elapsed_time": "5:15:19", "remaining_time": "3:32:54"}
|
275 |
-
{"current_steps": 275, "total_steps": 459, "loss": 0.213, "lr": 4.185913529379381e-06, "epoch": 1.7899891186071817, "percentage": 59.91, "elapsed_time": "5:16:24", "remaining_time": "3:31:42"}
|
276 |
-
{"current_steps": 276, "total_steps": 459, "loss": 0.1942, "lr": 4.148411148630271e-06, "epoch": 1.7965179542981502, "percentage": 60.13, "elapsed_time": "5:17:32", "remaining_time": "3:30:32"}
|
277 |
-
{"current_steps": 277, "total_steps": 459, "loss": 0.1973, "lr": 4.110958042981256e-06, "epoch": 1.8030467899891187, "percentage": 60.35, "elapsed_time": "5:18:58", "remaining_time": "3:29:34"}
|
278 |
-
{"current_steps": 278, "total_steps": 459, "loss": 0.2296, "lr": 4.073556379564429e-06, "epoch": 1.809575625680087, "percentage": 60.57, "elapsed_time": "5:20:09", "remaining_time": "3:28:27"}
|
279 |
-
{"current_steps": 279, "total_steps": 459, "loss": 0.2288, "lr": 4.036208322535304e-06, "epoch": 1.8161044613710555, "percentage": 60.78, "elapsed_time": "5:21:17", "remaining_time": "3:27:17"}
|
280 |
-
{"current_steps": 280, "total_steps": 459, "loss": 0.2085, "lr": 3.998916032947594e-06, "epoch": 1.822633297062024, "percentage": 61.0, "elapsed_time": "5:22:08", "remaining_time": "3:25:56"}
|
281 |
-
{"current_steps": 281, "total_steps": 459, "loss": 0.2258, "lr": 3.9616816686281636e-06, "epoch": 1.8291621327529923, "percentage": 61.22, "elapsed_time": "5:23:08", "remaining_time": "3:24:41"}
|
282 |
-
{"current_steps": 282, "total_steps": 459, "loss": 0.1992, "lr": 3.924507384052177e-06, "epoch": 1.8356909684439608, "percentage": 61.44, "elapsed_time": "5:24:25", "remaining_time": "3:23:37"}
|
283 |
-
{"current_steps": 283, "total_steps": 459, "loss": 0.2175, "lr": 3.887395330218429e-06, "epoch": 1.8422198041349294, "percentage": 61.66, "elapsed_time": "5:25:29", "remaining_time": "3:22:25"}
|
284 |
-
{"current_steps": 284, "total_steps": 459, "loss": 0.2317, "lr": 3.850347654524884e-06, "epoch": 1.8487486398258977, "percentage": 61.87, "elapsed_time": "5:26:33", "remaining_time": "3:21:13"}
|
285 |
-
{"current_steps": 285, "total_steps": 459, "loss": 0.1964, "lr": 3.813366500644426e-06, "epoch": 1.8552774755168662, "percentage": 62.09, "elapsed_time": "5:27:49", "remaining_time": "3:20:08"}
|
286 |
-
{"current_steps": 286, "total_steps": 459, "loss": 0.1872, "lr": 3.7764540084008166e-06, "epoch": 1.8618063112078347, "percentage": 62.31, "elapsed_time": "5:29:22", "remaining_time": "3:19:14"}
|
287 |
-
{"current_steps": 287, "total_steps": 459, "loss": 0.2079, "lr": 3.7396123136448824e-06, "epoch": 1.868335146898803, "percentage": 62.53, "elapsed_time": "5:30:21", "remaining_time": "3:17:58"}
|
288 |
-
{"current_steps": 288, "total_steps": 459, "loss": 0.2197, "lr": 3.70284354813092e-06, "epoch": 1.8748639825897715, "percentage": 62.75, "elapsed_time": "5:31:27", "remaining_time": "3:16:48"}
|
289 |
-
{"current_steps": 289, "total_steps": 459, "loss": 0.2046, "lr": 3.6661498393933612e-06, "epoch": 1.88139281828074, "percentage": 62.96, "elapsed_time": "5:32:43", "remaining_time": "3:15:43"}
|
290 |
-
{"current_steps": 290, "total_steps": 459, "loss": 0.2234, "lr": 3.629533310623658e-06, "epoch": 1.8879216539717083, "percentage": 63.18, "elapsed_time": "5:33:45", "remaining_time": "3:14:29"}
|
291 |
-
{"current_steps": 291, "total_steps": 459, "loss": 0.2332, "lr": 3.5929960805474386e-06, "epoch": 1.8944504896626768, "percentage": 63.4, "elapsed_time": "5:35:02", "remaining_time": "3:13:25"}
|
292 |
-
{"current_steps": 292, "total_steps": 459, "loss": 0.2372, "lr": 3.5565402633018963e-06, "epoch": 1.9009793253536453, "percentage": 63.62, "elapsed_time": "5:36:08", "remaining_time": "3:12:14"}
|
293 |
-
{"current_steps": 293, "total_steps": 459, "loss": 0.222, "lr": 3.5201679683134793e-06, "epoch": 1.9075081610446136, "percentage": 63.83, "elapsed_time": "5:37:36", "remaining_time": "3:11:16"}
|
294 |
-
{"current_steps": 294, "total_steps": 459, "loss": 0.2132, "lr": 3.483881300175823e-06, "epoch": 1.9140369967355821, "percentage": 64.05, "elapsed_time": "5:38:33", "remaining_time": "3:10:00"}
|
295 |
-
{"current_steps": 295, "total_steps": 459, "loss": 0.2202, "lr": 3.4476823585279745e-06, "epoch": 1.9205658324265507, "percentage": 64.27, "elapsed_time": "5:39:44", "remaining_time": "3:08:52"}
|
296 |
-
{"current_steps": 296, "total_steps": 459, "loss": 0.2177, "lr": 3.4115732379329038e-06, "epoch": 1.927094668117519, "percentage": 64.49, "elapsed_time": "5:40:58", "remaining_time": "3:07:45"}
|
297 |
-
{"current_steps": 297, "total_steps": 459, "loss": 0.2268, "lr": 3.3755560277563028e-06, "epoch": 1.9336235038084875, "percentage": 64.71, "elapsed_time": "5:41:52", "remaining_time": "3:06:28"}
|
298 |
-
{"current_steps": 298, "total_steps": 459, "loss": 0.2032, "lr": 3.3396328120456968e-06, "epoch": 1.940152339499456, "percentage": 64.92, "elapsed_time": "5:43:01", "remaining_time": "3:05:19"}
|
299 |
-
{"current_steps": 299, "total_steps": 459, "loss": 0.2254, "lr": 3.3038056694098485e-06, "epoch": 1.9466811751904243, "percentage": 65.14, "elapsed_time": "5:43:58", "remaining_time": "3:04:04"}
|
300 |
-
{"current_steps": 300, "total_steps": 459, "loss": 0.2407, "lr": 3.268076672898492e-06, "epoch": 1.9532100108813928, "percentage": 65.36, "elapsed_time": "5:45:01", "remaining_time": "3:02:52"}
|
301 |
-
{"current_steps": 301, "total_steps": 459, "loss": 0.2257, "lr": 3.232447889882371e-06, "epoch": 1.9597388465723613, "percentage": 65.58, "elapsed_time": "5:50:18", "remaining_time": "3:03:53"}
|
302 |
-
{"current_steps": 302, "total_steps": 459, "loss": 0.2206, "lr": 3.196921381933624e-06, "epoch": 1.9662676822633296, "percentage": 65.8, "elapsed_time": "5:51:31", "remaining_time": "3:02:44"}
|
303 |
-
{"current_steps": 303, "total_steps": 459, "loss": 0.2483, "lr": 3.1614992047064947e-06, "epoch": 1.9727965179542981, "percentage": 66.01, "elapsed_time": "5:52:22", "remaining_time": "3:01:25"}
|
|
|
1 |
+
{"current_steps": 1, "total_steps": 459, "loss": 0.9033, "lr": 0.0, "epoch": 0.006528835690968444, "percentage": 0.22, "elapsed_time": "0:01:30", "remaining_time": "11:28:26"}
|
2 |
+
{"current_steps": 2, "total_steps": 459, "loss": 0.8778, "lr": 2.173913043478261e-07, "epoch": 0.013057671381936888, "percentage": 0.44, "elapsed_time": "0:02:47", "remaining_time": "10:39:01"}
|
3 |
+
{"current_steps": 3, "total_steps": 459, "loss": 0.8486, "lr": 4.347826086956522e-07, "epoch": 0.01958650707290533, "percentage": 0.65, "elapsed_time": "0:04:15", "remaining_time": "10:47:59"}
|
4 |
+
{"current_steps": 4, "total_steps": 459, "loss": 0.8763, "lr": 6.521739130434783e-07, "epoch": 0.026115342763873776, "percentage": 0.87, "elapsed_time": "0:05:09", "remaining_time": "9:47:41"}
|
5 |
+
{"current_steps": 5, "total_steps": 459, "loss": 0.9429, "lr": 8.695652173913044e-07, "epoch": 0.03264417845484222, "percentage": 1.09, "elapsed_time": "0:06:23", "remaining_time": "9:40:44"}
|
6 |
+
{"current_steps": 6, "total_steps": 459, "loss": 0.8436, "lr": 1.0869565217391306e-06, "epoch": 0.03917301414581066, "percentage": 1.31, "elapsed_time": "0:07:31", "remaining_time": "9:28:02"}
|
7 |
+
{"current_steps": 7, "total_steps": 459, "loss": 0.8914, "lr": 1.3043478260869566e-06, "epoch": 0.04570184983677911, "percentage": 1.53, "elapsed_time": "0:08:41", "remaining_time": "9:21:06"}
|
8 |
+
{"current_steps": 8, "total_steps": 459, "loss": 0.799, "lr": 1.521739130434783e-06, "epoch": 0.05223068552774755, "percentage": 1.74, "elapsed_time": "0:09:37", "remaining_time": "9:03:02"}
|
9 |
+
{"current_steps": 9, "total_steps": 459, "loss": 0.8523, "lr": 1.7391304347826088e-06, "epoch": 0.058759521218716, "percentage": 1.96, "elapsed_time": "0:11:02", "remaining_time": "9:11:52"}
|
10 |
+
{"current_steps": 10, "total_steps": 459, "loss": 0.8531, "lr": 1.956521739130435e-06, "epoch": 0.06528835690968444, "percentage": 2.18, "elapsed_time": "0:12:19", "remaining_time": "9:13:43"}
|
11 |
+
{"current_steps": 11, "total_steps": 459, "loss": 0.7496, "lr": 2.173913043478261e-06, "epoch": 0.07181719260065289, "percentage": 2.4, "elapsed_time": "0:13:32", "remaining_time": "9:11:21"}
|
12 |
+
{"current_steps": 12, "total_steps": 459, "loss": 0.7624, "lr": 2.391304347826087e-06, "epoch": 0.07834602829162132, "percentage": 2.61, "elapsed_time": "0:14:34", "remaining_time": "9:03:04"}
|
13 |
+
{"current_steps": 13, "total_steps": 459, "loss": 0.8073, "lr": 2.6086956521739132e-06, "epoch": 0.08487486398258977, "percentage": 2.83, "elapsed_time": "0:15:38", "remaining_time": "8:56:30"}
|
14 |
+
{"current_steps": 14, "total_steps": 459, "loss": 0.7144, "lr": 2.8260869565217393e-06, "epoch": 0.09140369967355821, "percentage": 3.05, "elapsed_time": "0:16:55", "remaining_time": "8:57:45"}
|
15 |
+
{"current_steps": 15, "total_steps": 459, "loss": 0.6503, "lr": 3.043478260869566e-06, "epoch": 0.09793253536452666, "percentage": 3.27, "elapsed_time": "0:18:03", "remaining_time": "8:54:43"}
|
16 |
+
{"current_steps": 16, "total_steps": 459, "loss": 0.6791, "lr": 3.2608695652173914e-06, "epoch": 0.1044613710554951, "percentage": 3.49, "elapsed_time": "0:18:59", "remaining_time": "8:45:53"}
|
17 |
+
{"current_steps": 17, "total_steps": 459, "loss": 0.638, "lr": 3.4782608695652175e-06, "epoch": 0.11099020674646355, "percentage": 3.7, "elapsed_time": "0:20:15", "remaining_time": "8:46:45"}
|
18 |
+
{"current_steps": 18, "total_steps": 459, "loss": 0.5872, "lr": 3.6956521739130436e-06, "epoch": 0.117519042437432, "percentage": 3.92, "elapsed_time": "0:21:30", "remaining_time": "8:47:01"}
|
19 |
+
{"current_steps": 19, "total_steps": 459, "loss": 0.5898, "lr": 3.91304347826087e-06, "epoch": 0.12404787812840043, "percentage": 4.14, "elapsed_time": "0:22:42", "remaining_time": "8:45:47"}
|
20 |
+
{"current_steps": 20, "total_steps": 459, "loss": 0.5648, "lr": 4.130434782608696e-06, "epoch": 0.1305767138193689, "percentage": 4.36, "elapsed_time": "0:23:55", "remaining_time": "8:45:00"}
|
21 |
+
{"current_steps": 21, "total_steps": 459, "loss": 0.5785, "lr": 4.347826086956522e-06, "epoch": 0.13710554951033732, "percentage": 4.58, "elapsed_time": "0:24:52", "remaining_time": "8:38:41"}
|
22 |
+
{"current_steps": 22, "total_steps": 459, "loss": 0.5384, "lr": 4.565217391304348e-06, "epoch": 0.14363438520130578, "percentage": 4.79, "elapsed_time": "0:25:52", "remaining_time": "8:33:53"}
|
23 |
+
{"current_steps": 23, "total_steps": 459, "loss": 0.6126, "lr": 4.782608695652174e-06, "epoch": 0.1501632208922742, "percentage": 5.01, "elapsed_time": "0:26:57", "remaining_time": "8:30:59"}
|
24 |
+
{"current_steps": 24, "total_steps": 459, "loss": 0.5585, "lr": 5e-06, "epoch": 0.15669205658324264, "percentage": 5.23, "elapsed_time": "0:27:54", "remaining_time": "8:25:50"}
|
25 |
+
{"current_steps": 25, "total_steps": 459, "loss": 0.5076, "lr": 5.2173913043478265e-06, "epoch": 0.1632208922742111, "percentage": 5.45, "elapsed_time": "0:29:04", "remaining_time": "8:24:51"}
|
26 |
+
{"current_steps": 26, "total_steps": 459, "loss": 0.5539, "lr": 5.4347826086956525e-06, "epoch": 0.16974972796517954, "percentage": 5.66, "elapsed_time": "0:30:10", "remaining_time": "8:22:31"}
|
27 |
+
{"current_steps": 27, "total_steps": 459, "loss": 0.5259, "lr": 5.652173913043479e-06, "epoch": 0.176278563656148, "percentage": 5.88, "elapsed_time": "0:31:11", "remaining_time": "8:19:10"}
|
28 |
+
{"current_steps": 28, "total_steps": 459, "loss": 0.5336, "lr": 5.8695652173913055e-06, "epoch": 0.18280739934711643, "percentage": 6.1, "elapsed_time": "0:32:30", "remaining_time": "8:20:25"}
|
29 |
+
{"current_steps": 29, "total_steps": 459, "loss": 0.4915, "lr": 6.086956521739132e-06, "epoch": 0.1893362350380849, "percentage": 6.32, "elapsed_time": "0:33:30", "remaining_time": "8:16:51"}
|
30 |
+
{"current_steps": 30, "total_steps": 459, "loss": 0.4779, "lr": 6.304347826086958e-06, "epoch": 0.19586507072905332, "percentage": 6.54, "elapsed_time": "0:34:34", "remaining_time": "8:14:20"}
|
31 |
+
{"current_steps": 31, "total_steps": 459, "loss": 0.5092, "lr": 6.521739130434783e-06, "epoch": 0.20239390642002175, "percentage": 6.75, "elapsed_time": "0:35:39", "remaining_time": "8:12:21"}
|
32 |
+
{"current_steps": 32, "total_steps": 459, "loss": 0.4959, "lr": 6.739130434782609e-06, "epoch": 0.2089227421109902, "percentage": 6.97, "elapsed_time": "0:36:36", "remaining_time": "8:08:27"}
|
33 |
+
{"current_steps": 33, "total_steps": 459, "loss": 0.5217, "lr": 6.956521739130435e-06, "epoch": 0.21545157780195864, "percentage": 7.19, "elapsed_time": "0:37:46", "remaining_time": "8:07:37"}
|
34 |
+
{"current_steps": 34, "total_steps": 459, "loss": 0.5079, "lr": 7.173913043478261e-06, "epoch": 0.2219804134929271, "percentage": 7.41, "elapsed_time": "0:38:49", "remaining_time": "8:05:14"}
|
35 |
+
{"current_steps": 35, "total_steps": 459, "loss": 0.5449, "lr": 7.391304347826087e-06, "epoch": 0.22850924918389554, "percentage": 7.63, "elapsed_time": "0:40:10", "remaining_time": "8:06:36"}
|
36 |
+
{"current_steps": 36, "total_steps": 459, "loss": 0.4993, "lr": 7.608695652173914e-06, "epoch": 0.235038084874864, "percentage": 7.84, "elapsed_time": "0:41:10", "remaining_time": "8:03:47"}
|
37 |
+
{"current_steps": 37, "total_steps": 459, "loss": 0.4685, "lr": 7.82608695652174e-06, "epoch": 0.24156692056583243, "percentage": 8.06, "elapsed_time": "0:42:25", "remaining_time": "8:03:56"}
|
38 |
+
{"current_steps": 38, "total_steps": 459, "loss": 0.4806, "lr": 8.043478260869566e-06, "epoch": 0.24809575625680086, "percentage": 8.28, "elapsed_time": "0:43:39", "remaining_time": "8:03:40"}
|
39 |
+
{"current_steps": 39, "total_steps": 459, "loss": 0.468, "lr": 8.260869565217392e-06, "epoch": 0.2546245919477693, "percentage": 8.5, "elapsed_time": "0:44:42", "remaining_time": "8:01:28"}
|
40 |
+
{"current_steps": 40, "total_steps": 459, "loss": 0.4569, "lr": 8.478260869565218e-06, "epoch": 0.2611534276387378, "percentage": 8.71, "elapsed_time": "0:45:53", "remaining_time": "8:00:47"}
|
41 |
+
{"current_steps": 41, "total_steps": 459, "loss": 0.4406, "lr": 8.695652173913044e-06, "epoch": 0.2676822633297062, "percentage": 8.93, "elapsed_time": "0:47:03", "remaining_time": "7:59:44"}
|
42 |
+
{"current_steps": 42, "total_steps": 459, "loss": 0.4557, "lr": 8.91304347826087e-06, "epoch": 0.27421109902067464, "percentage": 9.15, "elapsed_time": "0:48:03", "remaining_time": "7:57:13"}
|
43 |
+
{"current_steps": 43, "total_steps": 459, "loss": 0.4134, "lr": 9.130434782608697e-06, "epoch": 0.2807399347116431, "percentage": 9.37, "elapsed_time": "0:49:23", "remaining_time": "7:57:46"}
|
44 |
+
{"current_steps": 44, "total_steps": 459, "loss": 0.4841, "lr": 9.347826086956523e-06, "epoch": 0.28726877040261156, "percentage": 9.59, "elapsed_time": "0:50:29", "remaining_time": "7:56:17"}
|
45 |
+
{"current_steps": 45, "total_steps": 459, "loss": 0.4275, "lr": 9.565217391304349e-06, "epoch": 0.29379760609357997, "percentage": 9.8, "elapsed_time": "0:51:40", "remaining_time": "7:55:20"}
|
46 |
+
{"current_steps": 46, "total_steps": 459, "loss": 0.4753, "lr": 9.782608695652175e-06, "epoch": 0.3003264417845484, "percentage": 10.02, "elapsed_time": "0:52:55", "remaining_time": "7:55:14"}
|
47 |
+
{"current_steps": 47, "total_steps": 459, "loss": 0.4649, "lr": 1e-05, "epoch": 0.3068552774755169, "percentage": 10.24, "elapsed_time": "0:54:06", "remaining_time": "7:54:17"}
|
48 |
+
{"current_steps": 48, "total_steps": 459, "loss": 0.4243, "lr": 9.999855343632037e-06, "epoch": 0.3133841131664853, "percentage": 10.46, "elapsed_time": "0:55:14", "remaining_time": "7:53:01"}
|
49 |
+
{"current_steps": 49, "total_steps": 459, "loss": 0.4119, "lr": 9.99942138289833e-06, "epoch": 0.31991294885745375, "percentage": 10.68, "elapsed_time": "0:56:41", "remaining_time": "7:54:24"}
|
50 |
+
{"current_steps": 50, "total_steps": 459, "loss": 0.4827, "lr": 9.998698142908954e-06, "epoch": 0.3264417845484222, "percentage": 10.89, "elapsed_time": "0:57:58", "remaining_time": "7:54:16"}
|
51 |
+
{"current_steps": 51, "total_steps": 459, "loss": 0.4263, "lr": 9.997685665512418e-06, "epoch": 0.33297062023939067, "percentage": 11.11, "elapsed_time": "0:58:59", "remaining_time": "7:51:53"}
|
52 |
+
{"current_steps": 52, "total_steps": 459, "loss": 0.4548, "lr": 9.99638400929324e-06, "epoch": 0.3394994559303591, "percentage": 11.33, "elapsed_time": "1:00:14", "remaining_time": "7:51:26"}
|
53 |
+
{"current_steps": 53, "total_steps": 459, "loss": 0.4391, "lr": 9.994793249568568e-06, "epoch": 0.34602829162132753, "percentage": 11.55, "elapsed_time": "1:01:14", "remaining_time": "7:49:08"}
|
54 |
+
{"current_steps": 54, "total_steps": 459, "loss": 0.4194, "lr": 9.99291347838381e-06, "epoch": 0.352557127312296, "percentage": 11.76, "elapsed_time": "1:02:37", "remaining_time": "7:49:43"}
|
55 |
+
{"current_steps": 55, "total_steps": 459, "loss": 0.4396, "lr": 9.990744804507315e-06, "epoch": 0.3590859630032644, "percentage": 11.98, "elapsed_time": "1:03:52", "remaining_time": "7:49:08"}
|
56 |
+
{"current_steps": 56, "total_steps": 459, "loss": 0.4568, "lr": 9.988287353424077e-06, "epoch": 0.36561479869423286, "percentage": 12.2, "elapsed_time": "1:05:00", "remaining_time": "7:47:49"}
|
57 |
+
{"current_steps": 57, "total_steps": 459, "loss": 0.4243, "lr": 9.985541267328479e-06, "epoch": 0.3721436343852013, "percentage": 12.42, "elapsed_time": "1:06:04", "remaining_time": "7:46:03"}
|
58 |
+
{"current_steps": 58, "total_steps": 459, "loss": 0.4497, "lr": 9.98250670511605e-06, "epoch": 0.3786724700761698, "percentage": 12.64, "elapsed_time": "1:07:24", "remaining_time": "7:46:00"}
|
59 |
+
{"current_steps": 59, "total_steps": 459, "loss": 0.4838, "lr": 9.979183842374294e-06, "epoch": 0.3852013057671382, "percentage": 12.85, "elapsed_time": "1:08:52", "remaining_time": "7:46:54"}
|
60 |
+
{"current_steps": 60, "total_steps": 459, "loss": 0.4156, "lr": 9.975572871372513e-06, "epoch": 0.39173014145810664, "percentage": 13.07, "elapsed_time": "1:09:59", "remaining_time": "7:45:25"}
|
61 |
+
{"current_steps": 61, "total_steps": 459, "loss": 0.4101, "lr": 9.971674001050687e-06, "epoch": 0.3982589771490751, "percentage": 13.29, "elapsed_time": "1:10:52", "remaining_time": "7:42:23"}
|
62 |
+
{"current_steps": 62, "total_steps": 459, "loss": 0.4644, "lr": 9.967487457007382e-06, "epoch": 0.4047878128400435, "percentage": 13.51, "elapsed_time": "1:11:37", "remaining_time": "7:38:37"}
|
63 |
+
{"current_steps": 63, "total_steps": 459, "loss": 0.4146, "lr": 9.963013481486704e-06, "epoch": 0.41131664853101196, "percentage": 13.73, "elapsed_time": "1:12:43", "remaining_time": "7:37:07"}
|
64 |
+
{"current_steps": 64, "total_steps": 459, "loss": 0.4088, "lr": 9.958252333364266e-06, "epoch": 0.4178454842219804, "percentage": 13.94, "elapsed_time": "1:14:02", "remaining_time": "7:36:57"}
|
65 |
+
{"current_steps": 65, "total_steps": 459, "loss": 0.4399, "lr": 9.953204288132234e-06, "epoch": 0.4243743199129489, "percentage": 14.16, "elapsed_time": "1:15:02", "remaining_time": "7:34:50"}
|
66 |
+
{"current_steps": 66, "total_steps": 459, "loss": 0.414, "lr": 9.947869637883359e-06, "epoch": 0.4309031556039173, "percentage": 14.38, "elapsed_time": "1:16:02", "remaining_time": "7:32:49"}
|
67 |
+
{"current_steps": 67, "total_steps": 459, "loss": 0.4747, "lr": 9.942248691294092e-06, "epoch": 0.43743199129488575, "percentage": 14.6, "elapsed_time": "1:16:58", "remaining_time": "7:30:22"}
|
68 |
+
{"current_steps": 68, "total_steps": 459, "loss": 0.4272, "lr": 9.936341773606723e-06, "epoch": 0.4439608269858542, "percentage": 14.81, "elapsed_time": "1:17:41", "remaining_time": "7:26:46"}
|
69 |
+
{"current_steps": 69, "total_steps": 459, "loss": 0.4408, "lr": 9.930149226610555e-06, "epoch": 0.4504896626768226, "percentage": 15.03, "elapsed_time": "1:18:46", "remaining_time": "7:25:15"}
|
70 |
+
{"current_steps": 70, "total_steps": 459, "loss": 0.4796, "lr": 9.923671408622128e-06, "epoch": 0.45701849836779107, "percentage": 15.25, "elapsed_time": "1:19:50", "remaining_time": "7:23:43"}
|
71 |
+
{"current_steps": 71, "total_steps": 459, "loss": 0.4161, "lr": 9.916908694464494e-06, "epoch": 0.46354733405875953, "percentage": 15.47, "elapsed_time": "1:20:51", "remaining_time": "7:21:52"}
|
72 |
+
{"current_steps": 72, "total_steps": 459, "loss": 0.4157, "lr": 9.909861475445517e-06, "epoch": 0.470076169749728, "percentage": 15.69, "elapsed_time": "1:22:12", "remaining_time": "7:21:49"}
|
73 |
+
{"current_steps": 73, "total_steps": 459, "loss": 0.4385, "lr": 9.902530159335245e-06, "epoch": 0.4766050054406964, "percentage": 15.9, "elapsed_time": "1:23:24", "remaining_time": "7:21:04"}
|
74 |
+
{"current_steps": 74, "total_steps": 459, "loss": 0.4499, "lr": 9.894915170342297e-06, "epoch": 0.48313384113166485, "percentage": 16.12, "elapsed_time": "1:24:36", "remaining_time": "7:20:11"}
|
75 |
+
{"current_steps": 75, "total_steps": 459, "loss": 0.427, "lr": 9.887016949089334e-06, "epoch": 0.4896626768226333, "percentage": 16.34, "elapsed_time": "1:25:52", "remaining_time": "7:19:39"}
|
76 |
+
{"current_steps": 76, "total_steps": 459, "loss": 0.4522, "lr": 9.878835952587559e-06, "epoch": 0.4961915125136017, "percentage": 16.56, "elapsed_time": "1:27:04", "remaining_time": "7:18:47"}
|
77 |
+
{"current_steps": 77, "total_steps": 459, "loss": 0.4429, "lr": 9.870372654210265e-06, "epoch": 0.5027203482045702, "percentage": 16.78, "elapsed_time": "1:28:25", "remaining_time": "7:18:41"}
|
78 |
+
{"current_steps": 78, "total_steps": 459, "loss": 0.408, "lr": 9.861627543665456e-06, "epoch": 0.5092491838955386, "percentage": 16.99, "elapsed_time": "1:29:50", "remaining_time": "7:18:49"}
|
79 |
+
{"current_steps": 79, "total_steps": 459, "loss": 0.4213, "lr": 9.852601126967502e-06, "epoch": 0.515778019586507, "percentage": 17.21, "elapsed_time": "1:30:50", "remaining_time": "7:16:56"}
|
80 |
+
{"current_steps": 80, "total_steps": 459, "loss": 0.4132, "lr": 9.843293926407866e-06, "epoch": 0.5223068552774756, "percentage": 17.43, "elapsed_time": "1:32:00", "remaining_time": "7:15:54"}
|
81 |
+
{"current_steps": 81, "total_steps": 459, "loss": 0.4181, "lr": 9.833706480524878e-06, "epoch": 0.528835690968444, "percentage": 17.65, "elapsed_time": "1:32:55", "remaining_time": "7:13:36"}
|
82 |
+
{"current_steps": 82, "total_steps": 459, "loss": 0.4418, "lr": 9.823839344072582e-06, "epoch": 0.5353645266594124, "percentage": 17.86, "elapsed_time": "1:34:07", "remaining_time": "7:12:44"}
|
83 |
+
{"current_steps": 83, "total_steps": 459, "loss": 0.419, "lr": 9.81369308798862e-06, "epoch": 0.5418933623503809, "percentage": 18.08, "elapsed_time": "1:35:00", "remaining_time": "7:10:21"}
|
84 |
+
{"current_steps": 84, "total_steps": 459, "loss": 0.4095, "lr": 9.803268299361217e-06, "epoch": 0.5484221980413493, "percentage": 18.3, "elapsed_time": "1:36:12", "remaining_time": "7:09:31"}
|
85 |
+
{"current_steps": 85, "total_steps": 459, "loss": 0.4243, "lr": 9.7925655813952e-06, "epoch": 0.5549510337323177, "percentage": 18.52, "elapsed_time": "1:37:09", "remaining_time": "7:07:31"}
|
86 |
+
{"current_steps": 86, "total_steps": 459, "loss": 0.3727, "lr": 9.781585553377086e-06, "epoch": 0.5614798694232862, "percentage": 18.74, "elapsed_time": "1:38:18", "remaining_time": "7:06:24"}
|
87 |
+
{"current_steps": 87, "total_steps": 459, "loss": 0.4063, "lr": 9.770328850639268e-06, "epoch": 0.5680087051142546, "percentage": 18.95, "elapsed_time": "1:39:38", "remaining_time": "7:06:05"}
|
88 |
+
{"current_steps": 88, "total_steps": 459, "loss": 0.4432, "lr": 9.758796124523238e-06, "epoch": 0.5745375408052231, "percentage": 19.17, "elapsed_time": "1:40:24", "remaining_time": "7:03:19"}
|
89 |
+
{"current_steps": 89, "total_steps": 459, "loss": 0.4527, "lr": 9.746988042341907e-06, "epoch": 0.5810663764961915, "percentage": 19.39, "elapsed_time": "1:41:15", "remaining_time": "7:00:58"}
|
90 |
+
{"current_steps": 90, "total_steps": 459, "loss": 0.3915, "lr": 9.734905287340985e-06, "epoch": 0.5875952121871599, "percentage": 19.61, "elapsed_time": "1:42:15", "remaining_time": "6:59:14"}
|
91 |
+
{"current_steps": 91, "total_steps": 459, "loss": 0.3874, "lr": 9.722548558659457e-06, "epoch": 0.5941240478781284, "percentage": 19.83, "elapsed_time": "1:43:28", "remaining_time": "6:58:27"}
|
92 |
+
{"current_steps": 92, "total_steps": 459, "loss": 0.4132, "lr": 9.709918571289114e-06, "epoch": 0.6006528835690969, "percentage": 20.04, "elapsed_time": "1:44:45", "remaining_time": "6:57:51"}
|
93 |
+
{"current_steps": 93, "total_steps": 459, "loss": 0.4179, "lr": 9.697016056033202e-06, "epoch": 0.6071817192600653, "percentage": 20.26, "elapsed_time": "1:45:51", "remaining_time": "6:56:34"}
|
94 |
+
{"current_steps": 94, "total_steps": 459, "loss": 0.3873, "lr": 9.683841759464114e-06, "epoch": 0.6137105549510338, "percentage": 20.48, "elapsed_time": "1:46:42", "remaining_time": "6:54:21"}
|
95 |
+
{"current_steps": 95, "total_steps": 459, "loss": 0.4401, "lr": 9.670396443880208e-06, "epoch": 0.6202393906420022, "percentage": 20.7, "elapsed_time": "1:47:40", "remaining_time": "6:52:32"}
|
96 |
+
{"current_steps": 96, "total_steps": 459, "loss": 0.3998, "lr": 9.656680887261693e-06, "epoch": 0.6267682263329706, "percentage": 20.92, "elapsed_time": "1:48:41", "remaining_time": "6:50:59"}
|
97 |
+
{"current_steps": 97, "total_steps": 459, "loss": 0.3667, "lr": 9.64269588322561e-06, "epoch": 0.6332970620239391, "percentage": 21.13, "elapsed_time": "1:50:10", "remaining_time": "6:51:10"}
|
98 |
+
{"current_steps": 98, "total_steps": 459, "loss": 0.4073, "lr": 9.628442240979915e-06, "epoch": 0.6398258977149075, "percentage": 21.35, "elapsed_time": "1:51:40", "remaining_time": "6:51:23"}
|
99 |
+
{"current_steps": 99, "total_steps": 459, "loss": 0.4234, "lr": 9.613920785276655e-06, "epoch": 0.6463547334058759, "percentage": 21.57, "elapsed_time": "1:52:38", "remaining_time": "6:49:35"}
|
100 |
+
{"current_steps": 100, "total_steps": 459, "loss": 0.4614, "lr": 9.599132356364247e-06, "epoch": 0.6528835690968444, "percentage": 21.79, "elapsed_time": "1:53:45", "remaining_time": "6:48:23"}
|
101 |
+
{"current_steps": 101, "total_steps": 459, "loss": 0.4418, "lr": 9.584077809938856e-06, "epoch": 0.6594124047878128, "percentage": 22.0, "elapsed_time": "1:57:48", "remaining_time": "6:57:34"}
|
102 |
+
{"current_steps": 102, "total_steps": 459, "loss": 0.4131, "lr": 9.568758017094884e-06, "epoch": 0.6659412404787813, "percentage": 22.22, "elapsed_time": "1:58:57", "remaining_time": "6:56:21"}
|
103 |
+
{"current_steps": 103, "total_steps": 459, "loss": 0.389, "lr": 9.553173864274567e-06, "epoch": 0.6724700761697497, "percentage": 22.44, "elapsed_time": "2:00:15", "remaining_time": "6:55:37"}
|
104 |
+
{"current_steps": 104, "total_steps": 459, "loss": 0.4406, "lr": 9.537326253216685e-06, "epoch": 0.6789989118607181, "percentage": 22.66, "elapsed_time": "2:01:14", "remaining_time": "6:53:51"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 7992
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fedf49e8e2ef124d53ba44d045fba488fc71c102215242f478c36c1acedaa0e4
|
3 |
size 7992
|