yuzhounie commited on
Commit
6e100e3
·
verified ·
1 Parent(s): c18daa8

Training in progress, step 2148

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:728c295871c494d5d0b555809c03f36dcba106eaa33e6137026884eac0bfeaf8
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f636066c446878f490a2ab3d8366b5c6704e2f3a1a02a75f0d37079d8dea26e
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6d66d467f2e7d263f57ccdb3228259f9924b289575064881dffdf8d69a2da1f
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d91e2adeb80a47306666d4a89fe2e8790333bb0cb8d654227be5b1e1f87b7035
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d63f46e90a48121a44eb6cf9e10cd798565607f016b2c21ae3e932b4feb6b666
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00fbc05c610ce8c7ef71246407e6abc86ed5f2855aeb7ad17e36db12ced35f76
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6716c227c90308816e0af32cf5e1ef23f5b826876ef0ddc6f0d86d18febdedbf
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fccad15716bad379d2e8c7fe4480b072f5d51e30778fc3c842a94ff2c79ee10
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -2014,3 +2014,136 @@
2014
  {"current_steps": 2014, "total_steps": 2148, "loss": 0.2267, "lr": 1.1986727955373588e-07, "epoch": 2.8119042083236456, "percentage": 93.76, "elapsed_time": "4:41:03", "remaining_time": "0:18:42"}
2015
  {"current_steps": 2015, "total_steps": 2148, "loss": 0.2363, "lr": 1.1810504364603737e-07, "epoch": 2.813299232736573, "percentage": 93.81, "elapsed_time": "4:41:10", "remaining_time": "0:18:33"}
2016
  {"current_steps": 2016, "total_steps": 2148, "loss": 0.2097, "lr": 1.163557028281792e-07, "epoch": 2.8146942571495, "percentage": 93.85, "elapsed_time": "4:41:17", "remaining_time": "0:18:25"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2014
  {"current_steps": 2014, "total_steps": 2148, "loss": 0.2267, "lr": 1.1986727955373588e-07, "epoch": 2.8119042083236456, "percentage": 93.76, "elapsed_time": "4:41:03", "remaining_time": "0:18:42"}
2015
  {"current_steps": 2015, "total_steps": 2148, "loss": 0.2363, "lr": 1.1810504364603737e-07, "epoch": 2.813299232736573, "percentage": 93.81, "elapsed_time": "4:41:10", "remaining_time": "0:18:33"}
2016
  {"current_steps": 2016, "total_steps": 2148, "loss": 0.2097, "lr": 1.163557028281792e-07, "epoch": 2.8146942571495, "percentage": 93.85, "elapsed_time": "4:41:17", "remaining_time": "0:18:25"}
2017
+ {"current_steps": 2017, "total_steps": 2148, "loss": 0.1964, "lr": 1.146192617208891e-07, "epoch": 2.8160892815624274, "percentage": 93.9, "elapsed_time": "4:41:30", "remaining_time": "0:18:17"}
2018
+ {"current_steps": 2018, "total_steps": 2148, "loss": 0.2091, "lr": 1.128957249108209e-07, "epoch": 2.8174843059753547, "percentage": 93.95, "elapsed_time": "4:41:38", "remaining_time": "0:18:08"}
2019
+ {"current_steps": 2019, "total_steps": 2148, "loss": 0.2097, "lr": 1.1118509695054236e-07, "epoch": 2.818879330388282, "percentage": 93.99, "elapsed_time": "4:41:44", "remaining_time": "0:18:00"}
2020
+ {"current_steps": 2020, "total_steps": 2148, "loss": 0.2057, "lr": 1.094873823585263e-07, "epoch": 2.8202743548012092, "percentage": 94.04, "elapsed_time": "4:41:52", "remaining_time": "0:17:51"}
2021
+ {"current_steps": 2021, "total_steps": 2148, "loss": 0.2375, "lr": 1.0780258561913281e-07, "epoch": 2.8216693792141365, "percentage": 94.09, "elapsed_time": "4:41:59", "remaining_time": "0:17:43"}
2022
+ {"current_steps": 2022, "total_steps": 2148, "loss": 0.2365, "lr": 1.0613071118260321e-07, "epoch": 2.8230644036270633, "percentage": 94.13, "elapsed_time": "4:42:06", "remaining_time": "0:17:34"}
2023
+ {"current_steps": 2023, "total_steps": 2148, "loss": 0.2507, "lr": 1.0447176346504439e-07, "epoch": 2.8244594280399906, "percentage": 94.18, "elapsed_time": "4:42:17", "remaining_time": "0:17:26"}
2024
+ {"current_steps": 2024, "total_steps": 2148, "loss": 0.2503, "lr": 1.0282574684841784e-07, "epoch": 2.825854452452918, "percentage": 94.23, "elapsed_time": "4:42:24", "remaining_time": "0:17:18"}
2025
+ {"current_steps": 2025, "total_steps": 2148, "loss": 0.2135, "lr": 1.011926656805301e-07, "epoch": 2.827249476865845, "percentage": 94.27, "elapsed_time": "4:42:38", "remaining_time": "0:17:10"}
2026
+ {"current_steps": 2026, "total_steps": 2148, "loss": 0.2098, "lr": 9.957252427501951e-08, "epoch": 2.8286445012787724, "percentage": 94.32, "elapsed_time": "4:42:46", "remaining_time": "0:17:01"}
2027
+ {"current_steps": 2027, "total_steps": 2148, "loss": 0.2391, "lr": 9.796532691134453e-08, "epoch": 2.8300395256916997, "percentage": 94.37, "elapsed_time": "4:42:56", "remaining_time": "0:16:53"}
2028
+ {"current_steps": 2028, "total_steps": 2148, "loss": 0.2211, "lr": 9.637107783477484e-08, "epoch": 2.831434550104627, "percentage": 94.41, "elapsed_time": "4:43:03", "remaining_time": "0:16:44"}
2029
+ {"current_steps": 2029, "total_steps": 2148, "loss": 0.2056, "lr": 9.478978125637583e-08, "epoch": 2.832829574517554, "percentage": 94.46, "elapsed_time": "4:43:14", "remaining_time": "0:16:36"}
2030
+ {"current_steps": 2030, "total_steps": 2148, "loss": 0.2356, "lr": 9.322144135300137e-08, "epoch": 2.834224598930481, "percentage": 94.51, "elapsed_time": "4:43:24", "remaining_time": "0:16:28"}
2031
+ {"current_steps": 2031, "total_steps": 2148, "loss": 0.2069, "lr": 9.166606226728103e-08, "epoch": 2.8356196233434083, "percentage": 94.55, "elapsed_time": "4:43:30", "remaining_time": "0:16:19"}
2032
+ {"current_steps": 2032, "total_steps": 2148, "loss": 0.2401, "lr": 9.012364810761121e-08, "epoch": 2.8370146477563356, "percentage": 94.6, "elapsed_time": "4:43:38", "remaining_time": "0:16:11"}
2033
+ {"current_steps": 2033, "total_steps": 2148, "loss": 0.235, "lr": 8.859420294814014e-08, "epoch": 2.838409672169263, "percentage": 94.65, "elapsed_time": "4:43:48", "remaining_time": "0:16:03"}
2034
+ {"current_steps": 2034, "total_steps": 2148, "loss": 0.2546, "lr": 8.70777308287618e-08, "epoch": 2.83980469658219, "percentage": 94.69, "elapsed_time": "4:43:55", "remaining_time": "0:15:54"}
2035
+ {"current_steps": 2035, "total_steps": 2148, "loss": 0.2552, "lr": 8.557423575510037e-08, "epoch": 2.8411997209951174, "percentage": 94.74, "elapsed_time": "4:44:04", "remaining_time": "0:15:46"}
2036
+ {"current_steps": 2036, "total_steps": 2148, "loss": 0.245, "lr": 8.408372169850521e-08, "epoch": 2.8425947454080447, "percentage": 94.79, "elapsed_time": "4:44:18", "remaining_time": "0:15:38"}
2037
+ {"current_steps": 2037, "total_steps": 2148, "loss": 0.2627, "lr": 8.26061925960353e-08, "epoch": 2.843989769820972, "percentage": 94.83, "elapsed_time": "4:44:30", "remaining_time": "0:15:30"}
2038
+ {"current_steps": 2038, "total_steps": 2148, "loss": 0.2387, "lr": 8.114165235045268e-08, "epoch": 2.8453847942338992, "percentage": 94.88, "elapsed_time": "4:44:36", "remaining_time": "0:15:21"}
2039
+ {"current_steps": 2039, "total_steps": 2148, "loss": 0.228, "lr": 7.969010483020845e-08, "epoch": 2.8467798186468265, "percentage": 94.93, "elapsed_time": "4:44:42", "remaining_time": "0:15:13"}
2040
+ {"current_steps": 2040, "total_steps": 2148, "loss": 0.2349, "lr": 7.825155386943784e-08, "epoch": 2.8481748430597538, "percentage": 94.97, "elapsed_time": "4:44:50", "remaining_time": "0:15:04"}
2041
+ {"current_steps": 2041, "total_steps": 2148, "loss": 0.2427, "lr": 7.682600326794353e-08, "epoch": 2.849569867472681, "percentage": 95.02, "elapsed_time": "4:45:02", "remaining_time": "0:14:56"}
2042
+ {"current_steps": 2042, "total_steps": 2148, "loss": 0.2302, "lr": 7.541345679118961e-08, "epoch": 2.850964891885608, "percentage": 95.07, "elapsed_time": "4:45:11", "remaining_time": "0:14:48"}
2043
+ {"current_steps": 2043, "total_steps": 2148, "loss": 0.227, "lr": 7.401391817029257e-08, "epoch": 2.852359916298535, "percentage": 95.11, "elapsed_time": "4:45:19", "remaining_time": "0:14:39"}
2044
+ {"current_steps": 2044, "total_steps": 2148, "loss": 0.2281, "lr": 7.262739110200923e-08, "epoch": 2.8537549407114624, "percentage": 95.16, "elapsed_time": "4:45:25", "remaining_time": "0:14:31"}
2045
+ {"current_steps": 2045, "total_steps": 2148, "loss": 0.2552, "lr": 7.125387924872552e-08, "epoch": 2.8551499651243897, "percentage": 95.2, "elapsed_time": "4:45:35", "remaining_time": "0:14:23"}
2046
+ {"current_steps": 2046, "total_steps": 2148, "loss": 0.2123, "lr": 6.98933862384521e-08, "epoch": 2.856544989537317, "percentage": 95.25, "elapsed_time": "4:45:41", "remaining_time": "0:14:14"}
2047
+ {"current_steps": 2047, "total_steps": 2148, "loss": 0.1864, "lr": 6.854591566480884e-08, "epoch": 2.857940013950244, "percentage": 95.3, "elapsed_time": "4:45:50", "remaining_time": "0:14:06"}
2048
+ {"current_steps": 2048, "total_steps": 2148, "loss": 0.2352, "lr": 6.721147108701864e-08, "epoch": 2.8593350383631715, "percentage": 95.34, "elapsed_time": "4:45:57", "remaining_time": "0:13:57"}
2049
+ {"current_steps": 2049, "total_steps": 2148, "loss": 0.2299, "lr": 6.589005602989862e-08, "epoch": 2.8607300627760983, "percentage": 95.39, "elapsed_time": "4:46:05", "remaining_time": "0:13:49"}
2050
+ {"current_steps": 2050, "total_steps": 2148, "loss": 0.2346, "lr": 6.458167398384896e-08, "epoch": 2.8621250871890256, "percentage": 95.44, "elapsed_time": "4:46:11", "remaining_time": "0:13:40"}
2051
+ {"current_steps": 2051, "total_steps": 2148, "loss": 0.2003, "lr": 6.328632840484294e-08, "epoch": 2.863520111601953, "percentage": 95.48, "elapsed_time": "4:46:18", "remaining_time": "0:13:32"}
2052
+ {"current_steps": 2052, "total_steps": 2148, "loss": 0.2241, "lr": 6.200402271442085e-08, "epoch": 2.86491513601488, "percentage": 95.53, "elapsed_time": "4:46:24", "remaining_time": "0:13:23"}
2053
+ {"current_steps": 2053, "total_steps": 2148, "loss": 0.2304, "lr": 6.073476029967884e-08, "epoch": 2.8663101604278074, "percentage": 95.58, "elapsed_time": "4:46:32", "remaining_time": "0:13:15"}
2054
+ {"current_steps": 2054, "total_steps": 2148, "loss": 0.2461, "lr": 5.947854451326007e-08, "epoch": 2.8677051848407347, "percentage": 95.62, "elapsed_time": "4:46:40", "remaining_time": "0:13:07"}
2055
+ {"current_steps": 2055, "total_steps": 2148, "loss": 0.2136, "lr": 5.823537867334694e-08, "epoch": 2.869100209253662, "percentage": 95.67, "elapsed_time": "4:46:48", "remaining_time": "0:12:58"}
2056
+ {"current_steps": 2056, "total_steps": 2148, "loss": 0.2243, "lr": 5.7005266063650534e-08, "epoch": 2.870495233666589, "percentage": 95.72, "elapsed_time": "4:46:54", "remaining_time": "0:12:50"}
2057
+ {"current_steps": 2057, "total_steps": 2148, "loss": 0.2805, "lr": 5.5788209933403944e-08, "epoch": 2.8718902580795165, "percentage": 95.76, "elapsed_time": "4:47:00", "remaining_time": "0:12:41"}
2058
+ {"current_steps": 2058, "total_steps": 2148, "loss": 0.2263, "lr": 5.4584213497351766e-08, "epoch": 2.8732852824924437, "percentage": 95.81, "elapsed_time": "4:47:07", "remaining_time": "0:12:33"}
2059
+ {"current_steps": 2059, "total_steps": 2148, "loss": 0.2099, "lr": 5.339327993574339e-08, "epoch": 2.874680306905371, "percentage": 95.86, "elapsed_time": "4:47:14", "remaining_time": "0:12:24"}
2060
+ {"current_steps": 2060, "total_steps": 2148, "loss": 0.1981, "lr": 5.221541239432415e-08, "epoch": 2.8760753313182983, "percentage": 95.9, "elapsed_time": "4:47:23", "remaining_time": "0:12:16"}
2061
+ {"current_steps": 2061, "total_steps": 2148, "loss": 0.1994, "lr": 5.1050613984324756e-08, "epoch": 2.8774703557312256, "percentage": 95.95, "elapsed_time": "4:47:33", "remaining_time": "0:12:08"}
2062
+ {"current_steps": 2062, "total_steps": 2148, "loss": 0.2516, "lr": 4.989888778245744e-08, "epoch": 2.8788653801441524, "percentage": 96.0, "elapsed_time": "4:47:41", "remaining_time": "0:11:59"}
2063
+ {"current_steps": 2063, "total_steps": 2148, "loss": 0.2377, "lr": 4.8760236830903697e-08, "epoch": 2.8802604045570797, "percentage": 96.04, "elapsed_time": "4:47:51", "remaining_time": "0:11:51"}
2064
+ {"current_steps": 2064, "total_steps": 2148, "loss": 0.2451, "lr": 4.763466413730822e-08, "epoch": 2.881655428970007, "percentage": 96.09, "elapsed_time": "4:47:58", "remaining_time": "0:11:43"}
2065
+ {"current_steps": 2065, "total_steps": 2148, "loss": 0.2393, "lr": 4.65221726747711e-08, "epoch": 2.883050453382934, "percentage": 96.14, "elapsed_time": "4:48:08", "remaining_time": "0:11:34"}
2066
+ {"current_steps": 2066, "total_steps": 2148, "loss": 0.2225, "lr": 4.542276538183954e-08, "epoch": 2.8844454777958615, "percentage": 96.18, "elapsed_time": "4:48:23", "remaining_time": "0:11:26"}
2067
+ {"current_steps": 2067, "total_steps": 2148, "loss": 0.246, "lr": 4.433644516249891e-08, "epoch": 2.8858405022087887, "percentage": 96.23, "elapsed_time": "4:48:30", "remaining_time": "0:11:18"}
2068
+ {"current_steps": 2068, "total_steps": 2148, "loss": 0.2508, "lr": 4.326321488616836e-08, "epoch": 2.887235526621716, "percentage": 96.28, "elapsed_time": "4:48:48", "remaining_time": "0:11:10"}
2069
+ {"current_steps": 2069, "total_steps": 2148, "loss": 0.2237, "lr": 4.220307738768859e-08, "epoch": 2.888630551034643, "percentage": 96.32, "elapsed_time": "4:48:54", "remaining_time": "0:11:01"}
2070
+ {"current_steps": 2070, "total_steps": 2148, "loss": 0.246, "lr": 4.11560354673185e-08, "epoch": 2.89002557544757, "percentage": 96.37, "elapsed_time": "4:49:03", "remaining_time": "0:10:53"}
2071
+ {"current_steps": 2071, "total_steps": 2148, "loss": 0.2291, "lr": 4.0122091890726354e-08, "epoch": 2.8914205998604974, "percentage": 96.42, "elapsed_time": "4:49:09", "remaining_time": "0:10:45"}
2072
+ {"current_steps": 2072, "total_steps": 2148, "loss": 0.2018, "lr": 3.9101249388981965e-08, "epoch": 2.8928156242734246, "percentage": 96.46, "elapsed_time": "4:49:22", "remaining_time": "0:10:36"}
2073
+ {"current_steps": 2073, "total_steps": 2148, "loss": 0.2586, "lr": 3.809351065854894e-08, "epoch": 2.894210648686352, "percentage": 96.51, "elapsed_time": "4:49:32", "remaining_time": "0:10:28"}
2074
+ {"current_steps": 2074, "total_steps": 2148, "loss": 0.2614, "lr": 3.709887836128023e-08, "epoch": 2.895605673099279, "percentage": 96.55, "elapsed_time": "4:49:42", "remaining_time": "0:10:20"}
2075
+ {"current_steps": 2075, "total_steps": 2148, "loss": 0.2514, "lr": 3.611735512440706e-08, "epoch": 2.8970006975122065, "percentage": 96.6, "elapsed_time": "4:49:48", "remaining_time": "0:10:11"}
2076
+ {"current_steps": 2076, "total_steps": 2148, "loss": 0.2265, "lr": 3.5148943540536105e-08, "epoch": 2.8983957219251337, "percentage": 96.65, "elapsed_time": "4:49:57", "remaining_time": "0:10:03"}
2077
+ {"current_steps": 2077, "total_steps": 2148, "loss": 0.2521, "lr": 3.4193646167640646e-08, "epoch": 2.899790746338061, "percentage": 96.69, "elapsed_time": "4:50:04", "remaining_time": "0:09:54"}
2078
+ {"current_steps": 2078, "total_steps": 2148, "loss": 0.228, "lr": 3.325146552905223e-08, "epoch": 2.9011857707509883, "percentage": 96.74, "elapsed_time": "4:50:12", "remaining_time": "0:09:46"}
2079
+ {"current_steps": 2079, "total_steps": 2148, "loss": 0.2535, "lr": 3.2322404113457886e-08, "epoch": 2.9025807951639155, "percentage": 96.79, "elapsed_time": "4:50:21", "remaining_time": "0:09:38"}
2080
+ {"current_steps": 2080, "total_steps": 2148, "loss": 0.2293, "lr": 3.1406464374890144e-08, "epoch": 2.903975819576843, "percentage": 96.83, "elapsed_time": "4:50:28", "remaining_time": "0:09:29"}
2081
+ {"current_steps": 2081, "total_steps": 2148, "loss": 0.2477, "lr": 3.0503648732722046e-08, "epoch": 2.90537084398977, "percentage": 96.88, "elapsed_time": "4:50:38", "remaining_time": "0:09:21"}
2082
+ {"current_steps": 2082, "total_steps": 2148, "loss": 0.2157, "lr": 2.9613959571660468e-08, "epoch": 2.906765868402697, "percentage": 96.93, "elapsed_time": "4:50:44", "remaining_time": "0:09:13"}
2083
+ {"current_steps": 2083, "total_steps": 2148, "loss": 0.2189, "lr": 2.8737399241740016e-08, "epoch": 2.908160892815624, "percentage": 96.97, "elapsed_time": "4:50:51", "remaining_time": "0:09:04"}
2084
+ {"current_steps": 2084, "total_steps": 2148, "loss": 0.2289, "lr": 2.7873970058316934e-08, "epoch": 2.9095559172285514, "percentage": 97.02, "elapsed_time": "4:51:01", "remaining_time": "0:08:56"}
2085
+ {"current_steps": 2085, "total_steps": 2148, "loss": 0.2243, "lr": 2.7023674302061875e-08, "epoch": 2.9109509416414787, "percentage": 97.07, "elapsed_time": "4:51:07", "remaining_time": "0:08:47"}
2086
+ {"current_steps": 2086, "total_steps": 2148, "loss": 0.2063, "lr": 2.6186514218954905e-08, "epoch": 2.912345966054406, "percentage": 97.11, "elapsed_time": "4:51:13", "remaining_time": "0:08:39"}
2087
+ {"current_steps": 2087, "total_steps": 2148, "loss": 0.2177, "lr": 2.5362492020280517e-08, "epoch": 2.9137409904673333, "percentage": 97.16, "elapsed_time": "4:51:26", "remaining_time": "0:08:31"}
2088
+ {"current_steps": 2088, "total_steps": 2148, "loss": 0.2492, "lr": 2.4551609882619288e-08, "epoch": 2.9151360148802605, "percentage": 97.21, "elapsed_time": "4:51:35", "remaining_time": "0:08:22"}
2089
+ {"current_steps": 2089, "total_steps": 2148, "loss": 0.2173, "lr": 2.3753869947843457e-08, "epoch": 2.9165310392931874, "percentage": 97.25, "elapsed_time": "4:51:42", "remaining_time": "0:08:14"}
2090
+ {"current_steps": 2090, "total_steps": 2148, "loss": 0.2468, "lr": 2.296927432311358e-08, "epoch": 2.9179260637061146, "percentage": 97.3, "elapsed_time": "4:51:49", "remaining_time": "0:08:05"}
2091
+ {"current_steps": 2091, "total_steps": 2148, "loss": 0.2247, "lr": 2.2197825080867432e-08, "epoch": 2.919321088119042, "percentage": 97.35, "elapsed_time": "4:51:59", "remaining_time": "0:07:57"}
2092
+ {"current_steps": 2092, "total_steps": 2148, "loss": 0.2491, "lr": 2.1439524258819456e-08, "epoch": 2.920716112531969, "percentage": 97.39, "elapsed_time": "4:52:09", "remaining_time": "0:07:49"}
2093
+ {"current_steps": 2093, "total_steps": 2148, "loss": 0.2173, "lr": 2.0694373859954653e-08, "epoch": 2.9221111369448964, "percentage": 97.44, "elapsed_time": "4:52:16", "remaining_time": "0:07:40"}
2094
+ {"current_steps": 2094, "total_steps": 2148, "loss": 0.2368, "lr": 1.99623758525197e-08, "epoch": 2.9235061613578237, "percentage": 97.49, "elapsed_time": "4:52:23", "remaining_time": "0:07:32"}
2095
+ {"current_steps": 2095, "total_steps": 2148, "loss": 0.221, "lr": 1.9243532170023504e-08, "epoch": 2.924901185770751, "percentage": 97.53, "elapsed_time": "4:52:32", "remaining_time": "0:07:24"}
2096
+ {"current_steps": 2096, "total_steps": 2148, "loss": 0.2049, "lr": 1.8537844711227215e-08, "epoch": 2.9262962101836782, "percentage": 97.58, "elapsed_time": "4:52:40", "remaining_time": "0:07:15"}
2097
+ {"current_steps": 2097, "total_steps": 2148, "loss": 0.2097, "lr": 1.7845315340140334e-08, "epoch": 2.9276912345966055, "percentage": 97.63, "elapsed_time": "4:52:50", "remaining_time": "0:07:07"}
2098
+ {"current_steps": 2098, "total_steps": 2148, "loss": 0.1912, "lr": 1.7165945886018498e-08, "epoch": 2.929086259009533, "percentage": 97.67, "elapsed_time": "4:53:00", "remaining_time": "0:06:58"}
2099
+ {"current_steps": 2099, "total_steps": 2148, "loss": 0.2142, "lr": 1.6499738143354594e-08, "epoch": 2.93048128342246, "percentage": 97.72, "elapsed_time": "4:53:07", "remaining_time": "0:06:50"}
2100
+ {"current_steps": 2100, "total_steps": 2148, "loss": 0.2267, "lr": 1.584669387187765e-08, "epoch": 2.9318763078353873, "percentage": 97.77, "elapsed_time": "4:53:22", "remaining_time": "0:06:42"}
2101
+ {"current_steps": 2101, "total_steps": 2148, "loss": 0.219, "lr": 1.520681479654562e-08, "epoch": 2.9332713322483146, "percentage": 97.81, "elapsed_time": "4:53:31", "remaining_time": "0:06:33"}
2102
+ {"current_steps": 2102, "total_steps": 2148, "loss": 0.2275, "lr": 1.4580102607541502e-08, "epoch": 2.9346663566612414, "percentage": 97.86, "elapsed_time": "4:53:38", "remaining_time": "0:06:25"}
2103
+ {"current_steps": 2103, "total_steps": 2148, "loss": 0.2082, "lr": 1.3966558960269994e-08, "epoch": 2.9360613810741687, "percentage": 97.91, "elapsed_time": "4:53:45", "remaining_time": "0:06:17"}
2104
+ {"current_steps": 2104, "total_steps": 2148, "loss": 0.2073, "lr": 1.3366185475351957e-08, "epoch": 2.937456405487096, "percentage": 97.95, "elapsed_time": "4:53:52", "remaining_time": "0:06:08"}
2105
+ {"current_steps": 2105, "total_steps": 2148, "loss": 0.2326, "lr": 1.2778983738620521e-08, "epoch": 2.9388514299000232, "percentage": 98.0, "elapsed_time": "4:54:01", "remaining_time": "0:06:00"}
2106
+ {"current_steps": 2106, "total_steps": 2148, "loss": 0.2094, "lr": 1.2204955301116095e-08, "epoch": 2.9402464543129505, "percentage": 98.04, "elapsed_time": "4:54:07", "remaining_time": "0:05:51"}
2107
+ {"current_steps": 2107, "total_steps": 2148, "loss": 0.2212, "lr": 1.164410167908414e-08, "epoch": 2.941641478725878, "percentage": 98.09, "elapsed_time": "4:54:15", "remaining_time": "0:05:43"}
2108
+ {"current_steps": 2108, "total_steps": 2148, "loss": 0.2125, "lr": 1.109642435396907e-08, "epoch": 2.943036503138805, "percentage": 98.14, "elapsed_time": "4:54:25", "remaining_time": "0:05:35"}
2109
+ {"current_steps": 2109, "total_steps": 2148, "loss": 0.2243, "lr": 1.0561924772412024e-08, "epoch": 2.9444315275517323, "percentage": 98.18, "elapsed_time": "4:54:32", "remaining_time": "0:05:26"}
2110
+ {"current_steps": 2110, "total_steps": 2148, "loss": 0.2682, "lr": 1.0040604346245319e-08, "epoch": 2.945826551964659, "percentage": 98.23, "elapsed_time": "4:54:39", "remaining_time": "0:05:18"}
2111
+ {"current_steps": 2111, "total_steps": 2148, "loss": 0.2187, "lr": 9.532464452491341e-09, "epoch": 2.9472215763775864, "percentage": 98.28, "elapsed_time": "4:54:45", "remaining_time": "0:05:09"}
2112
+ {"current_steps": 2112, "total_steps": 2148, "loss": 0.2265, "lr": 9.037506433355325e-09, "epoch": 2.9486166007905137, "percentage": 98.32, "elapsed_time": "4:54:53", "remaining_time": "0:05:01"}
2113
+ {"current_steps": 2113, "total_steps": 2148, "loss": 0.2115, "lr": 8.555731596224803e-09, "epoch": 2.950011625203441, "percentage": 98.37, "elapsed_time": "4:55:02", "remaining_time": "0:04:53"}
2114
+ {"current_steps": 2114, "total_steps": 2148, "loss": 0.2384, "lr": 8.087141213665717e-09, "epoch": 2.9514066496163682, "percentage": 98.42, "elapsed_time": "4:55:10", "remaining_time": "0:04:44"}
2115
+ {"current_steps": 2115, "total_steps": 2148, "loss": 0.2296, "lr": 7.631736523416867e-09, "epoch": 2.9528016740292955, "percentage": 98.46, "elapsed_time": "4:55:17", "remaining_time": "0:04:36"}
2116
+ {"current_steps": 2116, "total_steps": 2148, "loss": 0.1834, "lr": 7.1895187283899104e-09, "epoch": 2.9541966984422228, "percentage": 98.51, "elapsed_time": "4:55:28", "remaining_time": "0:04:28"}
2117
+ {"current_steps": 2117, "total_steps": 2148, "loss": 0.2321, "lr": 6.760488996662706e-09, "epoch": 2.95559172285515, "percentage": 98.56, "elapsed_time": "4:55:37", "remaining_time": "0:04:19"}
2118
+ {"current_steps": 2118, "total_steps": 2148, "loss": 0.197, "lr": 6.3446484614798635e-09, "epoch": 2.9569867472680773, "percentage": 98.6, "elapsed_time": "4:55:46", "remaining_time": "0:04:11"}
2119
+ {"current_steps": 2119, "total_steps": 2148, "loss": 0.2359, "lr": 5.941998221247192e-09, "epoch": 2.9583817716810046, "percentage": 98.65, "elapsed_time": "4:55:54", "remaining_time": "0:04:02"}
2120
+ {"current_steps": 2120, "total_steps": 2148, "loss": 0.2762, "lr": 5.552539339528373e-09, "epoch": 2.959776796093932, "percentage": 98.7, "elapsed_time": "4:56:02", "remaining_time": "0:03:54"}
2121
+ {"current_steps": 2121, "total_steps": 2148, "loss": 0.2286, "lr": 5.176272845045516e-09, "epoch": 2.961171820506859, "percentage": 98.74, "elapsed_time": "4:56:11", "remaining_time": "0:03:46"}
2122
+ {"current_steps": 2122, "total_steps": 2148, "loss": 0.2036, "lr": 4.813199731671381e-09, "epoch": 2.962566844919786, "percentage": 98.79, "elapsed_time": "4:56:18", "remaining_time": "0:03:37"}
2123
+ {"current_steps": 2123, "total_steps": 2148, "loss": 0.1943, "lr": 4.463320958432716e-09, "epoch": 2.963961869332713, "percentage": 98.84, "elapsed_time": "4:56:25", "remaining_time": "0:03:29"}
2124
+ {"current_steps": 2124, "total_steps": 2148, "loss": 0.219, "lr": 4.1266374495024795e-09, "epoch": 2.9653568937456405, "percentage": 98.88, "elapsed_time": "4:56:31", "remaining_time": "0:03:21"}
2125
+ {"current_steps": 2125, "total_steps": 2148, "loss": 0.2182, "lr": 3.803150094200403e-09, "epoch": 2.9667519181585678, "percentage": 98.93, "elapsed_time": "4:56:37", "remaining_time": "0:03:12"}
2126
+ {"current_steps": 2126, "total_steps": 2148, "loss": 0.2141, "lr": 3.4928597469885416e-09, "epoch": 2.968146942571495, "percentage": 98.98, "elapsed_time": "4:56:46", "remaining_time": "0:03:04"}
2127
+ {"current_steps": 2127, "total_steps": 2148, "loss": 0.23, "lr": 3.1957672274723907e-09, "epoch": 2.9695419669844223, "percentage": 99.02, "elapsed_time": "4:56:54", "remaining_time": "0:02:55"}
2128
+ {"current_steps": 2128, "total_steps": 2148, "loss": 0.2378, "lr": 2.9118733203942207e-09, "epoch": 2.9709369913973496, "percentage": 99.07, "elapsed_time": "4:57:01", "remaining_time": "0:02:47"}
2129
+ {"current_steps": 2129, "total_steps": 2148, "loss": 0.2335, "lr": 2.6411787756353e-09, "epoch": 2.972332015810277, "percentage": 99.12, "elapsed_time": "4:57:10", "remaining_time": "0:02:39"}
2130
+ {"current_steps": 2130, "total_steps": 2148, "loss": 0.2453, "lr": 2.3836843082108987e-09, "epoch": 2.9737270402232037, "percentage": 99.16, "elapsed_time": "4:57:18", "remaining_time": "0:02:30"}
2131
+ {"current_steps": 2131, "total_steps": 2148, "loss": 0.2151, "lr": 2.1393905982691752e-09, "epoch": 2.975122064636131, "percentage": 99.21, "elapsed_time": "4:57:26", "remaining_time": "0:02:22"}
2132
+ {"current_steps": 2132, "total_steps": 2148, "loss": 0.2255, "lr": 1.9082982910911817e-09, "epoch": 2.976517089049058, "percentage": 99.26, "elapsed_time": "4:57:34", "remaining_time": "0:02:13"}
2133
+ {"current_steps": 2133, "total_steps": 2148, "loss": 0.2194, "lr": 1.6904079970853083e-09, "epoch": 2.9779121134619855, "percentage": 99.3, "elapsed_time": "4:57:46", "remaining_time": "0:02:05"}
2134
+ {"current_steps": 2134, "total_steps": 2148, "loss": 0.2221, "lr": 1.4857202917900604e-09, "epoch": 2.9793071378749127, "percentage": 99.35, "elapsed_time": "4:58:00", "remaining_time": "0:01:57"}
2135
+ {"current_steps": 2135, "total_steps": 2148, "loss": 0.2172, "lr": 1.2942357158701734e-09, "epoch": 2.98070216228784, "percentage": 99.39, "elapsed_time": "4:58:07", "remaining_time": "0:01:48"}
2136
+ {"current_steps": 2136, "total_steps": 2148, "loss": 0.2406, "lr": 1.1159547751143918e-09, "epoch": 2.9820971867007673, "percentage": 99.44, "elapsed_time": "4:58:13", "remaining_time": "0:01:40"}
2137
+ {"current_steps": 2137, "total_steps": 2148, "loss": 0.2521, "lr": 9.508779404360235e-10, "epoch": 2.9834922111136946, "percentage": 99.49, "elapsed_time": "4:58:21", "remaining_time": "0:01:32"}
2138
+ {"current_steps": 2138, "total_steps": 2148, "loss": 0.2252, "lr": 7.990056478707209e-10, "epoch": 2.984887235526622, "percentage": 99.53, "elapsed_time": "4:58:28", "remaining_time": "0:01:23"}
2139
+ {"current_steps": 2139, "total_steps": 2148, "loss": 0.2268, "lr": 6.603382985759244e-10, "epoch": 2.986282259939549, "percentage": 99.58, "elapsed_time": "4:58:35", "remaining_time": "0:01:15"}
2140
+ {"current_steps": 2140, "total_steps": 2148, "loss": 0.2651, "lr": 5.348762588286427e-10, "epoch": 2.9876772843524764, "percentage": 99.63, "elapsed_time": "4:58:41", "remaining_time": "0:01:06"}
2141
+ {"current_steps": 2141, "total_steps": 2148, "loss": 0.2521, "lr": 4.2261986002600783e-10, "epoch": 2.9890723087654036, "percentage": 99.67, "elapsed_time": "4:58:53", "remaining_time": "0:00:58"}
2142
+ {"current_steps": 2142, "total_steps": 2148, "loss": 0.2588, "lr": 3.235693986830546e-10, "epoch": 2.9904673331783305, "percentage": 99.72, "elapsed_time": "4:59:02", "remaining_time": "0:00:50"}
2143
+ {"current_steps": 2143, "total_steps": 2148, "loss": 0.2408, "lr": 2.3772513643327555e-10, "epoch": 2.9918623575912577, "percentage": 99.77, "elapsed_time": "4:59:12", "remaining_time": "0:00:41"}
2144
+ {"current_steps": 2144, "total_steps": 2148, "loss": 0.2254, "lr": 1.650873000258457e-10, "epoch": 2.993257382004185, "percentage": 99.81, "elapsed_time": "4:59:21", "remaining_time": "0:00:33"}
2145
+ {"current_steps": 2145, "total_steps": 2148, "loss": 0.2305, "lr": 1.0565608132728778e-10, "epoch": 2.9946524064171123, "percentage": 99.86, "elapsed_time": "4:59:32", "remaining_time": "0:00:25"}
2146
+ {"current_steps": 2146, "total_steps": 2148, "loss": 0.2517, "lr": 5.943163732036183e-11, "epoch": 2.9960474308300395, "percentage": 99.91, "elapsed_time": "4:59:39", "remaining_time": "0:00:16"}
2147
+ {"current_steps": 2147, "total_steps": 2148, "loss": 0.2434, "lr": 2.6414090102400147e-11, "epoch": 2.997442455242967, "percentage": 99.95, "elapsed_time": "4:59:47", "remaining_time": "0:00:08"}
2148
+ {"current_steps": 2148, "total_steps": 2148, "loss": 0.2413, "lr": 6.6035268864173e-12, "epoch": 2.998837479655894, "percentage": 100.0, "elapsed_time": "4:59:54", "remaining_time": "0:00:00"}
2149
+ {"current_steps": 2148, "total_steps": 2148, "epoch": 2.998837479655894, "percentage": 100.0, "elapsed_time": "5:01:39", "remaining_time": "0:00:00"}