|
{"current_steps": 1, "total_steps": 100, "loss": 0.063, "lr": 1e-05, "epoch": 0.048484848484848485, "percentage": 1.0, "elapsed_time": "0:00:27", "remaining_time": "0:45:13"} |
|
{"current_steps": 2, "total_steps": 100, "loss": 0.0607, "lr": 2e-05, "epoch": 0.09696969696969697, "percentage": 2.0, "elapsed_time": "0:00:45", "remaining_time": "0:37:02"} |
|
{"current_steps": 3, "total_steps": 100, "loss": 0.0615, "lr": 3e-05, "epoch": 0.14545454545454545, "percentage": 3.0, "elapsed_time": "0:01:04", "remaining_time": "0:34:46"} |
|
{"current_steps": 4, "total_steps": 100, "loss": 0.0504, "lr": 4e-05, "epoch": 0.19393939393939394, "percentage": 4.0, "elapsed_time": "0:01:25", "remaining_time": "0:34:03"} |
|
{"current_steps": 5, "total_steps": 100, "loss": 0.0395, "lr": 5e-05, "epoch": 0.24242424242424243, "percentage": 5.0, "elapsed_time": "0:01:43", "remaining_time": "0:32:37"} |
|
{"current_steps": 5, "total_steps": 100, "eval_loss": 0.04326783865690231, "epoch": 0.24242424242424243, "percentage": 5.0, "elapsed_time": "0:01:54", "remaining_time": "0:36:13"} |
|
{"current_steps": 6, "total_steps": 100, "loss": 0.0419, "lr": 6e-05, "epoch": 0.2909090909090909, "percentage": 6.0, "elapsed_time": "0:02:12", "remaining_time": "0:34:37"} |
|
{"current_steps": 7, "total_steps": 100, "loss": 0.0381, "lr": 7e-05, "epoch": 0.3393939393939394, "percentage": 7.0, "elapsed_time": "0:02:35", "remaining_time": "0:34:24"} |
|
{"current_steps": 8, "total_steps": 100, "loss": 0.0341, "lr": 8e-05, "epoch": 0.3878787878787879, "percentage": 8.0, "elapsed_time": "0:02:52", "remaining_time": "0:33:09"} |
|
{"current_steps": 9, "total_steps": 100, "loss": 0.0345, "lr": 9e-05, "epoch": 0.43636363636363634, "percentage": 9.0, "elapsed_time": "0:03:10", "remaining_time": "0:32:10"} |
|
{"current_steps": 10, "total_steps": 100, "loss": 0.0324, "lr": 0.0001, "epoch": 0.48484848484848486, "percentage": 10.0, "elapsed_time": "0:03:28", "remaining_time": "0:31:13"} |
|
{"current_steps": 10, "total_steps": 100, "eval_loss": 0.03000650927424431, "epoch": 0.48484848484848486, "percentage": 10.0, "elapsed_time": "0:03:38", "remaining_time": "0:32:47"} |
|
{"current_steps": 11, "total_steps": 100, "loss": 0.0331, "lr": 9.99695413509548e-05, "epoch": 0.5333333333333333, "percentage": 11.0, "elapsed_time": "0:03:56", "remaining_time": "0:31:51"} |
|
{"current_steps": 12, "total_steps": 100, "loss": 0.029, "lr": 9.987820251299122e-05, "epoch": 0.5818181818181818, "percentage": 12.0, "elapsed_time": "0:04:14", "remaining_time": "0:31:03"} |
|
{"current_steps": 13, "total_steps": 100, "loss": 0.0257, "lr": 9.972609476841367e-05, "epoch": 0.6303030303030303, "percentage": 13.0, "elapsed_time": "0:04:32", "remaining_time": "0:30:20"} |
|
{"current_steps": 14, "total_steps": 100, "loss": 0.0215, "lr": 9.951340343707852e-05, "epoch": 0.6787878787878788, "percentage": 14.0, "elapsed_time": "0:04:48", "remaining_time": "0:29:32"} |
|
{"current_steps": 15, "total_steps": 100, "loss": 0.024, "lr": 9.924038765061042e-05, "epoch": 0.7272727272727273, "percentage": 15.0, "elapsed_time": "0:05:06", "remaining_time": "0:28:56"} |
|
{"current_steps": 15, "total_steps": 100, "eval_loss": 0.024439169093966484, "epoch": 0.7272727272727273, "percentage": 15.0, "elapsed_time": "0:05:16", "remaining_time": "0:29:54"} |
|
{"current_steps": 16, "total_steps": 100, "loss": 0.0321, "lr": 9.890738003669029e-05, "epoch": 0.7757575757575758, "percentage": 16.0, "elapsed_time": "0:05:34", "remaining_time": "0:29:17"} |
|
{"current_steps": 17, "total_steps": 100, "loss": 0.0281, "lr": 9.851478631379982e-05, "epoch": 0.8242424242424242, "percentage": 17.0, "elapsed_time": "0:05:52", "remaining_time": "0:28:41"} |
|
{"current_steps": 18, "total_steps": 100, "loss": 0.0202, "lr": 9.806308479691595e-05, "epoch": 0.8727272727272727, "percentage": 18.0, "elapsed_time": "0:06:11", "remaining_time": "0:28:11"} |
|
{"current_steps": 19, "total_steps": 100, "loss": 0.0206, "lr": 9.755282581475769e-05, "epoch": 0.9212121212121213, "percentage": 19.0, "elapsed_time": "0:06:28", "remaining_time": "0:27:35"} |
|
{"current_steps": 20, "total_steps": 100, "loss": 0.0189, "lr": 9.698463103929542e-05, "epoch": 0.9696969696969697, "percentage": 20.0, "elapsed_time": "0:06:45", "remaining_time": "0:27:01"} |
|
{"current_steps": 20, "total_steps": 100, "eval_loss": 0.0212231557816267, "epoch": 0.9696969696969697, "percentage": 20.0, "elapsed_time": "0:06:55", "remaining_time": "0:27:43"} |
|
{"current_steps": 21, "total_steps": 100, "loss": 0.0317, "lr": 9.635919272833938e-05, "epoch": 1.0363636363636364, "percentage": 21.0, "elapsed_time": "0:07:17", "remaining_time": "0:27:25"} |
|
{"current_steps": 22, "total_steps": 100, "loss": 0.019, "lr": 9.567727288213005e-05, "epoch": 1.084848484848485, "percentage": 22.0, "elapsed_time": "0:07:34", "remaining_time": "0:26:52"} |
|
{"current_steps": 23, "total_steps": 100, "loss": 0.019, "lr": 9.493970231495835e-05, "epoch": 1.1333333333333333, "percentage": 23.0, "elapsed_time": "0:07:52", "remaining_time": "0:26:22"} |
|
{"current_steps": 24, "total_steps": 100, "loss": 0.0181, "lr": 9.414737964294636e-05, "epoch": 1.1818181818181819, "percentage": 24.0, "elapsed_time": "0:08:10", "remaining_time": "0:25:53"} |
|
{"current_steps": 25, "total_steps": 100, "loss": 0.0171, "lr": 9.330127018922194e-05, "epoch": 1.2303030303030302, "percentage": 25.0, "elapsed_time": "0:08:27", "remaining_time": "0:25:23"} |
|
{"current_steps": 25, "total_steps": 100, "eval_loss": 0.019027845934033394, "epoch": 1.2303030303030302, "percentage": 25.0, "elapsed_time": "0:08:38", "remaining_time": "0:25:54"} |
|
{"current_steps": 26, "total_steps": 100, "loss": 0.0182, "lr": 9.24024048078213e-05, "epoch": 1.2787878787878788, "percentage": 26.0, "elapsed_time": "0:08:55", "remaining_time": "0:25:24"} |
|
{"current_steps": 27, "total_steps": 100, "loss": 0.0163, "lr": 9.145187862775209e-05, "epoch": 1.3272727272727272, "percentage": 27.0, "elapsed_time": "0:09:13", "remaining_time": "0:24:56"} |
|
{"current_steps": 28, "total_steps": 100, "loss": 0.0177, "lr": 9.045084971874738e-05, "epoch": 1.3757575757575757, "percentage": 28.0, "elapsed_time": "0:09:31", "remaining_time": "0:24:28"} |
|
{"current_steps": 29, "total_steps": 100, "loss": 0.014, "lr": 8.940053768033609e-05, "epoch": 1.4242424242424243, "percentage": 29.0, "elapsed_time": "0:09:47", "remaining_time": "0:23:59"} |
|
{"current_steps": 30, "total_steps": 100, "loss": 0.0146, "lr": 8.83022221559489e-05, "epoch": 1.4727272727272727, "percentage": 30.0, "elapsed_time": "0:10:05", "remaining_time": "0:23:32"} |
|
{"current_steps": 30, "total_steps": 100, "eval_loss": 0.01733844168484211, "epoch": 1.4727272727272727, "percentage": 30.0, "elapsed_time": "0:10:15", "remaining_time": "0:23:56"} |
|
{"current_steps": 31, "total_steps": 100, "loss": 0.017, "lr": 8.715724127386972e-05, "epoch": 1.5212121212121212, "percentage": 31.0, "elapsed_time": "0:10:33", "remaining_time": "0:23:30"} |
|
{"current_steps": 32, "total_steps": 100, "loss": 0.0155, "lr": 8.596699001693255e-05, "epoch": 1.5696969696969698, "percentage": 32.0, "elapsed_time": "0:10:51", "remaining_time": "0:23:04"} |
|
{"current_steps": 33, "total_steps": 100, "loss": 0.0157, "lr": 8.473291852294987e-05, "epoch": 1.6181818181818182, "percentage": 33.0, "elapsed_time": "0:11:08", "remaining_time": "0:22:37"} |
|
{"current_steps": 34, "total_steps": 100, "loss": 0.0167, "lr": 8.345653031794292e-05, "epoch": 1.6666666666666665, "percentage": 34.0, "elapsed_time": "0:11:26", "remaining_time": "0:22:12"} |
|
{"current_steps": 35, "total_steps": 100, "loss": 0.0144, "lr": 8.213938048432697e-05, "epoch": 1.7151515151515153, "percentage": 35.0, "elapsed_time": "0:11:44", "remaining_time": "0:21:48"} |
|
{"current_steps": 35, "total_steps": 100, "eval_loss": 0.016134196892380714, "epoch": 1.7151515151515153, "percentage": 35.0, "elapsed_time": "0:11:54", "remaining_time": "0:22:07"} |
|
{"current_steps": 36, "total_steps": 100, "loss": 0.0162, "lr": 8.07830737662829e-05, "epoch": 1.7636363636363637, "percentage": 36.0, "elapsed_time": "0:12:12", "remaining_time": "0:21:41"} |
|
{"current_steps": 37, "total_steps": 100, "loss": 0.0194, "lr": 7.938926261462366e-05, "epoch": 1.812121212121212, "percentage": 37.0, "elapsed_time": "0:12:29", "remaining_time": "0:21:16"} |
|
{"current_steps": 38, "total_steps": 100, "loss": 0.0154, "lr": 7.795964517353735e-05, "epoch": 1.8606060606060606, "percentage": 38.0, "elapsed_time": "0:12:46", "remaining_time": "0:20:50"} |
|
{"current_steps": 39, "total_steps": 100, "loss": 0.0134, "lr": 7.649596321166024e-05, "epoch": 1.9090909090909092, "percentage": 39.0, "elapsed_time": "0:13:03", "remaining_time": "0:20:25"} |
|
{"current_steps": 40, "total_steps": 100, "loss": 0.0104, "lr": 7.500000000000001e-05, "epoch": 1.9575757575757575, "percentage": 40.0, "elapsed_time": "0:13:21", "remaining_time": "0:20:01"} |
|
{"current_steps": 40, "total_steps": 100, "eval_loss": 0.015456685796380043, "epoch": 1.9575757575757575, "percentage": 40.0, "elapsed_time": "0:13:31", "remaining_time": "0:20:17"} |
|
{"current_steps": 41, "total_steps": 100, "loss": 0.0277, "lr": 7.347357813929454e-05, "epoch": 2.0242424242424244, "percentage": 41.0, "elapsed_time": "0:13:49", "remaining_time": "0:19:54"} |
|
{"current_steps": 42, "total_steps": 100, "loss": 0.012, "lr": 7.191855733945387e-05, "epoch": 2.0727272727272728, "percentage": 42.0, "elapsed_time": "0:14:07", "remaining_time": "0:19:30"} |
|
{"current_steps": 43, "total_steps": 100, "loss": 0.0147, "lr": 7.033683215379002e-05, "epoch": 2.121212121212121, "percentage": 43.0, "elapsed_time": "0:14:25", "remaining_time": "0:19:06"} |
|
{"current_steps": 44, "total_steps": 100, "loss": 0.014, "lr": 6.873032967079561e-05, "epoch": 2.16969696969697, "percentage": 44.0, "elapsed_time": "0:14:41", "remaining_time": "0:18:42"} |
|
{"current_steps": 45, "total_steps": 100, "loss": 0.0143, "lr": 6.710100716628344e-05, "epoch": 2.2181818181818183, "percentage": 45.0, "elapsed_time": "0:14:59", "remaining_time": "0:18:19"} |
|
{"current_steps": 45, "total_steps": 100, "eval_loss": 0.01516613457351923, "epoch": 2.2181818181818183, "percentage": 45.0, "elapsed_time": "0:15:09", "remaining_time": "0:18:31"} |
|
{"current_steps": 46, "total_steps": 100, "loss": 0.0126, "lr": 6.545084971874738e-05, "epoch": 2.2666666666666666, "percentage": 46.0, "elapsed_time": "0:15:27", "remaining_time": "0:18:08"} |
|
{"current_steps": 47, "total_steps": 100, "loss": 0.0118, "lr": 6.378186779084995e-05, "epoch": 2.315151515151515, "percentage": 47.0, "elapsed_time": "0:15:45", "remaining_time": "0:17:46"} |
|
{"current_steps": 48, "total_steps": 100, "loss": 0.0121, "lr": 6.209609477998338e-05, "epoch": 2.3636363636363638, "percentage": 48.0, "elapsed_time": "0:16:03", "remaining_time": "0:17:23"} |
|
{"current_steps": 49, "total_steps": 100, "loss": 0.0096, "lr": 6.0395584540887963e-05, "epoch": 2.412121212121212, "percentage": 49.0, "elapsed_time": "0:16:20", "remaining_time": "0:17:00"} |
|
{"current_steps": 50, "total_steps": 100, "loss": 0.0117, "lr": 5.868240888334653e-05, "epoch": 2.4606060606060605, "percentage": 50.0, "elapsed_time": "0:16:38", "remaining_time": "0:16:38"} |
|
{"current_steps": 50, "total_steps": 100, "eval_loss": 0.014072530902922153, "epoch": 2.4606060606060605, "percentage": 50.0, "elapsed_time": "0:16:48", "remaining_time": "0:16:48"} |
|
{"current_steps": 51, "total_steps": 100, "loss": 0.0139, "lr": 5.695865504800327e-05, "epoch": 2.509090909090909, "percentage": 51.0, "elapsed_time": "0:17:12", "remaining_time": "0:16:32"} |
|
{"current_steps": 52, "total_steps": 100, "loss": 0.0099, "lr": 5.522642316338268e-05, "epoch": 2.5575757575757576, "percentage": 52.0, "elapsed_time": "0:17:30", "remaining_time": "0:16:09"} |
|
{"current_steps": 53, "total_steps": 100, "loss": 0.013, "lr": 5.348782368720626e-05, "epoch": 2.606060606060606, "percentage": 53.0, "elapsed_time": "0:17:49", "remaining_time": "0:15:47"} |
|
{"current_steps": 54, "total_steps": 100, "loss": 0.0093, "lr": 5.174497483512506e-05, "epoch": 2.6545454545454543, "percentage": 54.0, "elapsed_time": "0:18:06", "remaining_time": "0:15:25"} |
|
{"current_steps": 55, "total_steps": 100, "loss": 0.015, "lr": 5e-05, "epoch": 2.703030303030303, "percentage": 55.0, "elapsed_time": "0:18:24", "remaining_time": "0:15:03"} |
|
{"current_steps": 55, "total_steps": 100, "eval_loss": 0.013632840476930141, "epoch": 2.703030303030303, "percentage": 55.0, "elapsed_time": "0:18:34", "remaining_time": "0:15:12"} |
|
{"current_steps": 56, "total_steps": 100, "loss": 0.0109, "lr": 4.825502516487497e-05, "epoch": 2.7515151515151515, "percentage": 56.0, "elapsed_time": "0:18:52", "remaining_time": "0:14:49"} |
|
{"current_steps": 57, "total_steps": 100, "loss": 0.0104, "lr": 4.6512176312793736e-05, "epoch": 2.8, "percentage": 57.0, "elapsed_time": "0:19:10", "remaining_time": "0:14:27"} |
|
{"current_steps": 58, "total_steps": 100, "loss": 0.0097, "lr": 4.477357683661734e-05, "epoch": 2.8484848484848486, "percentage": 58.0, "elapsed_time": "0:19:26", "remaining_time": "0:14:04"} |
|
{"current_steps": 59, "total_steps": 100, "loss": 0.0108, "lr": 4.3041344951996746e-05, "epoch": 2.896969696969697, "percentage": 59.0, "elapsed_time": "0:19:43", "remaining_time": "0:13:42"} |
|
{"current_steps": 60, "total_steps": 100, "loss": 0.0092, "lr": 4.131759111665349e-05, "epoch": 2.9454545454545453, "percentage": 60.0, "elapsed_time": "0:20:01", "remaining_time": "0:13:20"} |
|
{"current_steps": 60, "total_steps": 100, "eval_loss": 0.013053460977971554, "epoch": 2.9454545454545453, "percentage": 60.0, "elapsed_time": "0:20:11", "remaining_time": "0:13:27"} |
|
{"current_steps": 61, "total_steps": 100, "loss": 0.0172, "lr": 3.960441545911204e-05, "epoch": 3.012121212121212, "percentage": 61.0, "elapsed_time": "0:20:29", "remaining_time": "0:13:06"} |
|
{"current_steps": 62, "total_steps": 100, "loss": 0.008, "lr": 3.790390522001662e-05, "epoch": 3.0606060606060606, "percentage": 62.0, "elapsed_time": "0:20:47", "remaining_time": "0:12:44"} |
|
{"current_steps": 63, "total_steps": 100, "loss": 0.0121, "lr": 3.6218132209150045e-05, "epoch": 3.109090909090909, "percentage": 63.0, "elapsed_time": "0:21:05", "remaining_time": "0:12:23"} |
|
{"current_steps": 64, "total_steps": 100, "loss": 0.008, "lr": 3.4549150281252636e-05, "epoch": 3.1575757575757577, "percentage": 64.0, "elapsed_time": "0:21:22", "remaining_time": "0:12:01"} |
|
{"current_steps": 65, "total_steps": 100, "loss": 0.008, "lr": 3.289899283371657e-05, "epoch": 3.206060606060606, "percentage": 65.0, "elapsed_time": "0:21:40", "remaining_time": "0:11:40"} |
|
{"current_steps": 65, "total_steps": 100, "eval_loss": 0.012713730335235596, "epoch": 3.206060606060606, "percentage": 65.0, "elapsed_time": "0:21:50", "remaining_time": "0:11:45"} |
|
{"current_steps": 66, "total_steps": 100, "loss": 0.0096, "lr": 3.12696703292044e-05, "epoch": 3.2545454545454544, "percentage": 66.0, "elapsed_time": "0:22:08", "remaining_time": "0:11:24"} |
|
{"current_steps": 67, "total_steps": 100, "loss": 0.0071, "lr": 2.9663167846209998e-05, "epoch": 3.303030303030303, "percentage": 67.0, "elapsed_time": "0:22:26", "remaining_time": "0:11:03"} |
|
{"current_steps": 68, "total_steps": 100, "loss": 0.0092, "lr": 2.8081442660546125e-05, "epoch": 3.3515151515151516, "percentage": 68.0, "elapsed_time": "0:22:44", "remaining_time": "0:10:41"} |
|
{"current_steps": 69, "total_steps": 100, "loss": 0.009, "lr": 2.6526421860705473e-05, "epoch": 3.4, "percentage": 69.0, "elapsed_time": "0:23:01", "remaining_time": "0:10:20"} |
|
{"current_steps": 70, "total_steps": 100, "loss": 0.0109, "lr": 2.500000000000001e-05, "epoch": 3.4484848484848483, "percentage": 70.0, "elapsed_time": "0:23:19", "remaining_time": "0:09:59"} |
|
{"current_steps": 70, "total_steps": 100, "eval_loss": 0.012468294240534306, "epoch": 3.4484848484848483, "percentage": 70.0, "elapsed_time": "0:23:29", "remaining_time": "0:10:04"} |
|
{"current_steps": 71, "total_steps": 100, "loss": 0.0123, "lr": 2.350403678833976e-05, "epoch": 3.496969696969697, "percentage": 71.0, "elapsed_time": "0:23:47", "remaining_time": "0:09:43"} |
|
{"current_steps": 72, "total_steps": 100, "loss": 0.0072, "lr": 2.2040354826462668e-05, "epoch": 3.5454545454545454, "percentage": 72.0, "elapsed_time": "0:24:05", "remaining_time": "0:09:22"} |
|
{"current_steps": 73, "total_steps": 100, "loss": 0.009, "lr": 2.061073738537635e-05, "epoch": 3.5939393939393938, "percentage": 73.0, "elapsed_time": "0:24:23", "remaining_time": "0:09:01"} |
|
{"current_steps": 74, "total_steps": 100, "loss": 0.0078, "lr": 1.9216926233717085e-05, "epoch": 3.6424242424242426, "percentage": 74.0, "elapsed_time": "0:24:41", "remaining_time": "0:08:40"} |
|
{"current_steps": 75, "total_steps": 100, "loss": 0.0085, "lr": 1.7860619515673033e-05, "epoch": 3.690909090909091, "percentage": 75.0, "elapsed_time": "0:24:58", "remaining_time": "0:08:19"} |
|
{"current_steps": 75, "total_steps": 100, "eval_loss": 0.012197648175060749, "epoch": 3.690909090909091, "percentage": 75.0, "elapsed_time": "0:25:08", "remaining_time": "0:08:22"} |
|
{"current_steps": 76, "total_steps": 100, "loss": 0.0089, "lr": 1.6543469682057106e-05, "epoch": 3.7393939393939393, "percentage": 76.0, "elapsed_time": "0:25:26", "remaining_time": "0:08:02"} |
|
{"current_steps": 77, "total_steps": 100, "loss": 0.0127, "lr": 1.526708147705013e-05, "epoch": 3.787878787878788, "percentage": 77.0, "elapsed_time": "0:25:44", "remaining_time": "0:07:41"} |
|
{"current_steps": 78, "total_steps": 100, "loss": 0.0085, "lr": 1.4033009983067452e-05, "epoch": 3.8363636363636364, "percentage": 78.0, "elapsed_time": "0:26:01", "remaining_time": "0:07:20"} |
|
{"current_steps": 79, "total_steps": 100, "loss": 0.0079, "lr": 1.2842758726130283e-05, "epoch": 3.8848484848484848, "percentage": 79.0, "elapsed_time": "0:26:18", "remaining_time": "0:06:59"} |
|
{"current_steps": 80, "total_steps": 100, "loss": 0.0089, "lr": 1.1697777844051105e-05, "epoch": 3.9333333333333336, "percentage": 80.0, "elapsed_time": "0:26:36", "remaining_time": "0:06:39"} |
|
{"current_steps": 80, "total_steps": 100, "eval_loss": 0.011956109665334225, "epoch": 3.9333333333333336, "percentage": 80.0, "elapsed_time": "0:26:47", "remaining_time": "0:06:41"} |
|
{"current_steps": 81, "total_steps": 100, "loss": 0.013, "lr": 1.0599462319663905e-05, "epoch": 3.981818181818182, "percentage": 81.0, "elapsed_time": "0:27:03", "remaining_time": "0:06:20"} |
|
{"current_steps": 82, "total_steps": 100, "loss": 0.0092, "lr": 9.549150281252633e-06, "epoch": 4.048484848484849, "percentage": 82.0, "elapsed_time": "0:27:21", "remaining_time": "0:06:00"} |
|
{"current_steps": 83, "total_steps": 100, "loss": 0.0064, "lr": 8.548121372247918e-06, "epoch": 4.096969696969697, "percentage": 83.0, "elapsed_time": "0:27:39", "remaining_time": "0:05:39"} |
|
{"current_steps": 84, "total_steps": 100, "loss": 0.0086, "lr": 7.597595192178702e-06, "epoch": 4.1454545454545455, "percentage": 84.0, "elapsed_time": "0:27:57", "remaining_time": "0:05:19"} |
|
{"current_steps": 85, "total_steps": 100, "loss": 0.0074, "lr": 6.698729810778065e-06, "epoch": 4.193939393939394, "percentage": 85.0, "elapsed_time": "0:28:14", "remaining_time": "0:04:59"} |
|
{"current_steps": 85, "total_steps": 100, "eval_loss": 0.011830544099211693, "epoch": 4.193939393939394, "percentage": 85.0, "elapsed_time": "0:28:24", "remaining_time": "0:05:00"} |
|
{"current_steps": 86, "total_steps": 100, "loss": 0.009, "lr": 5.852620357053651e-06, "epoch": 4.242424242424242, "percentage": 86.0, "elapsed_time": "0:28:42", "remaining_time": "0:04:40"} |
|
{"current_steps": 87, "total_steps": 100, "loss": 0.0074, "lr": 5.060297685041659e-06, "epoch": 4.290909090909091, "percentage": 87.0, "elapsed_time": "0:28:59", "remaining_time": "0:04:19"} |
|
{"current_steps": 88, "total_steps": 100, "loss": 0.0094, "lr": 4.322727117869951e-06, "epoch": 4.33939393939394, "percentage": 88.0, "elapsed_time": "0:29:18", "remaining_time": "0:03:59"} |
|
{"current_steps": 89, "total_steps": 100, "loss": 0.0084, "lr": 3.6408072716606346e-06, "epoch": 4.387878787878788, "percentage": 89.0, "elapsed_time": "0:29:35", "remaining_time": "0:03:39"} |
|
{"current_steps": 90, "total_steps": 100, "loss": 0.0074, "lr": 3.0153689607045845e-06, "epoch": 4.4363636363636365, "percentage": 90.0, "elapsed_time": "0:29:53", "remaining_time": "0:03:19"} |
|
{"current_steps": 90, "total_steps": 100, "eval_loss": 0.011814383789896965, "epoch": 4.4363636363636365, "percentage": 90.0, "elapsed_time": "0:30:03", "remaining_time": "0:03:20"} |
|
{"current_steps": 91, "total_steps": 100, "loss": 0.0087, "lr": 2.4471741852423237e-06, "epoch": 4.484848484848484, "percentage": 91.0, "elapsed_time": "0:30:21", "remaining_time": "0:03:00"} |
|
{"current_steps": 92, "total_steps": 100, "loss": 0.0073, "lr": 1.9369152030840556e-06, "epoch": 4.533333333333333, "percentage": 92.0, "elapsed_time": "0:30:38", "remaining_time": "0:02:39"} |
|
{"current_steps": 93, "total_steps": 100, "loss": 0.0075, "lr": 1.4852136862001764e-06, "epoch": 4.581818181818182, "percentage": 93.0, "elapsed_time": "0:30:56", "remaining_time": "0:02:19"} |
|
{"current_steps": 94, "total_steps": 100, "loss": 0.0071, "lr": 1.0926199633097157e-06, "epoch": 4.63030303030303, "percentage": 94.0, "elapsed_time": "0:31:13", "remaining_time": "0:01:59"} |
|
{"current_steps": 95, "total_steps": 100, "loss": 0.0066, "lr": 7.596123493895991e-07, "epoch": 4.678787878787879, "percentage": 95.0, "elapsed_time": "0:31:31", "remaining_time": "0:01:39"} |
|
{"current_steps": 95, "total_steps": 100, "eval_loss": 0.011838787235319614, "epoch": 4.678787878787879, "percentage": 95.0, "elapsed_time": "0:31:41", "remaining_time": "0:01:40"} |
|
{"current_steps": 96, "total_steps": 100, "loss": 0.0063, "lr": 4.865965629214819e-07, "epoch": 4.7272727272727275, "percentage": 96.0, "elapsed_time": "0:31:59", "remaining_time": "0:01:19"} |
|
{"current_steps": 97, "total_steps": 100, "loss": 0.0076, "lr": 2.7390523158633554e-07, "epoch": 4.775757575757575, "percentage": 97.0, "elapsed_time": "0:32:17", "remaining_time": "0:00:59"} |
|
{"current_steps": 98, "total_steps": 100, "loss": 0.0103, "lr": 1.2179748700879012e-07, "epoch": 4.824242424242424, "percentage": 98.0, "elapsed_time": "0:32:35", "remaining_time": "0:00:39"} |
|
{"current_steps": 99, "total_steps": 100, "loss": 0.0057, "lr": 3.04586490452119e-08, "epoch": 4.872727272727273, "percentage": 99.0, "elapsed_time": "0:32:52", "remaining_time": "0:00:19"} |
|
{"current_steps": 100, "total_steps": 100, "loss": 0.0065, "lr": 0.0, "epoch": 4.921212121212121, "percentage": 100.0, "elapsed_time": "0:33:10", "remaining_time": "0:00:00"} |
|
{"current_steps": 100, "total_steps": 100, "eval_loss": 0.011823242530226707, "epoch": 4.921212121212121, "percentage": 100.0, "elapsed_time": "0:33:20", "remaining_time": "0:00:00"} |
|
{"current_steps": 100, "total_steps": 100, "epoch": 4.921212121212121, "percentage": 100.0, "elapsed_time": "0:33:27", "remaining_time": "0:00:00"} |
|
|