[ { "train": { "lr": 9.875093667547056e-05, "grad_norm": Infinity, "grad_scale": 16646.144, "ce": 3.3427528912723066, "ppl": 33.995531789183616, "ce_q1": 2.6098834899961947, "ppl_q1": 16.068788988828658, "ce_q2": 3.199262778028846, "ppl_q2": 29.528365777134894, "ce_q3": 3.5988389488831163, "ppl_q3": 44.14542267882824, "ce_q4": 3.963026348605752, "ppl_q4": 65.16646182084084, "duration": 1218.7015924453735 }, "valid": { "ce": 2.3822669982910156, "ppl": 10.829425811767578, "ce_q1": 1.7792327404022217, "ppl_q1": 5.925308704376221, "ce_q2": 2.184326171875, "ppl_q2": 8.884659767150879, "ce_q3": 2.657968759536743, "ppl_q3": 14.267280578613281, "ce_q4": 2.9075403213500977, "ppl_q4": 18.311702728271484, "duration": 12.130462884902954 } }, { "train": { "lr": 9.441882233514132e-05, "grad_norm": 3.1516987761110067, "grad_scale": 16384.0, "ce": 2.7866730407330906, "ppl": 18.343669335007668, "ce_q1": 1.960708865690045, "ppl_q1": 7.67068022608757, "ce_q2": 2.627964652788825, "ppl_q2": 15.557403705596924, "ce_q3": 3.0775233307108283, "ppl_q3": 24.984127308368684, "ce_q4": 3.4804952954860635, "ppl_q4": 38.55263476216793, "duration": 1236.4078493118286 }, "valid": { "ce": 2.0738468170166016, "ppl": 7.955367088317871, "ce_q1": 1.3967729806900024, "ppl_q1": 4.042134761810303, "ce_q2": 1.8793870210647583, "ppl_q2": 6.549488544464111, "ce_q3": 2.3681416511535645, "ppl_q3": 10.677531242370605, "ce_q4": 2.65108585357666, "ppl_q4": 14.169415473937988, "duration": 16.665278434753418 } }, { "train": { "lr": 8.528177696195438e-05, "grad_norm": 2.5766738409250975, "grad_scale": 32604.16, "ce": 2.456978987471317, "ppl": 13.047622307181358, "ce_q1": 1.6183160656695255, "ppl_q1": 5.345393500924111, "ce_q2": 2.2931290368936024, "ppl_q2": 10.987915291905404, "ce_q3": 2.7538199657049116, "ppl_q3": 17.96441888523102, "ce_q4": 3.1626508837685106, "ppl_q4": 27.951965188264847, "duration": 1225.9593234062195 }, "valid": { "ce": 1.8575392961502075, "ppl": 6.407949447631836, "ce_q1": 1.146897554397583, "ppl_q1": 3.1484100818634033, "ce_q2": 1.676759123802185, "ppl_q2": 5.3481950759887695, "ce_q3": 2.1644644737243652, "ppl_q3": 8.709936141967773, "ce_q4": 2.4420361518859863, "ppl_q4": 11.49642562866211, "duration": 14.441946506500244 } }, { "train": { "lr": 7.268561864754141e-05, "grad_norm": 2.390021135300398, "grad_scale": 32768.0, "ce": 2.243085328816436, "ppl": 10.385881650805473, "ce_q1": 1.4056685628239065, "ppl_q1": 4.270641067743301, "ce_q2": 2.0750045562880115, "ppl_q2": 8.697048548817635, "ce_q3": 2.539443302554544, "ppl_q3": 14.286545807361604, "ce_q4": 2.9522249091272244, "ppl_q4": 22.33064289879799, "duration": 1231.9223251342773 }, "valid": { "ce": 1.6338310241699219, "ppl": 5.123465538024902, "ce_q1": 0.9277531504631042, "ppl_q1": 2.5288209915161133, "ce_q2": 1.4565773010253906, "ppl_q2": 4.2912468910217285, "ce_q3": 1.9195992946624756, "ppl_q3": 6.818225860595703, "ce_q4": 2.2313942909240723, "ppl_q4": 9.31284236907959, "duration": 12.240105867385864 } }, { "train": { "lr": 5.7865306001898234e-05, "grad_norm": 2.3538931381218133, "grad_scale": 65208.32, "ce": 2.0580586477583274, "ppl": 8.52094031894207, "ce_q1": 1.2490628082135227, "ppl_q1": 3.6193587613105773, "ce_q2": 1.8907092852091882, "ppl_q2": 7.142661284089089, "ce_q3": 2.34134632987684, "ppl_q3": 11.545488672852516, "ce_q4": 2.751116160790931, "ppl_q4": 17.986016420960425, "duration": 1227.4011478424072 }, "valid": { "ce": 1.4793100357055664, "ppl": 4.389915466308594, "ce_q1": 0.7983056902885437, "ppl_q1": 2.221773386001587, "ce_q2": 1.30791437625885, "ppl_q2": 3.6984519958496094, "ce_q3": 1.7428033351898193, "ppl_q3": 5.7133378982543945, "ce_q4": 2.068216562271118, "ppl_q4": 7.910702228546143, "duration": 12.669232368469238 } } ]