diff --git "a/training_metrics.json" "b/training_metrics.json" new file mode 100644--- /dev/null +++ "b/training_metrics.json" @@ -0,0 +1,7502 @@ +[ + { + "loss": 5.689858436584473, + "ce_loss": 5.689294815063477, + "load_loss": 0.05635414645075798, + "step": 0 + }, + { + "loss": 5.719565391540527, + "ce_loss": 5.7192535400390625, + "load_loss": 0.0311886053532362, + "step": 0 + }, + { + "loss": 5.69443941116333, + "ce_loss": 5.693742275238037, + "load_loss": 0.06971193104982376, + "step": 0 + }, + { + "loss": 5.714108467102051, + "ce_loss": 5.713362216949463, + "load_loss": 0.07464882731437683, + "step": 0 + }, + { + "loss": 5.6943840980529785, + "ce_loss": 5.693857192993164, + "load_loss": 0.05267912149429321, + "step": 0 + }, + { + "loss": 5.718689441680908, + "ce_loss": 5.7181925773620605, + "load_loss": 0.04967620223760605, + "step": 0 + }, + { + "loss": 5.661374568939209, + "ce_loss": 5.660612106323242, + "load_loss": 0.07623668015003204, + "step": 0 + }, + { + "loss": 5.713210582733154, + "ce_loss": 5.71274471282959, + "load_loss": 0.046608179807662964, + "step": 0 + }, + { + "loss": 5.644876003265381, + "ce_loss": 5.644097328186035, + "load_loss": 0.07787863910198212, + "step": 0 + }, + { + "loss": 5.71357536315918, + "ce_loss": 5.712971210479736, + "load_loss": 0.0604049488902092, + "step": 0 + }, + { + "loss": 5.7391533851623535, + "ce_loss": 5.738358974456787, + "load_loss": 0.07946363091468811, + "step": 0 + }, + { + "loss": 5.734140396118164, + "ce_loss": 5.733516216278076, + "load_loss": 0.06240258365869522, + "step": 0 + }, + { + "loss": 5.7183990478515625, + "ce_loss": 5.717578887939453, + "load_loss": 0.08203428983688354, + "step": 0 + }, + { + "loss": 5.717033386230469, + "ce_loss": 5.716202259063721, + "load_loss": 0.0831233412027359, + "step": 0 + }, + { + "loss": 5.708643913269043, + "ce_loss": 5.707900047302246, + "load_loss": 0.07436925917863846, + "step": 0 + }, + { + "loss": 5.688057899475098, + "ce_loss": 5.687402248382568, + "load_loss": 0.06556539237499237, + "step": 0 + }, + { + "loss": 5.722081661224365, + "ce_loss": 5.721498966217041, + "load_loss": 0.05828619748353958, + "step": 0 + }, + { + "loss": 5.670475959777832, + "ce_loss": 5.669703960418701, + "load_loss": 0.07720319926738739, + "step": 0 + }, + { + "loss": 5.7430853843688965, + "ce_loss": 5.741848945617676, + "load_loss": 0.12364812940359116, + "step": 0 + }, + { + "loss": 5.699087619781494, + "ce_loss": 5.698500156402588, + "load_loss": 0.058748625218868256, + "step": 0 + }, + { + "loss": 5.7084197998046875, + "ce_loss": 5.707733631134033, + "load_loss": 0.06863292306661606, + "step": 0 + }, + { + "loss": 5.711325168609619, + "ce_loss": 5.7108330726623535, + "load_loss": 0.049223825335502625, + "step": 0 + }, + { + "loss": 5.731059551239014, + "ce_loss": 5.730546951293945, + "load_loss": 0.051241569221019745, + "step": 0 + }, + { + "loss": 5.741281032562256, + "ce_loss": 5.740720272064209, + "load_loss": 0.0560736209154129, + "step": 0 + }, + { + "loss": 5.7227959632873535, + "ce_loss": 5.722142219543457, + "load_loss": 0.06537055224180222, + "step": 0 + }, + { + "loss": 5.707277774810791, + "ce_loss": 5.706926345825195, + "load_loss": 0.03516090288758278, + "step": 0 + }, + { + "loss": 5.722303867340088, + "ce_loss": 5.721961498260498, + "load_loss": 0.034251365810632706, + "step": 0 + }, + { + "loss": 5.699742317199707, + "ce_loss": 5.699192523956299, + "load_loss": 0.05498743802309036, + "step": 0 + }, + { + "loss": 5.696236610412598, + "ce_loss": 5.695744037628174, + "load_loss": 0.04925110936164856, + "step": 0 + }, + { + "loss": 5.706628322601318, + "ce_loss": 5.705794811248779, + "load_loss": 0.08334546536207199, + "step": 0 + }, + { + "loss": 5.7205939292907715, + "ce_loss": 5.719974994659424, + "load_loss": 0.06190185621380806, + "step": 0 + }, + { + "loss": 5.746643543243408, + "ce_loss": 5.745938777923584, + "load_loss": 0.07046062499284744, + "step": 0 + }, + { + "loss": 5.734704971313477, + "ce_loss": 5.734246253967285, + "load_loss": 0.045881979167461395, + "step": 0 + }, + { + "loss": 5.694089412689209, + "ce_loss": 5.693714618682861, + "load_loss": 0.03748070448637009, + "step": 0 + }, + { + "loss": 5.696475028991699, + "ce_loss": 5.696158409118652, + "load_loss": 0.03164049983024597, + "step": 0 + }, + { + "loss": 5.711445331573486, + "ce_loss": 5.710980415344238, + "load_loss": 0.04647797346115112, + "step": 0 + }, + { + "loss": 5.71622371673584, + "ce_loss": 5.715688228607178, + "load_loss": 0.05352834239602089, + "step": 0 + }, + { + "loss": 5.722156047821045, + "ce_loss": 5.721581935882568, + "load_loss": 0.057405855506658554, + "step": 0 + }, + { + "loss": 5.682126045227051, + "ce_loss": 5.68113899230957, + "load_loss": 0.09872099757194519, + "step": 0 + }, + { + "loss": 5.710678577423096, + "ce_loss": 5.710114002227783, + "load_loss": 0.0564388744533062, + "step": 0 + }, + { + "loss": 5.716264247894287, + "ce_loss": 5.715885639190674, + "load_loss": 0.037865109741687775, + "step": 0 + }, + { + "loss": 5.69733190536499, + "ce_loss": 5.696606159210205, + "load_loss": 0.0725669339299202, + "step": 0 + }, + { + "loss": 5.721652984619141, + "ce_loss": 5.72122859954834, + "load_loss": 0.04244057089090347, + "step": 0 + }, + { + "loss": 5.650073051452637, + "ce_loss": 5.648885726928711, + "load_loss": 0.11872273683547974, + "step": 0 + }, + { + "loss": 5.717469692230225, + "ce_loss": 5.716835021972656, + "load_loss": 0.06346674263477325, + "step": 0 + }, + { + "loss": 5.73955774307251, + "ce_loss": 5.7390971183776855, + "load_loss": 0.04606389254331589, + "step": 0 + }, + { + "loss": 5.74078369140625, + "ce_loss": 5.740128517150879, + "load_loss": 0.06550076603889465, + "step": 0 + }, + { + "loss": 5.745792388916016, + "ce_loss": 5.745595455169678, + "load_loss": 0.01968579739332199, + "step": 0 + }, + { + "loss": 5.7139997482299805, + "ce_loss": 5.7134480476379395, + "load_loss": 0.05518658086657524, + "step": 0 + }, + { + "loss": 5.6939897537231445, + "ce_loss": 5.693375587463379, + "load_loss": 0.06140640005469322, + "step": 0 + }, + { + "loss": 5.698018550872803, + "ce_loss": 5.6970062255859375, + "load_loss": 0.10121983289718628, + "step": 0 + }, + { + "loss": 5.732625961303711, + "ce_loss": 5.732214450836182, + "load_loss": 0.04114854708313942, + "step": 0 + }, + { + "loss": 5.666359901428223, + "ce_loss": 5.66531229019165, + "load_loss": 0.10475029051303864, + "step": 0 + }, + { + "loss": 5.705451488494873, + "ce_loss": 5.704887390136719, + "load_loss": 0.0563986599445343, + "step": 0 + }, + { + "loss": 5.732690334320068, + "ce_loss": 5.731888771057129, + "load_loss": 0.08017068356275558, + "step": 0 + }, + { + "loss": 5.743021488189697, + "ce_loss": 5.74224328994751, + "load_loss": 0.07783986628055573, + "step": 0 + }, + { + "loss": 5.723941326141357, + "ce_loss": 5.722815036773682, + "load_loss": 0.11262211203575134, + "step": 0 + }, + { + "loss": 5.708563804626465, + "ce_loss": 5.708098411560059, + "load_loss": 0.046553608030080795, + "step": 0 + }, + { + "loss": 5.66008996963501, + "ce_loss": 5.659422397613525, + "load_loss": 0.06674252450466156, + "step": 0 + }, + { + "loss": 5.751020431518555, + "ce_loss": 5.750646591186523, + "load_loss": 0.0373820923268795, + "step": 0 + }, + { + "loss": 5.746757984161377, + "ce_loss": 5.745999336242676, + "load_loss": 0.07588052749633789, + "step": 0 + }, + { + "loss": 5.738731384277344, + "ce_loss": 5.73820686340332, + "load_loss": 0.05246131122112274, + "step": 0 + }, + { + "loss": 5.716710567474365, + "ce_loss": 5.715806484222412, + "load_loss": 0.09043078124523163, + "step": 0 + }, + { + "loss": 5.673379421234131, + "ce_loss": 5.672630310058594, + "load_loss": 0.07489774376153946, + "step": 1 + }, + { + "loss": 5.48313570022583, + "ce_loss": 5.482280731201172, + "load_loss": 0.08551878482103348, + "step": 1 + }, + { + "loss": 5.512439250946045, + "ce_loss": 5.5118513107299805, + "load_loss": 0.058801762759685516, + "step": 1 + }, + { + "loss": 5.5210771560668945, + "ce_loss": 5.520323753356934, + "load_loss": 0.07532044500112534, + "step": 1 + }, + { + "loss": 5.533121585845947, + "ce_loss": 5.532468795776367, + "load_loss": 0.06528821587562561, + "step": 1 + }, + { + "loss": 5.4879536628723145, + "ce_loss": 5.487229347229004, + "load_loss": 0.0724472627043724, + "step": 1 + }, + { + "loss": 5.465908527374268, + "ce_loss": 5.465108394622803, + "load_loss": 0.08002611249685287, + "step": 1 + }, + { + "loss": 5.519738674163818, + "ce_loss": 5.519254207611084, + "load_loss": 0.04846029728651047, + "step": 1 + }, + { + "loss": 5.498325347900391, + "ce_loss": 5.4970550537109375, + "load_loss": 0.12703019380569458, + "step": 1 + }, + { + "loss": 5.497963905334473, + "ce_loss": 5.497251033782959, + "load_loss": 0.07127395272254944, + "step": 1 + }, + { + "loss": 5.527613162994385, + "ce_loss": 5.527114391326904, + "load_loss": 0.04987343028187752, + "step": 1 + }, + { + "loss": 5.526426315307617, + "ce_loss": 5.5259623527526855, + "load_loss": 0.04640568792819977, + "step": 1 + }, + { + "loss": 5.564351558685303, + "ce_loss": 5.5634379386901855, + "load_loss": 0.09136999398469925, + "step": 1 + }, + { + "loss": 5.523436069488525, + "ce_loss": 5.522709846496582, + "load_loss": 0.07261814922094345, + "step": 1 + }, + { + "loss": 5.510257244110107, + "ce_loss": 5.509274482727051, + "load_loss": 0.09828441590070724, + "step": 1 + }, + { + "loss": 5.521299839019775, + "ce_loss": 5.520488739013672, + "load_loss": 0.08111517131328583, + "step": 1 + }, + { + "loss": 5.508573055267334, + "ce_loss": 5.507687568664551, + "load_loss": 0.08852744102478027, + "step": 1 + }, + { + "loss": 5.509494304656982, + "ce_loss": 5.508915424346924, + "load_loss": 0.05788121372461319, + "step": 1 + }, + { + "loss": 5.517122745513916, + "ce_loss": 5.5166850090026855, + "load_loss": 0.04378621280193329, + "step": 1 + }, + { + "loss": 5.49953031539917, + "ce_loss": 5.498560428619385, + "load_loss": 0.0969727635383606, + "step": 1 + }, + { + "loss": 5.466097831726074, + "ce_loss": 5.465244770050049, + "load_loss": 0.08528949320316315, + "step": 1 + }, + { + "loss": 5.6572651863098145, + "ce_loss": 5.656364440917969, + "load_loss": 0.09008084237575531, + "step": 1 + }, + { + "loss": 5.561635494232178, + "ce_loss": 5.561043739318848, + "load_loss": 0.059169407933950424, + "step": 1 + }, + { + "loss": 5.55869197845459, + "ce_loss": 5.557982444763184, + "load_loss": 0.07094938308000565, + "step": 1 + }, + { + "loss": 5.52331018447876, + "ce_loss": 5.522854804992676, + "load_loss": 0.045528218150138855, + "step": 1 + }, + { + "loss": 5.538680553436279, + "ce_loss": 5.537826061248779, + "load_loss": 0.0854632556438446, + "step": 1 + }, + { + "loss": 5.53391170501709, + "ce_loss": 5.5331315994262695, + "load_loss": 0.07803230732679367, + "step": 1 + }, + { + "loss": 5.505067348480225, + "ce_loss": 5.503977298736572, + "load_loss": 0.10900118947029114, + "step": 1 + }, + { + "loss": 5.532364845275879, + "ce_loss": 5.531580924987793, + "load_loss": 0.07840234041213989, + "step": 1 + }, + { + "loss": 5.515168190002441, + "ce_loss": 5.514620780944824, + "load_loss": 0.05475526675581932, + "step": 1 + }, + { + "loss": 5.525841236114502, + "ce_loss": 5.524870872497559, + "load_loss": 0.09703163802623749, + "step": 1 + }, + { + "loss": 5.552040100097656, + "ce_loss": 5.55143928527832, + "load_loss": 0.060098569840192795, + "step": 1 + }, + { + "loss": 5.6212639808654785, + "ce_loss": 5.620526313781738, + "load_loss": 0.07377901673316956, + "step": 1 + }, + { + "loss": 5.477939128875732, + "ce_loss": 5.477062702178955, + "load_loss": 0.08765476942062378, + "step": 1 + }, + { + "loss": 5.527283191680908, + "ce_loss": 5.526524066925049, + "load_loss": 0.07593557983636856, + "step": 1 + }, + { + "loss": 5.560898303985596, + "ce_loss": 5.559985160827637, + "load_loss": 0.09129436314105988, + "step": 1 + }, + { + "loss": 5.540337085723877, + "ce_loss": 5.539581775665283, + "load_loss": 0.07554591447114944, + "step": 1 + }, + { + "loss": 5.507293224334717, + "ce_loss": 5.506340503692627, + "load_loss": 0.09527671337127686, + "step": 1 + }, + { + "loss": 5.4874162673950195, + "ce_loss": 5.486365795135498, + "load_loss": 0.1050490066409111, + "step": 1 + }, + { + "loss": 5.530200958251953, + "ce_loss": 5.529582500457764, + "load_loss": 0.06185062974691391, + "step": 1 + }, + { + "loss": 5.542208194732666, + "ce_loss": 5.541903495788574, + "load_loss": 0.030451400205492973, + "step": 1 + }, + { + "loss": 5.499722957611084, + "ce_loss": 5.499083995819092, + "load_loss": 0.06389231234788895, + "step": 1 + }, + { + "loss": 5.487544059753418, + "ce_loss": 5.486514568328857, + "load_loss": 0.10296519845724106, + "step": 1 + }, + { + "loss": 5.56644344329834, + "ce_loss": 5.565408706665039, + "load_loss": 0.10345108062028885, + "step": 1 + }, + { + "loss": 5.5415358543396, + "ce_loss": 5.540714740753174, + "load_loss": 0.08209699392318726, + "step": 1 + }, + { + "loss": 5.514513969421387, + "ce_loss": 5.513740062713623, + "load_loss": 0.07737505435943604, + "step": 1 + }, + { + "loss": 5.543450832366943, + "ce_loss": 5.5429487228393555, + "load_loss": 0.05021809786558151, + "step": 1 + }, + { + "loss": 5.522648811340332, + "ce_loss": 5.52229642868042, + "load_loss": 0.03525999188423157, + "step": 1 + }, + { + "loss": 5.527862071990967, + "ce_loss": 5.526886463165283, + "load_loss": 0.0975639596581459, + "step": 1 + }, + { + "loss": 5.500956058502197, + "ce_loss": 5.500197887420654, + "load_loss": 0.07582308351993561, + "step": 1 + }, + { + "loss": 5.554368495941162, + "ce_loss": 5.5539445877075195, + "load_loss": 0.04237929359078407, + "step": 1 + }, + { + "loss": 5.559906005859375, + "ce_loss": 5.559255599975586, + "load_loss": 0.06502397358417511, + "step": 1 + }, + { + "loss": 5.574231147766113, + "ce_loss": 5.573594570159912, + "load_loss": 0.06366157531738281, + "step": 1 + }, + { + "loss": 5.5068559646606445, + "ce_loss": 5.5058722496032715, + "load_loss": 0.09837105870246887, + "step": 1 + }, + { + "loss": 5.505845069885254, + "ce_loss": 5.504973411560059, + "load_loss": 0.0871693566441536, + "step": 1 + }, + { + "loss": 5.591604709625244, + "ce_loss": 5.591125011444092, + "load_loss": 0.04798876494169235, + "step": 1 + }, + { + "loss": 5.52475643157959, + "ce_loss": 5.523838043212891, + "load_loss": 0.09184391051530838, + "step": 1 + }, + { + "loss": 5.563226222991943, + "ce_loss": 5.56292724609375, + "load_loss": 0.02990376204252243, + "step": 1 + }, + { + "loss": 5.549938678741455, + "ce_loss": 5.549421310424805, + "load_loss": 0.05172840878367424, + "step": 1 + }, + { + "loss": 5.492251396179199, + "ce_loss": 5.491492748260498, + "load_loss": 0.07588004320859909, + "step": 1 + }, + { + "loss": 5.46108865737915, + "ce_loss": 5.459971904754639, + "load_loss": 0.11166469752788544, + "step": 1 + }, + { + "loss": 5.506716728210449, + "ce_loss": 5.505953788757324, + "load_loss": 0.0762903019785881, + "step": 1 + }, + { + "loss": 5.60500431060791, + "ce_loss": 5.6044697761535645, + "load_loss": 0.053470902144908905, + "step": 1 + }, + { + "loss": 5.46644401550293, + "ce_loss": 5.464977264404297, + "load_loss": 0.14667385816574097, + "step": 1 + }, + { + "loss": 5.493645191192627, + "ce_loss": 5.492853164672852, + "load_loss": 0.07919555902481079, + "step": 1 + }, + { + "loss": 5.546830654144287, + "ce_loss": 5.545833110809326, + "load_loss": 0.09976409375667572, + "step": 1 + }, + { + "loss": 5.519857406616211, + "ce_loss": 5.518960475921631, + "load_loss": 0.0896739512681961, + "step": 1 + }, + { + "loss": 5.545159816741943, + "ce_loss": 5.544742584228516, + "load_loss": 0.04174405336380005, + "step": 1 + }, + { + "loss": 5.544160842895508, + "ce_loss": 5.54362154006958, + "load_loss": 0.05393189564347267, + "step": 1 + }, + { + "loss": 5.500524044036865, + "ce_loss": 5.49978494644165, + "load_loss": 0.07391496002674103, + "step": 1 + }, + { + "loss": 5.489800453186035, + "ce_loss": 5.489029407501221, + "load_loss": 0.07710696756839752, + "step": 1 + }, + { + "loss": 5.494702339172363, + "ce_loss": 5.494016170501709, + "load_loss": 0.06861186772584915, + "step": 1 + }, + { + "loss": 5.520761489868164, + "ce_loss": 5.519794464111328, + "load_loss": 0.09671953320503235, + "step": 1 + }, + { + "loss": 5.573816776275635, + "ce_loss": 5.573301792144775, + "load_loss": 0.05152113363146782, + "step": 1 + }, + { + "loss": 5.630615234375, + "ce_loss": 5.629541397094727, + "load_loss": 0.10739944130182266, + "step": 1 + }, + { + "loss": 5.543285369873047, + "ce_loss": 5.542623996734619, + "load_loss": 0.06611446291208267, + "step": 1 + }, + { + "loss": 5.5425896644592285, + "ce_loss": 5.542087554931641, + "load_loss": 0.05023341625928879, + "step": 1 + }, + { + "loss": 5.535411834716797, + "ce_loss": 5.534487247467041, + "load_loss": 0.09243655204772949, + "step": 1 + }, + { + "loss": 5.530694484710693, + "ce_loss": 5.529472827911377, + "load_loss": 0.12218042463064194, + "step": 1 + }, + { + "loss": 5.55825662612915, + "ce_loss": 5.557408332824707, + "load_loss": 0.08484093844890594, + "step": 1 + }, + { + "loss": 5.5372138023376465, + "ce_loss": 5.536549091339111, + "load_loss": 0.06645961105823517, + "step": 1 + }, + { + "loss": 5.492568492889404, + "ce_loss": 5.491556167602539, + "load_loss": 0.10124711692333221, + "step": 1 + }, + { + "loss": 5.533909320831299, + "ce_loss": 5.533122539520264, + "load_loss": 0.0786881297826767, + "step": 1 + }, + { + "loss": 5.587963104248047, + "ce_loss": 5.587594509124756, + "load_loss": 0.03685072809457779, + "step": 1 + }, + { + "loss": 5.548852920532227, + "ce_loss": 5.548318862915039, + "load_loss": 0.0534091480076313, + "step": 1 + }, + { + "loss": 5.541507244110107, + "ce_loss": 5.540977478027344, + "load_loss": 0.05299219861626625, + "step": 1 + }, + { + "loss": 5.511085510253906, + "ce_loss": 5.510141372680664, + "load_loss": 0.09440067410469055, + "step": 1 + }, + { + "loss": 5.483974933624268, + "ce_loss": 5.483067989349365, + "load_loss": 0.09067300707101822, + "step": 1 + }, + { + "loss": 5.528117656707764, + "ce_loss": 5.527292251586914, + "load_loss": 0.08254170417785645, + "step": 1 + }, + { + "loss": 5.562511444091797, + "ce_loss": 5.561832427978516, + "load_loss": 0.06790051609277725, + "step": 1 + }, + { + "loss": 5.509886741638184, + "ce_loss": 5.509017467498779, + "load_loss": 0.08692042529582977, + "step": 1 + }, + { + "loss": 5.548254489898682, + "ce_loss": 5.5474443435668945, + "load_loss": 0.08099788427352905, + "step": 1 + }, + { + "loss": 5.605651378631592, + "ce_loss": 5.604710102081299, + "load_loss": 0.0941062718629837, + "step": 1 + }, + { + "loss": 5.583693027496338, + "ce_loss": 5.58294153213501, + "load_loss": 0.07516247779130936, + "step": 1 + }, + { + "loss": 5.606704235076904, + "ce_loss": 5.606049060821533, + "load_loss": 0.06551273167133331, + "step": 1 + }, + { + "loss": 5.526449203491211, + "ce_loss": 5.525969505310059, + "load_loss": 0.04794711992144585, + "step": 1 + }, + { + "loss": 5.533439636230469, + "ce_loss": 5.5327887535095215, + "load_loss": 0.06510917842388153, + "step": 1 + }, + { + "loss": 5.509059906005859, + "ce_loss": 5.508255481719971, + "load_loss": 0.08044832944869995, + "step": 1 + }, + { + "loss": 5.489537715911865, + "ce_loss": 5.488663196563721, + "load_loss": 0.08747236430644989, + "step": 1 + }, + { + "loss": 5.5333757400512695, + "ce_loss": 5.5329461097717285, + "load_loss": 0.04295087233185768, + "step": 1 + }, + { + "loss": 5.564270973205566, + "ce_loss": 5.563500881195068, + "load_loss": 0.07699016481637955, + "step": 1 + }, + { + "loss": 5.483701229095459, + "ce_loss": 5.482613563537598, + "load_loss": 0.10874363780021667, + "step": 1 + }, + { + "loss": 5.490377426147461, + "ce_loss": 5.489251136779785, + "load_loss": 0.11264079064130783, + "step": 1 + }, + { + "loss": 5.597060680389404, + "ce_loss": 5.596401214599609, + "load_loss": 0.06592489033937454, + "step": 1 + }, + { + "loss": 5.511696815490723, + "ce_loss": 5.510860443115234, + "load_loss": 0.08363939076662064, + "step": 1 + }, + { + "loss": 5.596091270446777, + "ce_loss": 5.5949506759643555, + "load_loss": 0.11404196172952652, + "step": 1 + }, + { + "loss": 5.522383213043213, + "ce_loss": 5.52177095413208, + "load_loss": 0.06120917201042175, + "step": 1 + }, + { + "loss": 5.618241786956787, + "ce_loss": 5.617502689361572, + "load_loss": 0.07389054447412491, + "step": 1 + }, + { + "loss": 5.503175735473633, + "ce_loss": 5.502262115478516, + "load_loss": 0.09137717634439468, + "step": 1 + }, + { + "loss": 5.5171589851379395, + "ce_loss": 5.516239166259766, + "load_loss": 0.0919913649559021, + "step": 1 + }, + { + "loss": 5.541401386260986, + "ce_loss": 5.540619850158691, + "load_loss": 0.0781601220369339, + "step": 1 + }, + { + "loss": 5.5128936767578125, + "ce_loss": 5.511927127838135, + "load_loss": 0.09663814306259155, + "step": 1 + }, + { + "loss": 5.490386486053467, + "ce_loss": 5.489527225494385, + "load_loss": 0.08591562509536743, + "step": 1 + }, + { + "loss": 5.503547191619873, + "ce_loss": 5.502521514892578, + "load_loss": 0.10256212204694748, + "step": 1 + }, + { + "loss": 5.659358501434326, + "ce_loss": 5.658554553985596, + "load_loss": 0.08039136976003647, + "step": 1 + }, + { + "loss": 5.4799485206604, + "ce_loss": 5.4789276123046875, + "load_loss": 0.10209251195192337, + "step": 1 + }, + { + "loss": 5.524848461151123, + "ce_loss": 5.524204254150391, + "load_loss": 0.06440308690071106, + "step": 1 + }, + { + "loss": 5.527563571929932, + "ce_loss": 5.527145862579346, + "load_loss": 0.04179193079471588, + "step": 1 + }, + { + "loss": 5.527397632598877, + "ce_loss": 5.526625633239746, + "load_loss": 0.07717686891555786, + "step": 1 + }, + { + "loss": 5.499438285827637, + "ce_loss": 5.498791694641113, + "load_loss": 0.06467260420322418, + "step": 1 + }, + { + "loss": 5.526208877563477, + "ce_loss": 5.52552604675293, + "load_loss": 0.06829783320426941, + "step": 1 + }, + { + "loss": 5.50149393081665, + "ce_loss": 5.500916957855225, + "load_loss": 0.05768255144357681, + "step": 1 + }, + { + "loss": 5.517845630645752, + "ce_loss": 5.516928195953369, + "load_loss": 0.09173476696014404, + "step": 1 + }, + { + "loss": 5.506264686584473, + "ce_loss": 5.505121231079102, + "load_loss": 0.1143224760890007, + "step": 1 + }, + { + "loss": 5.510690212249756, + "ce_loss": 5.50990104675293, + "load_loss": 0.07893610000610352, + "step": 1 + }, + { + "loss": 5.520713806152344, + "ce_loss": 5.519953727722168, + "load_loss": 0.07599541544914246, + "step": 2 + }, + { + "loss": 5.285400867462158, + "ce_loss": 5.284564971923828, + "load_loss": 0.08360061049461365, + "step": 2 + }, + { + "loss": 5.318922996520996, + "ce_loss": 5.3175458908081055, + "load_loss": 0.13770627975463867, + "step": 2 + }, + { + "loss": 5.316718101501465, + "ce_loss": 5.31565523147583, + "load_loss": 0.10629364103078842, + "step": 2 + }, + { + "loss": 5.394433498382568, + "ce_loss": 5.393900394439697, + "load_loss": 0.05329808592796326, + "step": 2 + }, + { + "loss": 5.337387561798096, + "ce_loss": 5.336475849151611, + "load_loss": 0.09118185937404633, + "step": 2 + }, + { + "loss": 5.402957916259766, + "ce_loss": 5.4025397300720215, + "load_loss": 0.04179815202951431, + "step": 2 + }, + { + "loss": 5.375954627990723, + "ce_loss": 5.375035285949707, + "load_loss": 0.09193965792655945, + "step": 2 + }, + { + "loss": 5.303027153015137, + "ce_loss": 5.301855564117432, + "load_loss": 0.11716455221176147, + "step": 2 + }, + { + "loss": 5.323362827301025, + "ce_loss": 5.322753429412842, + "load_loss": 0.06091668829321861, + "step": 2 + }, + { + "loss": 5.353307247161865, + "ce_loss": 5.352133750915527, + "load_loss": 0.11734358966350555, + "step": 2 + }, + { + "loss": 5.4313178062438965, + "ce_loss": 5.430115222930908, + "load_loss": 0.12023639678955078, + "step": 2 + }, + { + "loss": 5.341640949249268, + "ce_loss": 5.3408942222595215, + "load_loss": 0.07467754185199738, + "step": 2 + }, + { + "loss": 5.360178470611572, + "ce_loss": 5.359657287597656, + "load_loss": 0.0521065890789032, + "step": 2 + }, + { + "loss": 5.334360599517822, + "ce_loss": 5.333957195281982, + "load_loss": 0.04034576192498207, + "step": 2 + }, + { + "loss": 5.408840179443359, + "ce_loss": 5.40809965133667, + "load_loss": 0.07405857741832733, + "step": 2 + }, + { + "loss": 5.4093146324157715, + "ce_loss": 5.408435821533203, + "load_loss": 0.08789555728435516, + "step": 2 + }, + { + "loss": 5.398310661315918, + "ce_loss": 5.397338390350342, + "load_loss": 0.09722311794757843, + "step": 2 + }, + { + "loss": 5.306783676147461, + "ce_loss": 5.305963039398193, + "load_loss": 0.08204672485589981, + "step": 2 + }, + { + "loss": 5.411231517791748, + "ce_loss": 5.410456657409668, + "load_loss": 0.07747797667980194, + "step": 2 + }, + { + "loss": 5.361852169036865, + "ce_loss": 5.360986709594727, + "load_loss": 0.08656571060419083, + "step": 2 + }, + { + "loss": 5.2985711097717285, + "ce_loss": 5.297416687011719, + "load_loss": 0.11542781442403793, + "step": 2 + }, + { + "loss": 5.459392547607422, + "ce_loss": 5.458520412445068, + "load_loss": 0.08719377219676971, + "step": 2 + }, + { + "loss": 5.380703449249268, + "ce_loss": 5.37991189956665, + "load_loss": 0.07915535569190979, + "step": 2 + }, + { + "loss": 5.393849849700928, + "ce_loss": 5.3930840492248535, + "load_loss": 0.07658374309539795, + "step": 2 + }, + { + "loss": 5.3218488693237305, + "ce_loss": 5.320769309997559, + "load_loss": 0.1079355925321579, + "step": 2 + }, + { + "loss": 5.292452812194824, + "ce_loss": 5.2914299964904785, + "load_loss": 0.10227777063846588, + "step": 2 + }, + { + "loss": 5.295072555541992, + "ce_loss": 5.293803691864014, + "load_loss": 0.12690332531929016, + "step": 2 + }, + { + "loss": 5.384504795074463, + "ce_loss": 5.383327007293701, + "load_loss": 0.11779644340276718, + "step": 2 + }, + { + "loss": 5.307857990264893, + "ce_loss": 5.306832313537598, + "load_loss": 0.10259036719799042, + "step": 2 + }, + { + "loss": 5.378410816192627, + "ce_loss": 5.377630233764648, + "load_loss": 0.07806151360273361, + "step": 2 + }, + { + "loss": 5.401968002319336, + "ce_loss": 5.401004791259766, + "load_loss": 0.09632842242717743, + "step": 2 + }, + { + "loss": 5.368804931640625, + "ce_loss": 5.36810827255249, + "load_loss": 0.06965305656194687, + "step": 2 + }, + { + "loss": 5.329218864440918, + "ce_loss": 5.328744411468506, + "load_loss": 0.04745069891214371, + "step": 2 + }, + { + "loss": 5.306212902069092, + "ce_loss": 5.305108070373535, + "load_loss": 0.11048278212547302, + "step": 2 + }, + { + "loss": 5.321471691131592, + "ce_loss": 5.320685863494873, + "load_loss": 0.0785675048828125, + "step": 2 + }, + { + "loss": 5.544010162353516, + "ce_loss": 5.542876720428467, + "load_loss": 0.11332054436206818, + "step": 2 + }, + { + "loss": 5.370018482208252, + "ce_loss": 5.3693928718566895, + "load_loss": 0.06255097687244415, + "step": 2 + }, + { + "loss": 5.4162492752075195, + "ce_loss": 5.415427207946777, + "load_loss": 0.08221236616373062, + "step": 2 + }, + { + "loss": 5.350608825683594, + "ce_loss": 5.3501200675964355, + "load_loss": 0.048868145793676376, + "step": 2 + }, + { + "loss": 5.301860809326172, + "ce_loss": 5.30042839050293, + "load_loss": 0.14325159788131714, + "step": 2 + }, + { + "loss": 5.372697830200195, + "ce_loss": 5.371368408203125, + "load_loss": 0.13296277821063995, + "step": 2 + }, + { + "loss": 5.30839729309082, + "ce_loss": 5.307399749755859, + "load_loss": 0.09974589943885803, + "step": 2 + }, + { + "loss": 5.321526527404785, + "ce_loss": 5.320805072784424, + "load_loss": 0.07214854657649994, + "step": 2 + }, + { + "loss": 5.316849231719971, + "ce_loss": 5.315724849700928, + "load_loss": 0.112429678440094, + "step": 2 + }, + { + "loss": 5.340661525726318, + "ce_loss": 5.3393988609313965, + "load_loss": 0.12625612318515778, + "step": 2 + }, + { + "loss": 5.323927402496338, + "ce_loss": 5.322925567626953, + "load_loss": 0.1001867949962616, + "step": 2 + }, + { + "loss": 5.338357448577881, + "ce_loss": 5.337642192840576, + "load_loss": 0.07152910530567169, + "step": 2 + }, + { + "loss": 5.367527484893799, + "ce_loss": 5.36683988571167, + "load_loss": 0.06876073777675629, + "step": 2 + }, + { + "loss": 5.402642250061035, + "ce_loss": 5.401899337768555, + "load_loss": 0.07430223375558853, + "step": 2 + }, + { + "loss": 5.39479923248291, + "ce_loss": 5.394072532653809, + "load_loss": 0.07265740633010864, + "step": 2 + }, + { + "loss": 5.350793838500977, + "ce_loss": 5.3498358726501465, + "load_loss": 0.0957937091588974, + "step": 2 + }, + { + "loss": 5.550811767578125, + "ce_loss": 5.5496110916137695, + "load_loss": 0.12007267773151398, + "step": 2 + }, + { + "loss": 5.347704887390137, + "ce_loss": 5.3473663330078125, + "load_loss": 0.033872224390506744, + "step": 2 + }, + { + "loss": 5.311154842376709, + "ce_loss": 5.310262203216553, + "load_loss": 0.08925363421440125, + "step": 2 + }, + { + "loss": 5.383706092834473, + "ce_loss": 5.383091926574707, + "load_loss": 0.06141023337841034, + "step": 2 + }, + { + "loss": 5.326407432556152, + "ce_loss": 5.325632572174072, + "load_loss": 0.07750237733125687, + "step": 2 + }, + { + "loss": 5.387877464294434, + "ce_loss": 5.387033939361572, + "load_loss": 0.08435840159654617, + "step": 2 + }, + { + "loss": 5.349466800689697, + "ce_loss": 5.3488874435424805, + "load_loss": 0.057922378182411194, + "step": 2 + }, + { + "loss": 5.365749359130859, + "ce_loss": 5.365141868591309, + "load_loss": 0.060739077627658844, + "step": 2 + }, + { + "loss": 5.341970443725586, + "ce_loss": 5.340991020202637, + "load_loss": 0.09793113172054291, + "step": 2 + }, + { + "loss": 5.292368412017822, + "ce_loss": 5.2913818359375, + "load_loss": 0.09863961488008499, + "step": 2 + }, + { + "loss": 5.302265644073486, + "ce_loss": 5.300985813140869, + "load_loss": 0.12800100445747375, + "step": 2 + }, + { + "loss": 5.3327131271362305, + "ce_loss": 5.331390380859375, + "load_loss": 0.1322825402021408, + "step": 2 + }, + { + "loss": 5.303983688354492, + "ce_loss": 5.3032355308532715, + "load_loss": 0.0748048797249794, + "step": 2 + }, + { + "loss": 5.4129743576049805, + "ce_loss": 5.41189432144165, + "load_loss": 0.10798536986112595, + "step": 2 + }, + { + "loss": 5.306609153747559, + "ce_loss": 5.305609226226807, + "load_loss": 0.09997232258319855, + "step": 2 + }, + { + "loss": 5.427919864654541, + "ce_loss": 5.427144527435303, + "load_loss": 0.07751913368701935, + "step": 2 + }, + { + "loss": 5.386650562286377, + "ce_loss": 5.385462284088135, + "load_loss": 0.11884815990924835, + "step": 2 + }, + { + "loss": 5.355135917663574, + "ce_loss": 5.354583263397217, + "load_loss": 0.05528567358851433, + "step": 2 + }, + { + "loss": 5.342507362365723, + "ce_loss": 5.341914176940918, + "load_loss": 0.059307754039764404, + "step": 2 + }, + { + "loss": 5.3114728927612305, + "ce_loss": 5.310337066650391, + "load_loss": 0.11359484493732452, + "step": 2 + }, + { + "loss": 5.293288707733154, + "ce_loss": 5.2923264503479, + "load_loss": 0.0962216705083847, + "step": 2 + }, + { + "loss": 5.422966480255127, + "ce_loss": 5.42241096496582, + "load_loss": 0.055571459233760834, + "step": 2 + }, + { + "loss": 5.357258319854736, + "ce_loss": 5.3557257652282715, + "load_loss": 0.15323786437511444, + "step": 2 + }, + { + "loss": 5.4190449714660645, + "ce_loss": 5.41812801361084, + "load_loss": 0.09171178936958313, + "step": 2 + }, + { + "loss": 5.298023223876953, + "ce_loss": 5.297276496887207, + "load_loss": 0.07467228174209595, + "step": 2 + }, + { + "loss": 5.405617713928223, + "ce_loss": 5.404499530792236, + "load_loss": 0.11183034628629684, + "step": 2 + }, + { + "loss": 5.337530136108398, + "ce_loss": 5.336732864379883, + "load_loss": 0.0797063410282135, + "step": 2 + }, + { + "loss": 5.315585613250732, + "ce_loss": 5.314721584320068, + "load_loss": 0.08639049530029297, + "step": 2 + }, + { + "loss": 5.384786128997803, + "ce_loss": 5.384128570556641, + "load_loss": 0.06574442982673645, + "step": 2 + }, + { + "loss": 5.3660430908203125, + "ce_loss": 5.365492820739746, + "load_loss": 0.05503387376666069, + "step": 2 + }, + { + "loss": 5.348938465118408, + "ce_loss": 5.348080635070801, + "load_loss": 0.0857677087187767, + "step": 2 + }, + { + "loss": 5.350103378295898, + "ce_loss": 5.349146366119385, + "load_loss": 0.0957123190164566, + "step": 2 + }, + { + "loss": 5.590724468231201, + "ce_loss": 5.589959144592285, + "load_loss": 0.07653778791427612, + "step": 2 + }, + { + "loss": 5.325222015380859, + "ce_loss": 5.324296951293945, + "load_loss": 0.09249064326286316, + "step": 2 + }, + { + "loss": 5.302094459533691, + "ce_loss": 5.301046371459961, + "load_loss": 0.10479097813367844, + "step": 2 + }, + { + "loss": 5.426806926727295, + "ce_loss": 5.4261274337768555, + "load_loss": 0.06793592870235443, + "step": 2 + }, + { + "loss": 5.322082996368408, + "ce_loss": 5.321176052093506, + "load_loss": 0.09071272611618042, + "step": 2 + }, + { + "loss": 5.374181270599365, + "ce_loss": 5.373734474182129, + "load_loss": 0.04469623044133186, + "step": 2 + }, + { + "loss": 5.319766998291016, + "ce_loss": 5.319177627563477, + "load_loss": 0.05891473963856697, + "step": 2 + }, + { + "loss": 5.364841461181641, + "ce_loss": 5.364147186279297, + "load_loss": 0.0694141760468483, + "step": 2 + }, + { + "loss": 5.370384216308594, + "ce_loss": 5.369755744934082, + "load_loss": 0.06285926699638367, + "step": 2 + }, + { + "loss": 5.438268661499023, + "ce_loss": 5.43757438659668, + "load_loss": 0.06942231953144073, + "step": 2 + }, + { + "loss": 5.38671350479126, + "ce_loss": 5.385992050170898, + "load_loss": 0.07212316989898682, + "step": 2 + }, + { + "loss": 5.364638328552246, + "ce_loss": 5.363935470581055, + "load_loss": 0.07027393579483032, + "step": 2 + }, + { + "loss": 5.277721405029297, + "ce_loss": 5.276371002197266, + "load_loss": 0.135047048330307, + "step": 2 + }, + { + "loss": 5.468009948730469, + "ce_loss": 5.467443466186523, + "load_loss": 0.05665811896324158, + "step": 2 + }, + { + "loss": 5.279819011688232, + "ce_loss": 5.278937339782715, + "load_loss": 0.0881664976477623, + "step": 2 + }, + { + "loss": 5.342848300933838, + "ce_loss": 5.34192419052124, + "load_loss": 0.09239106625318527, + "step": 2 + }, + { + "loss": 5.319812297821045, + "ce_loss": 5.319029331207275, + "load_loss": 0.07828506827354431, + "step": 2 + }, + { + "loss": 5.3164849281311035, + "ce_loss": 5.3152875900268555, + "load_loss": 0.11975578218698502, + "step": 2 + }, + { + "loss": 5.325706481933594, + "ce_loss": 5.3250732421875, + "load_loss": 0.06330254673957825, + "step": 2 + }, + { + "loss": 5.357410907745361, + "ce_loss": 5.356308937072754, + "load_loss": 0.11020752787590027, + "step": 2 + }, + { + "loss": 5.327867031097412, + "ce_loss": 5.327209949493408, + "load_loss": 0.06572479754686356, + "step": 2 + }, + { + "loss": 5.285209655761719, + "ce_loss": 5.284108638763428, + "load_loss": 0.11008115112781525, + "step": 2 + }, + { + "loss": 5.350188732147217, + "ce_loss": 5.349318504333496, + "load_loss": 0.08704344928264618, + "step": 2 + }, + { + "loss": 5.348325729370117, + "ce_loss": 5.347412109375, + "load_loss": 0.09135180711746216, + "step": 2 + }, + { + "loss": 5.4786906242370605, + "ce_loss": 5.477850914001465, + "load_loss": 0.08396873623132706, + "step": 2 + }, + { + "loss": 5.322304725646973, + "ce_loss": 5.321200847625732, + "load_loss": 0.11036837100982666, + "step": 2 + }, + { + "loss": 5.313679218292236, + "ce_loss": 5.312912940979004, + "load_loss": 0.07662396132946014, + "step": 2 + }, + { + "loss": 5.331940650939941, + "ce_loss": 5.331076622009277, + "load_loss": 0.08638811111450195, + "step": 2 + }, + { + "loss": 5.378920078277588, + "ce_loss": 5.378435134887695, + "load_loss": 0.04847991466522217, + "step": 2 + }, + { + "loss": 5.304769039154053, + "ce_loss": 5.303901195526123, + "load_loss": 0.08677682280540466, + "step": 2 + }, + { + "loss": 5.360819339752197, + "ce_loss": 5.360217571258545, + "load_loss": 0.06016559526324272, + "step": 2 + }, + { + "loss": 5.338390827178955, + "ce_loss": 5.3372015953063965, + "load_loss": 0.11891470104455948, + "step": 2 + }, + { + "loss": 5.366626739501953, + "ce_loss": 5.366143703460693, + "load_loss": 0.048284608870744705, + "step": 2 + }, + { + "loss": 5.331643104553223, + "ce_loss": 5.330733776092529, + "load_loss": 0.09092623740434647, + "step": 2 + }, + { + "loss": 5.321435451507568, + "ce_loss": 5.320710182189941, + "load_loss": 0.07254204154014587, + "step": 2 + }, + { + "loss": 5.327141761779785, + "ce_loss": 5.326182842254639, + "load_loss": 0.09587268531322479, + "step": 2 + }, + { + "loss": 5.341834545135498, + "ce_loss": 5.340916633605957, + "load_loss": 0.091767318546772, + "step": 2 + }, + { + "loss": 5.382009029388428, + "ce_loss": 5.381232261657715, + "load_loss": 0.07769482582807541, + "step": 2 + }, + { + "loss": 5.352447986602783, + "ce_loss": 5.3512349128723145, + "load_loss": 0.12132066488265991, + "step": 2 + }, + { + "loss": 5.248870372772217, + "ce_loss": 5.247734069824219, + "load_loss": 0.1136106550693512, + "step": 2 + }, + { + "loss": 5.316664695739746, + "ce_loss": 5.315652370452881, + "load_loss": 0.10124089568853378, + "step": 2 + }, + { + "loss": 5.366480350494385, + "ce_loss": 5.365838050842285, + "load_loss": 0.06424033641815186, + "step": 3 + }, + { + "loss": 5.451786041259766, + "ce_loss": 5.450634479522705, + "load_loss": 0.11517983675003052, + "step": 3 + }, + { + "loss": 5.186261177062988, + "ce_loss": 5.185348033905029, + "load_loss": 0.09130154550075531, + "step": 3 + }, + { + "loss": 5.261318683624268, + "ce_loss": 5.259909152984619, + "load_loss": 0.14093562960624695, + "step": 3 + }, + { + "loss": 5.25942325592041, + "ce_loss": 5.25849723815918, + "load_loss": 0.09261126816272736, + "step": 3 + }, + { + "loss": 5.202247619628906, + "ce_loss": 5.200950622558594, + "load_loss": 0.12970471382141113, + "step": 3 + }, + { + "loss": 5.185050964355469, + "ce_loss": 5.1843791007995605, + "load_loss": 0.0671781450510025, + "step": 3 + }, + { + "loss": 5.277399063110352, + "ce_loss": 5.276408672332764, + "load_loss": 0.09902448952198029, + "step": 3 + }, + { + "loss": 5.317290306091309, + "ce_loss": 5.316318988800049, + "load_loss": 0.0971360057592392, + "step": 3 + }, + { + "loss": 5.20380163192749, + "ce_loss": 5.202595233917236, + "load_loss": 0.12065860629081726, + "step": 3 + }, + { + "loss": 5.27182149887085, + "ce_loss": 5.270961284637451, + "load_loss": 0.08600179851055145, + "step": 3 + }, + { + "loss": 5.211792469024658, + "ce_loss": 5.210910797119141, + "load_loss": 0.08817176520824432, + "step": 3 + }, + { + "loss": 5.18540620803833, + "ce_loss": 5.184267044067383, + "load_loss": 0.11392562836408615, + "step": 3 + }, + { + "loss": 5.193941593170166, + "ce_loss": 5.192541599273682, + "load_loss": 0.13998442888259888, + "step": 3 + }, + { + "loss": 5.1156535148620605, + "ce_loss": 5.11463737487793, + "load_loss": 0.10161237418651581, + "step": 3 + }, + { + "loss": 5.240695476531982, + "ce_loss": 5.23969030380249, + "load_loss": 0.1005338504910469, + "step": 3 + }, + { + "loss": 5.459580421447754, + "ce_loss": 5.45846700668335, + "load_loss": 0.11133439838886261, + "step": 3 + }, + { + "loss": 5.1615800857543945, + "ce_loss": 5.160705089569092, + "load_loss": 0.0875159353017807, + "step": 3 + }, + { + "loss": 5.126975059509277, + "ce_loss": 5.1252360343933105, + "load_loss": 0.17390501499176025, + "step": 3 + }, + { + "loss": 5.10294246673584, + "ce_loss": 5.101553916931152, + "load_loss": 0.13885515928268433, + "step": 3 + }, + { + "loss": 5.107306957244873, + "ce_loss": 5.105893611907959, + "load_loss": 0.1413300782442093, + "step": 3 + }, + { + "loss": 5.279711723327637, + "ce_loss": 5.278626918792725, + "load_loss": 0.10847701132297516, + "step": 3 + }, + { + "loss": 5.118396759033203, + "ce_loss": 5.117003917694092, + "load_loss": 0.1392802596092224, + "step": 3 + }, + { + "loss": 5.152900695800781, + "ce_loss": 5.1517157554626465, + "load_loss": 0.11850348860025406, + "step": 3 + }, + { + "loss": 5.097411632537842, + "ce_loss": 5.096042156219482, + "load_loss": 0.13694177567958832, + "step": 3 + }, + { + "loss": 5.244536399841309, + "ce_loss": 5.242846965789795, + "load_loss": 0.16893413662910461, + "step": 3 + }, + { + "loss": 5.185676574707031, + "ce_loss": 5.184523105621338, + "load_loss": 0.115359827876091, + "step": 3 + }, + { + "loss": 5.113781929016113, + "ce_loss": 5.1126389503479, + "load_loss": 0.1142812967300415, + "step": 3 + }, + { + "loss": 5.094011306762695, + "ce_loss": 5.093057632446289, + "load_loss": 0.09535856544971466, + "step": 3 + }, + { + "loss": 5.194404125213623, + "ce_loss": 5.193044185638428, + "load_loss": 0.13597384095191956, + "step": 3 + }, + { + "loss": 5.105125904083252, + "ce_loss": 5.104041576385498, + "load_loss": 0.10842099785804749, + "step": 3 + }, + { + "loss": 5.26706075668335, + "ce_loss": 5.265887260437012, + "load_loss": 0.11736416816711426, + "step": 3 + }, + { + "loss": 5.126828670501709, + "ce_loss": 5.1255950927734375, + "load_loss": 0.12333650141954422, + "step": 3 + }, + { + "loss": 5.125635623931885, + "ce_loss": 5.124752521514893, + "load_loss": 0.08830005675554276, + "step": 3 + }, + { + "loss": 5.320208549499512, + "ce_loss": 5.31945276260376, + "load_loss": 0.0755760669708252, + "step": 3 + }, + { + "loss": 5.201677322387695, + "ce_loss": 5.200661659240723, + "load_loss": 0.10158125311136246, + "step": 3 + }, + { + "loss": 5.1885504722595215, + "ce_loss": 5.187704086303711, + "load_loss": 0.0846274346113205, + "step": 3 + }, + { + "loss": 5.282595634460449, + "ce_loss": 5.28176212310791, + "load_loss": 0.08334305882453918, + "step": 3 + }, + { + "loss": 5.162280082702637, + "ce_loss": 5.161004066467285, + "load_loss": 0.1275855004787445, + "step": 3 + }, + { + "loss": 5.224671840667725, + "ce_loss": 5.223367214202881, + "load_loss": 0.13046346604824066, + "step": 3 + }, + { + "loss": 5.230123996734619, + "ce_loss": 5.22920560836792, + "load_loss": 0.0918276309967041, + "step": 3 + }, + { + "loss": 5.2469096183776855, + "ce_loss": 5.245858669281006, + "load_loss": 0.10511697083711624, + "step": 3 + }, + { + "loss": 5.283612251281738, + "ce_loss": 5.282408714294434, + "load_loss": 0.12036804854869843, + "step": 3 + }, + { + "loss": 5.317785263061523, + "ce_loss": 5.3168535232543945, + "load_loss": 0.0931699275970459, + "step": 3 + }, + { + "loss": 5.48847770690918, + "ce_loss": 5.486970901489258, + "load_loss": 0.15067246556282043, + "step": 3 + }, + { + "loss": 5.253434181213379, + "ce_loss": 5.252256393432617, + "load_loss": 0.11777250468730927, + "step": 3 + }, + { + "loss": 5.152308940887451, + "ce_loss": 5.151449680328369, + "load_loss": 0.08592712134122849, + "step": 3 + }, + { + "loss": 5.150986194610596, + "ce_loss": 5.149564743041992, + "load_loss": 0.1421242505311966, + "step": 3 + }, + { + "loss": 5.29911470413208, + "ce_loss": 5.297784328460693, + "load_loss": 0.13302405178546906, + "step": 3 + }, + { + "loss": 5.139804840087891, + "ce_loss": 5.138701438903809, + "load_loss": 0.11034683138132095, + "step": 3 + }, + { + "loss": 5.1965413093566895, + "ce_loss": 5.1957478523254395, + "load_loss": 0.07933869957923889, + "step": 3 + }, + { + "loss": 5.278923988342285, + "ce_loss": 5.278161525726318, + "load_loss": 0.07625678926706314, + "step": 3 + }, + { + "loss": 5.24303674697876, + "ce_loss": 5.242001056671143, + "load_loss": 0.10355687141418457, + "step": 3 + }, + { + "loss": 5.233099937438965, + "ce_loss": 5.2321858406066895, + "load_loss": 0.09142743796110153, + "step": 3 + }, + { + "loss": 5.319681644439697, + "ce_loss": 5.318516731262207, + "load_loss": 0.11646994948387146, + "step": 3 + }, + { + "loss": 5.088719844818115, + "ce_loss": 5.087283134460449, + "load_loss": 0.14366184175014496, + "step": 3 + }, + { + "loss": 5.224547386169434, + "ce_loss": 5.223245620727539, + "load_loss": 0.1301647424697876, + "step": 3 + }, + { + "loss": 5.203068733215332, + "ce_loss": 5.2023420333862305, + "load_loss": 0.07268708944320679, + "step": 3 + }, + { + "loss": 5.383535861968994, + "ce_loss": 5.382448673248291, + "load_loss": 0.1087077409029007, + "step": 3 + }, + { + "loss": 5.161837577819824, + "ce_loss": 5.161148548126221, + "load_loss": 0.0689058005809784, + "step": 3 + }, + { + "loss": 5.1439008712768555, + "ce_loss": 5.14280891418457, + "load_loss": 0.1091754361987114, + "step": 3 + }, + { + "loss": 5.228513240814209, + "ce_loss": 5.226799011230469, + "load_loss": 0.17140233516693115, + "step": 3 + }, + { + "loss": 5.077149868011475, + "ce_loss": 5.075962066650391, + "load_loss": 0.11879836767911911, + "step": 3 + }, + { + "loss": 5.222142696380615, + "ce_loss": 5.221027374267578, + "load_loss": 0.11154215782880783, + "step": 3 + }, + { + "loss": 5.10561990737915, + "ce_loss": 5.104797840118408, + "load_loss": 0.08220469951629639, + "step": 3 + }, + { + "loss": 5.20397424697876, + "ce_loss": 5.203255653381348, + "load_loss": 0.07186707109212875, + "step": 3 + }, + { + "loss": 5.394243240356445, + "ce_loss": 5.3930463790893555, + "load_loss": 0.11968348920345306, + "step": 3 + }, + { + "loss": 5.450029373168945, + "ce_loss": 5.449063301086426, + "load_loss": 0.09660607576370239, + "step": 3 + }, + { + "loss": 5.277613162994385, + "ce_loss": 5.276667594909668, + "load_loss": 0.09456871449947357, + "step": 3 + }, + { + "loss": 5.158787250518799, + "ce_loss": 5.157497882843018, + "load_loss": 0.12895506620407104, + "step": 3 + }, + { + "loss": 5.178194046020508, + "ce_loss": 5.176967144012451, + "load_loss": 0.12267014384269714, + "step": 3 + }, + { + "loss": 5.177774429321289, + "ce_loss": 5.176793098449707, + "load_loss": 0.09812787920236588, + "step": 3 + }, + { + "loss": 5.156642913818359, + "ce_loss": 5.155407905578613, + "load_loss": 0.12352272123098373, + "step": 3 + }, + { + "loss": 5.230657577514648, + "ce_loss": 5.229443073272705, + "load_loss": 0.12145661562681198, + "step": 3 + }, + { + "loss": 5.156344413757324, + "ce_loss": 5.155635833740234, + "load_loss": 0.07085077464580536, + "step": 3 + }, + { + "loss": 5.213442325592041, + "ce_loss": 5.212599754333496, + "load_loss": 0.08426888287067413, + "step": 3 + }, + { + "loss": 5.340024948120117, + "ce_loss": 5.338743209838867, + "load_loss": 0.12816232442855835, + "step": 3 + }, + { + "loss": 5.129477024078369, + "ce_loss": 5.128434181213379, + "load_loss": 0.10427110642194748, + "step": 3 + }, + { + "loss": 5.244553565979004, + "ce_loss": 5.2438459396362305, + "load_loss": 0.07077465951442719, + "step": 3 + }, + { + "loss": 5.15726375579834, + "ce_loss": 5.15578031539917, + "load_loss": 0.14832347631454468, + "step": 3 + }, + { + "loss": 5.134742736816406, + "ce_loss": 5.133810520172119, + "load_loss": 0.09322977066040039, + "step": 3 + }, + { + "loss": 5.174201011657715, + "ce_loss": 5.172897815704346, + "load_loss": 0.13031411170959473, + "step": 3 + }, + { + "loss": 5.129069805145264, + "ce_loss": 5.127540111541748, + "load_loss": 0.1529626101255417, + "step": 3 + }, + { + "loss": 5.213240623474121, + "ce_loss": 5.212150573730469, + "load_loss": 0.10898395627737045, + "step": 3 + }, + { + "loss": 5.324206352233887, + "ce_loss": 5.3231987953186035, + "load_loss": 0.10076746344566345, + "step": 3 + }, + { + "loss": 5.121259689331055, + "ce_loss": 5.120218753814697, + "load_loss": 0.10410068184137344, + "step": 3 + }, + { + "loss": 5.175106048583984, + "ce_loss": 5.173721790313721, + "load_loss": 0.1384047120809555, + "step": 3 + }, + { + "loss": 5.233923435211182, + "ce_loss": 5.233304023742676, + "load_loss": 0.06194015219807625, + "step": 3 + }, + { + "loss": 5.13226842880249, + "ce_loss": 5.1311445236206055, + "load_loss": 0.11239616572856903, + "step": 3 + }, + { + "loss": 5.290378570556641, + "ce_loss": 5.2893242835998535, + "load_loss": 0.105433389544487, + "step": 3 + }, + { + "loss": 5.275423526763916, + "ce_loss": 5.274381637573242, + "load_loss": 0.10420408844947815, + "step": 3 + }, + { + "loss": 5.125052452087402, + "ce_loss": 5.1240668296813965, + "load_loss": 0.0985807329416275, + "step": 3 + }, + { + "loss": 5.129659652709961, + "ce_loss": 5.12827730178833, + "load_loss": 0.13821706175804138, + "step": 3 + }, + { + "loss": 5.228230953216553, + "ce_loss": 5.227156162261963, + "load_loss": 0.10747317224740982, + "step": 3 + }, + { + "loss": 5.205542087554932, + "ce_loss": 5.204185485839844, + "load_loss": 0.1356760859489441, + "step": 3 + }, + { + "loss": 5.469588756561279, + "ce_loss": 5.468235969543457, + "load_loss": 0.1352892816066742, + "step": 3 + }, + { + "loss": 5.13189172744751, + "ce_loss": 5.130489826202393, + "load_loss": 0.1401749551296234, + "step": 3 + }, + { + "loss": 5.167385578155518, + "ce_loss": 5.166370868682861, + "load_loss": 0.10145679861307144, + "step": 3 + }, + { + "loss": 5.4257378578186035, + "ce_loss": 5.424793720245361, + "load_loss": 0.09440402686595917, + "step": 3 + }, + { + "loss": 5.136709690093994, + "ce_loss": 5.135167121887207, + "load_loss": 0.15426085889339447, + "step": 3 + }, + { + "loss": 5.1786274909973145, + "ce_loss": 5.177438259124756, + "load_loss": 0.11890608072280884, + "step": 3 + }, + { + "loss": 5.1467180252075195, + "ce_loss": 5.145693302154541, + "load_loss": 0.10247978568077087, + "step": 3 + }, + { + "loss": 5.11523962020874, + "ce_loss": 5.114311695098877, + "load_loss": 0.0928051620721817, + "step": 3 + }, + { + "loss": 5.155282020568848, + "ce_loss": 5.154057502746582, + "load_loss": 0.12243413925170898, + "step": 3 + }, + { + "loss": 5.136712074279785, + "ce_loss": 5.13557767868042, + "load_loss": 0.11342586576938629, + "step": 3 + }, + { + "loss": 5.131498336791992, + "ce_loss": 5.130566120147705, + "load_loss": 0.09322928637266159, + "step": 3 + }, + { + "loss": 5.244434356689453, + "ce_loss": 5.243031024932861, + "load_loss": 0.14032958447933197, + "step": 3 + }, + { + "loss": 5.225911617279053, + "ce_loss": 5.225388526916504, + "load_loss": 0.0522894524037838, + "step": 3 + }, + { + "loss": 5.209970474243164, + "ce_loss": 5.208925724029541, + "load_loss": 0.10449035465717316, + "step": 3 + }, + { + "loss": 5.20566463470459, + "ce_loss": 5.2043609619140625, + "load_loss": 0.13037298619747162, + "step": 3 + }, + { + "loss": 5.149158477783203, + "ce_loss": 5.148135662078857, + "load_loss": 0.10227729380130768, + "step": 3 + }, + { + "loss": 5.248654842376709, + "ce_loss": 5.247729301452637, + "load_loss": 0.09253133088350296, + "step": 3 + }, + { + "loss": 5.097421646118164, + "ce_loss": 5.096019268035889, + "load_loss": 0.14023813605308533, + "step": 3 + }, + { + "loss": 5.1642255783081055, + "ce_loss": 5.163351058959961, + "load_loss": 0.08746375888586044, + "step": 3 + }, + { + "loss": 5.135500431060791, + "ce_loss": 5.134281158447266, + "load_loss": 0.12192574888467789, + "step": 3 + }, + { + "loss": 5.333640098571777, + "ce_loss": 5.332828521728516, + "load_loss": 0.08113814890384674, + "step": 3 + }, + { + "loss": 5.16300106048584, + "ce_loss": 5.161525726318359, + "load_loss": 0.14751110970973969, + "step": 3 + }, + { + "loss": 5.165749549865723, + "ce_loss": 5.164829254150391, + "load_loss": 0.09202869236469269, + "step": 3 + }, + { + "loss": 5.172216892242432, + "ce_loss": 5.17129373550415, + "load_loss": 0.09233362972736359, + "step": 3 + }, + { + "loss": 5.167056560516357, + "ce_loss": 5.166024684906006, + "load_loss": 0.10319496691226959, + "step": 3 + }, + { + "loss": 5.143087387084961, + "ce_loss": 5.142531871795654, + "load_loss": 0.0555647537112236, + "step": 3 + }, + { + "loss": 5.362790107727051, + "ce_loss": 5.361782073974609, + "load_loss": 0.10079427063465118, + "step": 3 + }, + { + "loss": 5.391131401062012, + "ce_loss": 5.389885425567627, + "load_loss": 0.12459118664264679, + "step": 3 + }, + { + "loss": 5.207069396972656, + "ce_loss": 5.206437110900879, + "load_loss": 0.06325085461139679, + "step": 3 + }, + { + "loss": 5.239530563354492, + "ce_loss": 5.238580226898193, + "load_loss": 0.09503830969333649, + "step": 3 + }, + { + "loss": 5.105722427368164, + "ce_loss": 5.104574680328369, + "load_loss": 0.11479735374450684, + "step": 4 + }, + { + "loss": 5.041556358337402, + "ce_loss": 5.040302753448486, + "load_loss": 0.1253662109375, + "step": 4 + }, + { + "loss": 5.001564025878906, + "ce_loss": 5.000161170959473, + "load_loss": 0.14030754566192627, + "step": 4 + }, + { + "loss": 4.960509777069092, + "ce_loss": 4.95910120010376, + "load_loss": 0.14087817072868347, + "step": 4 + }, + { + "loss": 5.089745044708252, + "ce_loss": 5.088712215423584, + "load_loss": 0.10326103866100311, + "step": 4 + }, + { + "loss": 5.123603343963623, + "ce_loss": 5.12231969833374, + "load_loss": 0.12836289405822754, + "step": 4 + }, + { + "loss": 5.007664680480957, + "ce_loss": 5.006443977355957, + "load_loss": 0.12206554412841797, + "step": 4 + }, + { + "loss": 4.989034652709961, + "ce_loss": 4.988070964813232, + "load_loss": 0.09637725353240967, + "step": 4 + }, + { + "loss": 5.186829566955566, + "ce_loss": 5.185821533203125, + "load_loss": 0.10080672055482864, + "step": 4 + }, + { + "loss": 5.153075695037842, + "ce_loss": 5.151601791381836, + "load_loss": 0.14740148186683655, + "step": 4 + }, + { + "loss": 4.916862964630127, + "ce_loss": 4.915342807769775, + "load_loss": 0.15201716125011444, + "step": 4 + }, + { + "loss": 5.214655876159668, + "ce_loss": 5.213145732879639, + "load_loss": 0.15100614726543427, + "step": 4 + }, + { + "loss": 5.1803131103515625, + "ce_loss": 5.178628921508789, + "load_loss": 0.1684008538722992, + "step": 4 + }, + { + "loss": 5.092656135559082, + "ce_loss": 5.09163761138916, + "load_loss": 0.10184024274349213, + "step": 4 + }, + { + "loss": 5.030149936676025, + "ce_loss": 5.029284954071045, + "load_loss": 0.086519755423069, + "step": 4 + }, + { + "loss": 4.98245096206665, + "ce_loss": 4.980936050415039, + "load_loss": 0.15148964524269104, + "step": 4 + }, + { + "loss": 4.9616899490356445, + "ce_loss": 4.9602155685424805, + "load_loss": 0.14742062985897064, + "step": 4 + }, + { + "loss": 5.014886379241943, + "ce_loss": 5.013296604156494, + "load_loss": 0.15899620950222015, + "step": 4 + }, + { + "loss": 5.046016693115234, + "ce_loss": 5.044070720672607, + "load_loss": 0.19461379945278168, + "step": 4 + }, + { + "loss": 4.997530937194824, + "ce_loss": 4.996466636657715, + "load_loss": 0.10643532872200012, + "step": 4 + }, + { + "loss": 4.973173141479492, + "ce_loss": 4.972139835357666, + "load_loss": 0.10333235561847687, + "step": 4 + }, + { + "loss": 5.0746917724609375, + "ce_loss": 5.073171615600586, + "load_loss": 0.15199561417102814, + "step": 4 + }, + { + "loss": 5.131619930267334, + "ce_loss": 5.130079746246338, + "load_loss": 0.15400953590869904, + "step": 4 + }, + { + "loss": 5.134965419769287, + "ce_loss": 5.133638858795166, + "load_loss": 0.13265305757522583, + "step": 4 + }, + { + "loss": 5.06727933883667, + "ce_loss": 5.065884590148926, + "load_loss": 0.1394827514886856, + "step": 4 + }, + { + "loss": 5.052821159362793, + "ce_loss": 5.051478385925293, + "load_loss": 0.1342557668685913, + "step": 4 + }, + { + "loss": 5.11099910736084, + "ce_loss": 5.109930992126465, + "load_loss": 0.10679532587528229, + "step": 4 + }, + { + "loss": 5.167531490325928, + "ce_loss": 5.165694713592529, + "load_loss": 0.18369212746620178, + "step": 4 + }, + { + "loss": 5.051634311676025, + "ce_loss": 5.050246238708496, + "load_loss": 0.1388068050146103, + "step": 4 + }, + { + "loss": 4.986548900604248, + "ce_loss": 4.985368251800537, + "load_loss": 0.11805303394794464, + "step": 4 + }, + { + "loss": 5.037880897521973, + "ce_loss": 5.03684663772583, + "load_loss": 0.10340416431427002, + "step": 4 + }, + { + "loss": 5.289742469787598, + "ce_loss": 5.288827896118164, + "load_loss": 0.09144659340381622, + "step": 4 + }, + { + "loss": 5.136407375335693, + "ce_loss": 5.135026454925537, + "load_loss": 0.13808205723762512, + "step": 4 + }, + { + "loss": 4.953204154968262, + "ce_loss": 4.951904296875, + "load_loss": 0.1299991011619568, + "step": 4 + }, + { + "loss": 5.206218242645264, + "ce_loss": 5.205124855041504, + "load_loss": 0.10934585332870483, + "step": 4 + }, + { + "loss": 4.975628852844238, + "ce_loss": 4.974353313446045, + "load_loss": 0.1275433599948883, + "step": 4 + }, + { + "loss": 4.943752765655518, + "ce_loss": 4.942587375640869, + "load_loss": 0.11655564606189728, + "step": 4 + }, + { + "loss": 5.062301158905029, + "ce_loss": 5.061116695404053, + "load_loss": 0.11846615374088287, + "step": 4 + }, + { + "loss": 5.023245811462402, + "ce_loss": 5.021785736083984, + "load_loss": 0.1460300087928772, + "step": 4 + }, + { + "loss": 4.98094367980957, + "ce_loss": 4.97968053817749, + "load_loss": 0.12632600963115692, + "step": 4 + }, + { + "loss": 5.010547161102295, + "ce_loss": 5.0094075202941895, + "load_loss": 0.11395100504159927, + "step": 4 + }, + { + "loss": 4.943954944610596, + "ce_loss": 4.942524433135986, + "load_loss": 0.14305388927459717, + "step": 4 + }, + { + "loss": 4.979029655456543, + "ce_loss": 4.977869510650635, + "load_loss": 0.11602044850587845, + "step": 4 + }, + { + "loss": 5.134889602661133, + "ce_loss": 5.133806228637695, + "load_loss": 0.1083209440112114, + "step": 4 + }, + { + "loss": 5.069670677185059, + "ce_loss": 5.069085121154785, + "load_loss": 0.0585341639816761, + "step": 4 + }, + { + "loss": 5.005459308624268, + "ce_loss": 5.004170894622803, + "load_loss": 0.12885694205760956, + "step": 4 + }, + { + "loss": 5.015411376953125, + "ce_loss": 5.014306545257568, + "load_loss": 0.11048182845115662, + "step": 4 + }, + { + "loss": 5.28474235534668, + "ce_loss": 5.283285617828369, + "load_loss": 0.14564990997314453, + "step": 4 + }, + { + "loss": 4.988275051116943, + "ce_loss": 4.987467288970947, + "load_loss": 0.08076093345880508, + "step": 4 + }, + { + "loss": 4.962780952453613, + "ce_loss": 4.9613871574401855, + "load_loss": 0.13936881721019745, + "step": 4 + }, + { + "loss": 5.008322715759277, + "ce_loss": 5.007258892059326, + "load_loss": 0.10638267546892166, + "step": 4 + }, + { + "loss": 4.995354175567627, + "ce_loss": 4.994263648986816, + "load_loss": 0.1090327799320221, + "step": 4 + }, + { + "loss": 5.124089241027832, + "ce_loss": 5.123000621795654, + "load_loss": 0.10884226113557816, + "step": 4 + }, + { + "loss": 5.0453996658325195, + "ce_loss": 5.043872356414795, + "load_loss": 0.15275390446186066, + "step": 4 + }, + { + "loss": 5.119015693664551, + "ce_loss": 5.118017673492432, + "load_loss": 0.09979856014251709, + "step": 4 + }, + { + "loss": 4.997279644012451, + "ce_loss": 4.995699882507324, + "load_loss": 0.1579861342906952, + "step": 4 + }, + { + "loss": 5.052245140075684, + "ce_loss": 5.050884246826172, + "load_loss": 0.13609972596168518, + "step": 4 + }, + { + "loss": 5.207485198974609, + "ce_loss": 5.206484794616699, + "load_loss": 0.10004796832799911, + "step": 4 + }, + { + "loss": 5.355697154998779, + "ce_loss": 5.354294300079346, + "load_loss": 0.14026974141597748, + "step": 4 + }, + { + "loss": 5.0093770027160645, + "ce_loss": 5.008268356323242, + "load_loss": 0.11086909472942352, + "step": 4 + }, + { + "loss": 4.986634254455566, + "ce_loss": 4.98543119430542, + "load_loss": 0.12029576301574707, + "step": 4 + }, + { + "loss": 5.065466403961182, + "ce_loss": 5.0645012855529785, + "load_loss": 0.09649309515953064, + "step": 4 + }, + { + "loss": 5.1575751304626465, + "ce_loss": 5.156363487243652, + "load_loss": 0.12115120887756348, + "step": 4 + }, + { + "loss": 5.085602760314941, + "ce_loss": 5.084139347076416, + "load_loss": 0.1463335007429123, + "step": 4 + }, + { + "loss": 5.022790908813477, + "ce_loss": 5.021641731262207, + "load_loss": 0.11490314453840256, + "step": 4 + }, + { + "loss": 5.190988540649414, + "ce_loss": 5.189647197723389, + "load_loss": 0.13412077724933624, + "step": 4 + }, + { + "loss": 5.090539932250977, + "ce_loss": 5.089672088623047, + "load_loss": 0.08677539229393005, + "step": 4 + }, + { + "loss": 5.093902111053467, + "ce_loss": 5.093130588531494, + "load_loss": 0.07714144140481949, + "step": 4 + }, + { + "loss": 5.072310447692871, + "ce_loss": 5.070898056030273, + "load_loss": 0.14122331142425537, + "step": 4 + }, + { + "loss": 5.015969276428223, + "ce_loss": 5.014551162719727, + "load_loss": 0.1418173909187317, + "step": 4 + }, + { + "loss": 5.076681137084961, + "ce_loss": 5.075845241546631, + "load_loss": 0.0835723727941513, + "step": 4 + }, + { + "loss": 5.0701518058776855, + "ce_loss": 5.069005489349365, + "load_loss": 0.11465422064065933, + "step": 4 + }, + { + "loss": 5.026144027709961, + "ce_loss": 5.024903774261475, + "load_loss": 0.12404593825340271, + "step": 4 + }, + { + "loss": 4.9435601234436035, + "ce_loss": 4.942136764526367, + "load_loss": 0.14232099056243896, + "step": 4 + }, + { + "loss": 4.9994893074035645, + "ce_loss": 4.997939586639404, + "load_loss": 0.15496550500392914, + "step": 4 + }, + { + "loss": 4.991105556488037, + "ce_loss": 4.989588737487793, + "load_loss": 0.15166771411895752, + "step": 4 + }, + { + "loss": 5.034537315368652, + "ce_loss": 5.033608913421631, + "load_loss": 0.09284202009439468, + "step": 4 + }, + { + "loss": 5.101203441619873, + "ce_loss": 5.100046634674072, + "load_loss": 0.11565853655338287, + "step": 4 + }, + { + "loss": 5.478394985198975, + "ce_loss": 5.477128982543945, + "load_loss": 0.1265888214111328, + "step": 4 + }, + { + "loss": 5.012144088745117, + "ce_loss": 5.010854721069336, + "load_loss": 0.12895362079143524, + "step": 4 + }, + { + "loss": 4.975273609161377, + "ce_loss": 4.9738569259643555, + "load_loss": 0.14167378842830658, + "step": 4 + }, + { + "loss": 5.0378007888793945, + "ce_loss": 5.036388874053955, + "load_loss": 0.1412079930305481, + "step": 4 + }, + { + "loss": 5.1198320388793945, + "ce_loss": 5.118545055389404, + "load_loss": 0.12869656085968018, + "step": 4 + }, + { + "loss": 5.195223331451416, + "ce_loss": 5.193652153015137, + "load_loss": 0.1571134626865387, + "step": 4 + }, + { + "loss": 4.959562301635742, + "ce_loss": 4.9584641456604, + "load_loss": 0.10983605682849884, + "step": 4 + }, + { + "loss": 5.272184371948242, + "ce_loss": 5.271017551422119, + "load_loss": 0.11666812747716904, + "step": 4 + }, + { + "loss": 5.1047892570495605, + "ce_loss": 5.10351037979126, + "load_loss": 0.12789714336395264, + "step": 4 + }, + { + "loss": 4.998221397399902, + "ce_loss": 4.997015953063965, + "load_loss": 0.12054996192455292, + "step": 4 + }, + { + "loss": 5.057313919067383, + "ce_loss": 5.056361675262451, + "load_loss": 0.09520299732685089, + "step": 4 + }, + { + "loss": 4.953908443450928, + "ce_loss": 4.952419757843018, + "load_loss": 0.14886727929115295, + "step": 4 + }, + { + "loss": 4.963015079498291, + "ce_loss": 4.961806774139404, + "load_loss": 0.1208089292049408, + "step": 4 + }, + { + "loss": 5.159411430358887, + "ce_loss": 5.15802001953125, + "load_loss": 0.13912563025951385, + "step": 4 + }, + { + "loss": 4.970909595489502, + "ce_loss": 4.969681262969971, + "load_loss": 0.12282188981771469, + "step": 4 + }, + { + "loss": 5.083982467651367, + "ce_loss": 5.0830078125, + "load_loss": 0.09747827798128128, + "step": 4 + }, + { + "loss": 5.139321327209473, + "ce_loss": 5.137893199920654, + "load_loss": 0.14282459020614624, + "step": 4 + }, + { + "loss": 5.05523157119751, + "ce_loss": 5.054191589355469, + "load_loss": 0.10397718101739883, + "step": 4 + }, + { + "loss": 5.012917518615723, + "ce_loss": 5.012105941772461, + "load_loss": 0.08114293217658997, + "step": 4 + }, + { + "loss": 4.962013244628906, + "ce_loss": 4.960689067840576, + "load_loss": 0.13239455223083496, + "step": 4 + }, + { + "loss": 4.977715969085693, + "ce_loss": 4.976246356964111, + "load_loss": 0.14693762362003326, + "step": 4 + }, + { + "loss": 5.20817232131958, + "ce_loss": 5.207478046417236, + "load_loss": 0.06941033899784088, + "step": 4 + }, + { + "loss": 5.041216850280762, + "ce_loss": 5.04005241394043, + "load_loss": 0.11646085232496262, + "step": 4 + }, + { + "loss": 4.994439601898193, + "ce_loss": 4.993289470672607, + "load_loss": 0.11503526568412781, + "step": 4 + }, + { + "loss": 5.045073986053467, + "ce_loss": 5.043934345245361, + "load_loss": 0.11395818740129471, + "step": 4 + }, + { + "loss": 5.110751628875732, + "ce_loss": 5.109496116638184, + "load_loss": 0.12556201219558716, + "step": 4 + }, + { + "loss": 4.976954460144043, + "ce_loss": 4.975590705871582, + "load_loss": 0.13637404143810272, + "step": 4 + }, + { + "loss": 5.0020670890808105, + "ce_loss": 5.000659942626953, + "load_loss": 0.14069578051567078, + "step": 4 + }, + { + "loss": 5.0157575607299805, + "ce_loss": 5.014624118804932, + "load_loss": 0.11333011835813522, + "step": 4 + }, + { + "loss": 4.967869758605957, + "ce_loss": 4.966929912567139, + "load_loss": 0.09398180991411209, + "step": 4 + }, + { + "loss": 5.156005382537842, + "ce_loss": 5.154533386230469, + "load_loss": 0.14717984199523926, + "step": 4 + }, + { + "loss": 4.940810203552246, + "ce_loss": 4.939011096954346, + "load_loss": 0.1799108386039734, + "step": 4 + }, + { + "loss": 4.918017864227295, + "ce_loss": 4.916433334350586, + "load_loss": 0.1584385186433792, + "step": 4 + }, + { + "loss": 5.18239688873291, + "ce_loss": 5.180662155151367, + "load_loss": 0.1734880656003952, + "step": 4 + }, + { + "loss": 5.170213222503662, + "ce_loss": 5.168896675109863, + "load_loss": 0.13167506456375122, + "step": 4 + }, + { + "loss": 5.01312255859375, + "ce_loss": 5.012134552001953, + "load_loss": 0.0988239124417305, + "step": 4 + }, + { + "loss": 4.984898090362549, + "ce_loss": 4.983777046203613, + "load_loss": 0.11211134493350983, + "step": 4 + }, + { + "loss": 4.982788562774658, + "ce_loss": 4.981577396392822, + "load_loss": 0.12113254517316818, + "step": 4 + }, + { + "loss": 5.042897701263428, + "ce_loss": 5.041626930236816, + "load_loss": 0.12708763778209686, + "step": 4 + }, + { + "loss": 5.096471309661865, + "ce_loss": 5.095460414886475, + "load_loss": 0.10106857120990753, + "step": 4 + }, + { + "loss": 4.978748321533203, + "ce_loss": 4.977292060852051, + "load_loss": 0.14560729265213013, + "step": 4 + }, + { + "loss": 5.2806525230407715, + "ce_loss": 5.279472351074219, + "load_loss": 0.11803483217954636, + "step": 4 + }, + { + "loss": 5.138638973236084, + "ce_loss": 5.137416362762451, + "load_loss": 0.12227090448141098, + "step": 4 + }, + { + "loss": 5.1625518798828125, + "ce_loss": 5.161233425140381, + "load_loss": 0.13186654448509216, + "step": 4 + }, + { + "loss": 4.990941047668457, + "ce_loss": 4.989779949188232, + "load_loss": 0.11611762642860413, + "step": 4 + }, + { + "loss": 5.0500617027282715, + "ce_loss": 5.048461437225342, + "load_loss": 0.16003739833831787, + "step": 4 + }, + { + "loss": 5.106400489807129, + "ce_loss": 5.105234146118164, + "load_loss": 0.11661738157272339, + "step": 4 + }, + { + "loss": 5.290626049041748, + "ce_loss": 5.2896552085876465, + "load_loss": 0.0970948338508606, + "step": 5 + }, + { + "loss": 4.818631172180176, + "ce_loss": 4.817363739013672, + "load_loss": 0.12672428786754608, + "step": 5 + }, + { + "loss": 4.961798191070557, + "ce_loss": 4.960453987121582, + "load_loss": 0.13440656661987305, + "step": 5 + }, + { + "loss": 4.8237690925598145, + "ce_loss": 4.822427272796631, + "load_loss": 0.13420072197914124, + "step": 5 + }, + { + "loss": 4.814997673034668, + "ce_loss": 4.813769340515137, + "load_loss": 0.12283624708652496, + "step": 5 + }, + { + "loss": 4.9557108879089355, + "ce_loss": 4.954495906829834, + "load_loss": 0.12147434055805206, + "step": 5 + }, + { + "loss": 4.934597015380859, + "ce_loss": 4.933218955993652, + "load_loss": 0.13780871033668518, + "step": 5 + }, + { + "loss": 4.949193477630615, + "ce_loss": 4.948011875152588, + "load_loss": 0.11817652732133865, + "step": 5 + }, + { + "loss": 4.777073383331299, + "ce_loss": 4.775473117828369, + "load_loss": 0.160019189119339, + "step": 5 + }, + { + "loss": 4.826393127441406, + "ce_loss": 4.825381755828857, + "load_loss": 0.10114467889070511, + "step": 5 + }, + { + "loss": 4.9223456382751465, + "ce_loss": 4.920987606048584, + "load_loss": 0.1357799619436264, + "step": 5 + }, + { + "loss": 4.898773670196533, + "ce_loss": 4.89748477935791, + "load_loss": 0.1289043128490448, + "step": 5 + }, + { + "loss": 5.05389928817749, + "ce_loss": 5.052340984344482, + "load_loss": 0.1558535099029541, + "step": 5 + }, + { + "loss": 4.875833988189697, + "ce_loss": 4.874575614929199, + "load_loss": 0.12584921717643738, + "step": 5 + }, + { + "loss": 4.836881160736084, + "ce_loss": 4.835371971130371, + "load_loss": 0.15089987218379974, + "step": 5 + }, + { + "loss": 5.127742767333984, + "ce_loss": 5.126344680786133, + "load_loss": 0.13980348408222198, + "step": 5 + }, + { + "loss": 4.892400741577148, + "ce_loss": 4.891075611114502, + "load_loss": 0.13249510526657104, + "step": 5 + }, + { + "loss": 4.7972588539123535, + "ce_loss": 4.7958984375, + "load_loss": 0.136065274477005, + "step": 5 + }, + { + "loss": 4.894777297973633, + "ce_loss": 4.893580913543701, + "load_loss": 0.11962701380252838, + "step": 5 + }, + { + "loss": 4.879599571228027, + "ce_loss": 4.878396034240723, + "load_loss": 0.12037474662065506, + "step": 5 + }, + { + "loss": 4.844310283660889, + "ce_loss": 4.842886447906494, + "load_loss": 0.14238321781158447, + "step": 5 + }, + { + "loss": 4.8212761878967285, + "ce_loss": 4.8199238777160645, + "load_loss": 0.1352514773607254, + "step": 5 + }, + { + "loss": 5.091840744018555, + "ce_loss": 5.090614318847656, + "load_loss": 0.12264955788850784, + "step": 5 + }, + { + "loss": 4.809109210968018, + "ce_loss": 4.807820796966553, + "load_loss": 0.12885405123233795, + "step": 5 + }, + { + "loss": 4.9258832931518555, + "ce_loss": 4.9244184494018555, + "load_loss": 0.14649291336536407, + "step": 5 + }, + { + "loss": 4.96202278137207, + "ce_loss": 4.9609222412109375, + "load_loss": 0.11006966233253479, + "step": 5 + }, + { + "loss": 5.097322940826416, + "ce_loss": 5.096010684967041, + "load_loss": 0.1312207728624344, + "step": 5 + }, + { + "loss": 4.893229007720947, + "ce_loss": 4.89223051071167, + "load_loss": 0.09984882175922394, + "step": 5 + }, + { + "loss": 4.897961616516113, + "ce_loss": 4.896583080291748, + "load_loss": 0.13783025741577148, + "step": 5 + }, + { + "loss": 4.886246204376221, + "ce_loss": 4.8847336769104, + "load_loss": 0.15124309062957764, + "step": 5 + }, + { + "loss": 4.859015464782715, + "ce_loss": 4.857851505279541, + "load_loss": 0.11637899279594421, + "step": 5 + }, + { + "loss": 5.312042713165283, + "ce_loss": 5.310174942016602, + "load_loss": 0.1867874413728714, + "step": 5 + }, + { + "loss": 4.920048713684082, + "ce_loss": 4.918450355529785, + "load_loss": 0.1598176658153534, + "step": 5 + }, + { + "loss": 5.0131754875183105, + "ce_loss": 5.011838912963867, + "load_loss": 0.1336650550365448, + "step": 5 + }, + { + "loss": 4.855599403381348, + "ce_loss": 4.8542633056640625, + "load_loss": 0.13358844816684723, + "step": 5 + }, + { + "loss": 5.043703556060791, + "ce_loss": 5.041956901550293, + "load_loss": 0.1746862530708313, + "step": 5 + }, + { + "loss": 4.8922438621521, + "ce_loss": 4.890994071960449, + "load_loss": 0.12497846782207489, + "step": 5 + }, + { + "loss": 5.000698089599609, + "ce_loss": 4.999244689941406, + "load_loss": 0.14532677829265594, + "step": 5 + }, + { + "loss": 4.833770275115967, + "ce_loss": 4.832086086273193, + "load_loss": 0.16841378808021545, + "step": 5 + }, + { + "loss": 4.820947647094727, + "ce_loss": 4.819730758666992, + "load_loss": 0.12167300283908844, + "step": 5 + }, + { + "loss": 5.178308010101318, + "ce_loss": 5.17713737487793, + "load_loss": 0.11704248189926147, + "step": 5 + }, + { + "loss": 4.77994441986084, + "ce_loss": 4.77895975112915, + "load_loss": 0.0984572321176529, + "step": 5 + }, + { + "loss": 4.8725361824035645, + "ce_loss": 4.871399879455566, + "load_loss": 0.11364175379276276, + "step": 5 + }, + { + "loss": 5.342255592346191, + "ce_loss": 5.340713977813721, + "load_loss": 0.15417994558811188, + "step": 5 + }, + { + "loss": 4.869293689727783, + "ce_loss": 4.867892265319824, + "load_loss": 0.14012852311134338, + "step": 5 + }, + { + "loss": 4.879809856414795, + "ce_loss": 4.878472328186035, + "load_loss": 0.13374833762645721, + "step": 5 + }, + { + "loss": 4.86292028427124, + "ce_loss": 4.861630916595459, + "load_loss": 0.12895171344280243, + "step": 5 + }, + { + "loss": 4.867336750030518, + "ce_loss": 4.866026401519775, + "load_loss": 0.13101541996002197, + "step": 5 + }, + { + "loss": 4.851133346557617, + "ce_loss": 4.849943161010742, + "load_loss": 0.11901857703924179, + "step": 5 + }, + { + "loss": 4.916110992431641, + "ce_loss": 4.91441011428833, + "load_loss": 0.17007537186145782, + "step": 5 + }, + { + "loss": 4.959451198577881, + "ce_loss": 4.958427429199219, + "load_loss": 0.10236633569002151, + "step": 5 + }, + { + "loss": 4.897066116333008, + "ce_loss": 4.895788669586182, + "load_loss": 0.12774011492729187, + "step": 5 + }, + { + "loss": 5.159424304962158, + "ce_loss": 5.158260822296143, + "load_loss": 0.11635793745517731, + "step": 5 + }, + { + "loss": 4.889738082885742, + "ce_loss": 4.888802528381348, + "load_loss": 0.09355385601520538, + "step": 5 + }, + { + "loss": 4.8767852783203125, + "ce_loss": 4.875661373138428, + "load_loss": 0.11240668594837189, + "step": 5 + }, + { + "loss": 4.828258991241455, + "ce_loss": 4.8272833824157715, + "load_loss": 0.09755438566207886, + "step": 5 + }, + { + "loss": 4.964545249938965, + "ce_loss": 4.963242530822754, + "load_loss": 0.1302868127822876, + "step": 5 + }, + { + "loss": 4.913424015045166, + "ce_loss": 4.912200450897217, + "load_loss": 0.12237286567687988, + "step": 5 + }, + { + "loss": 4.860200881958008, + "ce_loss": 4.858964443206787, + "load_loss": 0.12363377213478088, + "step": 5 + }, + { + "loss": 4.8831353187561035, + "ce_loss": 4.881842613220215, + "load_loss": 0.12925615906715393, + "step": 5 + }, + { + "loss": 4.769160270690918, + "ce_loss": 4.767755508422852, + "load_loss": 0.14048179984092712, + "step": 5 + }, + { + "loss": 5.026341438293457, + "ce_loss": 5.024953842163086, + "load_loss": 0.1387670785188675, + "step": 5 + }, + { + "loss": 4.867936611175537, + "ce_loss": 4.866633415222168, + "load_loss": 0.13030022382736206, + "step": 5 + }, + { + "loss": 4.902166843414307, + "ce_loss": 4.900944709777832, + "load_loss": 0.12222685664892197, + "step": 5 + }, + { + "loss": 5.036012172698975, + "ce_loss": 5.034929275512695, + "load_loss": 0.10828791558742523, + "step": 5 + }, + { + "loss": 4.879532814025879, + "ce_loss": 4.877954959869385, + "load_loss": 0.15777502954006195, + "step": 5 + }, + { + "loss": 4.865845203399658, + "ce_loss": 4.864627838134766, + "load_loss": 0.1217242181301117, + "step": 5 + }, + { + "loss": 5.011448860168457, + "ce_loss": 5.010199546813965, + "load_loss": 0.12491334974765778, + "step": 5 + }, + { + "loss": 4.893879413604736, + "ce_loss": 4.892507553100586, + "load_loss": 0.13717444241046906, + "step": 5 + }, + { + "loss": 4.8745317459106445, + "ce_loss": 4.8738017082214355, + "load_loss": 0.0729944184422493, + "step": 5 + }, + { + "loss": 4.996376037597656, + "ce_loss": 4.995105266571045, + "load_loss": 0.1270550787448883, + "step": 5 + }, + { + "loss": 5.014294624328613, + "ce_loss": 5.0127058029174805, + "load_loss": 0.1589057296514511, + "step": 5 + }, + { + "loss": 4.907698154449463, + "ce_loss": 4.906002521514893, + "load_loss": 0.16955308616161346, + "step": 5 + }, + { + "loss": 4.899357795715332, + "ce_loss": 4.897809982299805, + "load_loss": 0.15479031205177307, + "step": 5 + }, + { + "loss": 4.884696006774902, + "ce_loss": 4.882867813110352, + "load_loss": 0.18283717334270477, + "step": 5 + }, + { + "loss": 5.194336891174316, + "ce_loss": 5.192911148071289, + "load_loss": 0.14257995784282684, + "step": 5 + }, + { + "loss": 4.8899970054626465, + "ce_loss": 4.889023303985596, + "load_loss": 0.09735142439603806, + "step": 5 + }, + { + "loss": 4.941700458526611, + "ce_loss": 4.940612316131592, + "load_loss": 0.10879343748092651, + "step": 5 + }, + { + "loss": 5.2609052658081055, + "ce_loss": 5.25977087020874, + "load_loss": 0.11344979703426361, + "step": 5 + }, + { + "loss": 5.101428508758545, + "ce_loss": 5.100186347961426, + "load_loss": 0.12423980981111526, + "step": 5 + }, + { + "loss": 4.885984897613525, + "ce_loss": 4.884743690490723, + "load_loss": 0.12412780523300171, + "step": 5 + }, + { + "loss": 5.175535202026367, + "ce_loss": 5.174375534057617, + "load_loss": 0.11597113311290741, + "step": 5 + }, + { + "loss": 4.981139659881592, + "ce_loss": 4.980381965637207, + "load_loss": 0.07577090710401535, + "step": 5 + }, + { + "loss": 4.853254795074463, + "ce_loss": 4.851715087890625, + "load_loss": 0.15395256876945496, + "step": 5 + }, + { + "loss": 4.838575839996338, + "ce_loss": 4.837349891662598, + "load_loss": 0.12260694801807404, + "step": 5 + }, + { + "loss": 4.9921674728393555, + "ce_loss": 4.991384506225586, + "load_loss": 0.07831043750047684, + "step": 5 + }, + { + "loss": 5.074146270751953, + "ce_loss": 5.072839260101318, + "load_loss": 0.13067936897277832, + "step": 5 + }, + { + "loss": 4.8408098220825195, + "ce_loss": 4.839382171630859, + "load_loss": 0.14278246462345123, + "step": 5 + }, + { + "loss": 5.067137241363525, + "ce_loss": 5.065629005432129, + "load_loss": 0.15082614123821259, + "step": 5 + }, + { + "loss": 4.955542087554932, + "ce_loss": 4.954446315765381, + "load_loss": 0.10956989228725433, + "step": 5 + }, + { + "loss": 4.932624816894531, + "ce_loss": 4.930913925170898, + "load_loss": 0.17107011377811432, + "step": 5 + }, + { + "loss": 4.873562812805176, + "ce_loss": 4.871925354003906, + "load_loss": 0.163763165473938, + "step": 5 + }, + { + "loss": 4.9365081787109375, + "ce_loss": 4.935154914855957, + "load_loss": 0.13530316948890686, + "step": 5 + }, + { + "loss": 4.9882121086120605, + "ce_loss": 4.987473964691162, + "load_loss": 0.073827363550663, + "step": 5 + }, + { + "loss": 4.87101411819458, + "ce_loss": 4.869230270385742, + "load_loss": 0.1783880889415741, + "step": 5 + }, + { + "loss": 5.000949382781982, + "ce_loss": 4.999066352844238, + "load_loss": 0.1882929801940918, + "step": 5 + }, + { + "loss": 4.832135200500488, + "ce_loss": 4.831289768218994, + "load_loss": 0.08456328511238098, + "step": 5 + }, + { + "loss": 5.274632453918457, + "ce_loss": 5.273238658905029, + "load_loss": 0.13937264680862427, + "step": 5 + }, + { + "loss": 4.900485992431641, + "ce_loss": 4.898824691772461, + "load_loss": 0.16611887514591217, + "step": 5 + }, + { + "loss": 5.147662162780762, + "ce_loss": 5.146243095397949, + "load_loss": 0.14188632369041443, + "step": 5 + }, + { + "loss": 4.854607582092285, + "ce_loss": 4.853281021118164, + "load_loss": 0.132649227976799, + "step": 5 + }, + { + "loss": 4.950091361999512, + "ce_loss": 4.948530673980713, + "load_loss": 0.15608759224414825, + "step": 5 + }, + { + "loss": 4.842403888702393, + "ce_loss": 4.841009140014648, + "load_loss": 0.13949422538280487, + "step": 5 + }, + { + "loss": 4.84272575378418, + "ce_loss": 4.841470718383789, + "load_loss": 0.12549352645874023, + "step": 5 + }, + { + "loss": 4.917208671569824, + "ce_loss": 4.916077613830566, + "load_loss": 0.11311183124780655, + "step": 5 + }, + { + "loss": 4.921689987182617, + "ce_loss": 4.920042037963867, + "load_loss": 0.16479524970054626, + "step": 5 + }, + { + "loss": 4.832238674163818, + "ce_loss": 4.831122875213623, + "load_loss": 0.11157423257827759, + "step": 5 + }, + { + "loss": 4.829413890838623, + "ce_loss": 4.828509330749512, + "load_loss": 0.09045661985874176, + "step": 5 + }, + { + "loss": 4.8725385665893555, + "ce_loss": 4.871006965637207, + "load_loss": 0.15315744280815125, + "step": 5 + }, + { + "loss": 5.010220527648926, + "ce_loss": 5.008493900299072, + "load_loss": 0.1726723313331604, + "step": 5 + }, + { + "loss": 4.9563422203063965, + "ce_loss": 4.955264091491699, + "load_loss": 0.10779102146625519, + "step": 5 + }, + { + "loss": 4.847928524017334, + "ce_loss": 4.8466081619262695, + "load_loss": 0.13202691078186035, + "step": 5 + }, + { + "loss": 4.919735431671143, + "ce_loss": 4.918035507202148, + "load_loss": 0.1699714958667755, + "step": 5 + }, + { + "loss": 4.8555684089660645, + "ce_loss": 4.854043483734131, + "load_loss": 0.1524949073791504, + "step": 5 + }, + { + "loss": 4.894381046295166, + "ce_loss": 4.89319372177124, + "load_loss": 0.11872416734695435, + "step": 5 + }, + { + "loss": 5.018799304962158, + "ce_loss": 5.017637729644775, + "load_loss": 0.11617746204137802, + "step": 5 + }, + { + "loss": 4.869941711425781, + "ce_loss": 4.868724346160889, + "load_loss": 0.12173762917518616, + "step": 5 + }, + { + "loss": 4.860079765319824, + "ce_loss": 4.858872890472412, + "load_loss": 0.12067729234695435, + "step": 5 + }, + { + "loss": 5.04349422454834, + "ce_loss": 5.042275428771973, + "load_loss": 0.1218893826007843, + "step": 5 + }, + { + "loss": 4.775557518005371, + "ce_loss": 4.77417516708374, + "load_loss": 0.13824385404586792, + "step": 5 + }, + { + "loss": 4.829329967498779, + "ce_loss": 4.827751159667969, + "load_loss": 0.15787412226200104, + "step": 5 + }, + { + "loss": 4.888046741485596, + "ce_loss": 4.886868953704834, + "load_loss": 0.11777537316083908, + "step": 5 + }, + { + "loss": 4.869625091552734, + "ce_loss": 4.868274211883545, + "load_loss": 0.1350896656513214, + "step": 5 + }, + { + "loss": 4.815764427185059, + "ce_loss": 4.814654350280762, + "load_loss": 0.1109858900308609, + "step": 5 + }, + { + "loss": 4.961215972900391, + "ce_loss": 4.96022367477417, + "load_loss": 0.0992107093334198, + "step": 5 + }, + { + "loss": 4.846055507659912, + "ce_loss": 4.844780921936035, + "load_loss": 0.12743565440177917, + "step": 6 + }, + { + "loss": 4.774820327758789, + "ce_loss": 4.773776531219482, + "load_loss": 0.10436013340950012, + "step": 6 + }, + { + "loss": 4.757609844207764, + "ce_loss": 4.756335735321045, + "load_loss": 0.12740261852741241, + "step": 6 + }, + { + "loss": 4.837573051452637, + "ce_loss": 4.836209297180176, + "load_loss": 0.136389821767807, + "step": 6 + }, + { + "loss": 4.754680633544922, + "ce_loss": 4.753264427185059, + "load_loss": 0.14162877202033997, + "step": 6 + }, + { + "loss": 4.738608360290527, + "ce_loss": 4.737152576446533, + "load_loss": 0.14559341967105865, + "step": 6 + }, + { + "loss": 4.870166778564453, + "ce_loss": 4.869107246398926, + "load_loss": 0.10596859455108643, + "step": 6 + }, + { + "loss": 4.647329807281494, + "ce_loss": 4.645685195922852, + "load_loss": 0.16445392370224, + "step": 6 + }, + { + "loss": 4.6962504386901855, + "ce_loss": 4.695173263549805, + "load_loss": 0.10769719630479813, + "step": 6 + }, + { + "loss": 4.760800361633301, + "ce_loss": 4.759346008300781, + "load_loss": 0.145417258143425, + "step": 6 + }, + { + "loss": 4.770374298095703, + "ce_loss": 4.7686991691589355, + "load_loss": 0.16751956939697266, + "step": 6 + }, + { + "loss": 4.630374431610107, + "ce_loss": 4.628481864929199, + "load_loss": 0.18923839926719666, + "step": 6 + }, + { + "loss": 4.95698356628418, + "ce_loss": 4.956023216247559, + "load_loss": 0.09602779895067215, + "step": 6 + }, + { + "loss": 4.737622261047363, + "ce_loss": 4.736242771148682, + "load_loss": 0.13792839646339417, + "step": 6 + }, + { + "loss": 4.762267589569092, + "ce_loss": 4.76108455657959, + "load_loss": 0.11829094588756561, + "step": 6 + }, + { + "loss": 5.271988868713379, + "ce_loss": 5.270596027374268, + "load_loss": 0.13928984105587006, + "step": 6 + }, + { + "loss": 4.893436908721924, + "ce_loss": 4.892152309417725, + "load_loss": 0.12844809889793396, + "step": 6 + }, + { + "loss": 4.721114635467529, + "ce_loss": 4.719810962677002, + "load_loss": 0.1303902119398117, + "step": 6 + }, + { + "loss": 4.817175388336182, + "ce_loss": 4.8153910636901855, + "load_loss": 0.1784479320049286, + "step": 6 + }, + { + "loss": 4.736242771148682, + "ce_loss": 4.7346601486206055, + "load_loss": 0.1582752764225006, + "step": 6 + }, + { + "loss": 4.884071350097656, + "ce_loss": 4.883116245269775, + "load_loss": 0.0955289900302887, + "step": 6 + }, + { + "loss": 4.722914218902588, + "ce_loss": 4.722056865692139, + "load_loss": 0.08574233949184418, + "step": 6 + }, + { + "loss": 4.780397415161133, + "ce_loss": 4.778840065002441, + "load_loss": 0.1557285636663437, + "step": 6 + }, + { + "loss": 4.66785192489624, + "ce_loss": 4.666070938110352, + "load_loss": 0.17812049388885498, + "step": 6 + }, + { + "loss": 4.715280532836914, + "ce_loss": 4.713840484619141, + "load_loss": 0.14402374625205994, + "step": 6 + }, + { + "loss": 4.721773147583008, + "ce_loss": 4.7202959060668945, + "load_loss": 0.147738978266716, + "step": 6 + }, + { + "loss": 4.920031547546387, + "ce_loss": 4.919066905975342, + "load_loss": 0.09648783504962921, + "step": 6 + }, + { + "loss": 4.799487590789795, + "ce_loss": 4.797939300537109, + "load_loss": 0.1548132747411728, + "step": 6 + }, + { + "loss": 4.765450477600098, + "ce_loss": 4.763806343078613, + "load_loss": 0.1644333451986313, + "step": 6 + }, + { + "loss": 4.750949382781982, + "ce_loss": 4.749456882476807, + "load_loss": 0.14925839006900787, + "step": 6 + }, + { + "loss": 4.88720703125, + "ce_loss": 4.8858842849731445, + "load_loss": 0.13229642808437347, + "step": 6 + }, + { + "loss": 4.744002342224121, + "ce_loss": 4.742257595062256, + "load_loss": 0.17445935308933258, + "step": 6 + }, + { + "loss": 4.800455093383789, + "ce_loss": 4.798869609832764, + "load_loss": 0.15855772793293, + "step": 6 + }, + { + "loss": 4.697412014007568, + "ce_loss": 4.696535587310791, + "load_loss": 0.08766385167837143, + "step": 6 + }, + { + "loss": 4.749873161315918, + "ce_loss": 4.748236656188965, + "load_loss": 0.16363008320331573, + "step": 6 + }, + { + "loss": 4.669769287109375, + "ce_loss": 4.668026924133301, + "load_loss": 0.1742396205663681, + "step": 6 + }, + { + "loss": 4.71203088760376, + "ce_loss": 4.710367202758789, + "load_loss": 0.1663491129875183, + "step": 6 + }, + { + "loss": 4.774081707000732, + "ce_loss": 4.7728190422058105, + "load_loss": 0.12627096474170685, + "step": 6 + }, + { + "loss": 5.055183410644531, + "ce_loss": 5.053896427154541, + "load_loss": 0.1287195384502411, + "step": 6 + }, + { + "loss": 4.832553386688232, + "ce_loss": 4.831343173980713, + "load_loss": 0.12104349583387375, + "step": 6 + }, + { + "loss": 4.68254280090332, + "ce_loss": 4.680818557739258, + "load_loss": 0.17242054641246796, + "step": 6 + }, + { + "loss": 4.773293495178223, + "ce_loss": 4.771780490875244, + "load_loss": 0.15130725502967834, + "step": 6 + }, + { + "loss": 4.7425079345703125, + "ce_loss": 4.740633964538574, + "load_loss": 0.18737384676933289, + "step": 6 + }, + { + "loss": 4.946664333343506, + "ce_loss": 4.945047378540039, + "load_loss": 0.16168414056301117, + "step": 6 + }, + { + "loss": 4.9566264152526855, + "ce_loss": 4.955048561096191, + "load_loss": 0.1577846109867096, + "step": 6 + }, + { + "loss": 4.773850440979004, + "ce_loss": 4.772455215454102, + "load_loss": 0.1395244002342224, + "step": 6 + }, + { + "loss": 4.682232856750488, + "ce_loss": 4.680924892425537, + "load_loss": 0.13078898191452026, + "step": 6 + }, + { + "loss": 4.7810821533203125, + "ce_loss": 4.779726982116699, + "load_loss": 0.13551953434944153, + "step": 6 + }, + { + "loss": 4.757134914398193, + "ce_loss": 4.755643844604492, + "load_loss": 0.1491233855485916, + "step": 6 + }, + { + "loss": 4.6687912940979, + "ce_loss": 4.6677045822143555, + "load_loss": 0.10865172743797302, + "step": 6 + }, + { + "loss": 4.970254898071289, + "ce_loss": 4.969211578369141, + "load_loss": 0.10431849211454391, + "step": 6 + }, + { + "loss": 4.695629596710205, + "ce_loss": 4.694540977478027, + "load_loss": 0.10886907577514648, + "step": 6 + }, + { + "loss": 4.79782772064209, + "ce_loss": 4.796354293823242, + "load_loss": 0.14733687043190002, + "step": 6 + }, + { + "loss": 5.137404441833496, + "ce_loss": 5.136138916015625, + "load_loss": 0.1265677660703659, + "step": 6 + }, + { + "loss": 4.760657787322998, + "ce_loss": 4.75935173034668, + "load_loss": 0.13060131669044495, + "step": 6 + }, + { + "loss": 5.049295425415039, + "ce_loss": 5.047582626342773, + "load_loss": 0.1712668538093567, + "step": 6 + }, + { + "loss": 4.943414211273193, + "ce_loss": 4.941761493682861, + "load_loss": 0.1652710735797882, + "step": 6 + }, + { + "loss": 4.674397945404053, + "ce_loss": 4.672693729400635, + "load_loss": 0.17041811347007751, + "step": 6 + }, + { + "loss": 4.726748466491699, + "ce_loss": 4.725289821624756, + "load_loss": 0.1458490490913391, + "step": 6 + }, + { + "loss": 4.862025737762451, + "ce_loss": 4.860691070556641, + "load_loss": 0.13347212970256805, + "step": 6 + }, + { + "loss": 4.703556537628174, + "ce_loss": 4.702502250671387, + "load_loss": 0.10544392466545105, + "step": 6 + }, + { + "loss": 4.715970993041992, + "ce_loss": 4.714035987854004, + "load_loss": 0.1934964954853058, + "step": 6 + }, + { + "loss": 4.706308364868164, + "ce_loss": 4.705056667327881, + "load_loss": 0.12516753375530243, + "step": 6 + }, + { + "loss": 4.697547435760498, + "ce_loss": 4.696513652801514, + "load_loss": 0.10336634516716003, + "step": 6 + }, + { + "loss": 4.906116485595703, + "ce_loss": 4.9051899909973145, + "load_loss": 0.09263426065444946, + "step": 6 + }, + { + "loss": 4.766894340515137, + "ce_loss": 4.765006065368652, + "load_loss": 0.1888415664434433, + "step": 6 + }, + { + "loss": 4.94364595413208, + "ce_loss": 4.942134857177734, + "load_loss": 0.15112389624118805, + "step": 6 + }, + { + "loss": 5.36491060256958, + "ce_loss": 5.36350679397583, + "load_loss": 0.14038079977035522, + "step": 6 + }, + { + "loss": 4.718177318572998, + "ce_loss": 4.717108726501465, + "load_loss": 0.10687047243118286, + "step": 6 + }, + { + "loss": 4.735644817352295, + "ce_loss": 4.733755111694336, + "load_loss": 0.188984215259552, + "step": 6 + }, + { + "loss": 4.751328468322754, + "ce_loss": 4.750280857086182, + "load_loss": 0.10478091984987259, + "step": 6 + }, + { + "loss": 4.890024185180664, + "ce_loss": 4.8886566162109375, + "load_loss": 0.13676561415195465, + "step": 6 + }, + { + "loss": 4.948148250579834, + "ce_loss": 4.9472150802612305, + "load_loss": 0.09330300986766815, + "step": 6 + }, + { + "loss": 4.733623504638672, + "ce_loss": 4.732082843780518, + "load_loss": 0.154087096452713, + "step": 6 + }, + { + "loss": 4.719979763031006, + "ce_loss": 4.718499660491943, + "load_loss": 0.1480041891336441, + "step": 6 + }, + { + "loss": 4.696141719818115, + "ce_loss": 4.694974422454834, + "load_loss": 0.11673084646463394, + "step": 6 + }, + { + "loss": 4.899826526641846, + "ce_loss": 4.898248672485352, + "load_loss": 0.1578051745891571, + "step": 6 + }, + { + "loss": 5.071712017059326, + "ce_loss": 5.070132255554199, + "load_loss": 0.15799331665039062, + "step": 6 + }, + { + "loss": 4.706161022186279, + "ce_loss": 4.704991817474365, + "load_loss": 0.11691179126501083, + "step": 6 + }, + { + "loss": 4.720216751098633, + "ce_loss": 4.718722343444824, + "load_loss": 0.14945369958877563, + "step": 6 + }, + { + "loss": 5.2769060134887695, + "ce_loss": 5.275165557861328, + "load_loss": 0.17406538128852844, + "step": 6 + }, + { + "loss": 4.797750473022461, + "ce_loss": 4.796431541442871, + "load_loss": 0.13190291821956635, + "step": 6 + }, + { + "loss": 4.675431728363037, + "ce_loss": 4.673956394195557, + "load_loss": 0.14754414558410645, + "step": 6 + }, + { + "loss": 4.760585308074951, + "ce_loss": 4.758798599243164, + "load_loss": 0.17867004871368408, + "step": 6 + }, + { + "loss": 5.1015191078186035, + "ce_loss": 5.100021839141846, + "load_loss": 0.14972129464149475, + "step": 6 + }, + { + "loss": 4.755246639251709, + "ce_loss": 4.753688335418701, + "load_loss": 0.15581569075584412, + "step": 6 + }, + { + "loss": 4.735243320465088, + "ce_loss": 4.734127521514893, + "load_loss": 0.11156130582094193, + "step": 6 + }, + { + "loss": 4.779728889465332, + "ce_loss": 4.778358459472656, + "load_loss": 0.13702362775802612, + "step": 6 + }, + { + "loss": 4.734323501586914, + "ce_loss": 4.73355770111084, + "load_loss": 0.07658470422029495, + "step": 6 + }, + { + "loss": 4.744997501373291, + "ce_loss": 4.743070125579834, + "load_loss": 0.19275163114070892, + "step": 6 + }, + { + "loss": 4.69105339050293, + "ce_loss": 4.689414024353027, + "load_loss": 0.1639474630355835, + "step": 6 + }, + { + "loss": 5.223947048187256, + "ce_loss": 5.222323417663574, + "load_loss": 0.1623840183019638, + "step": 6 + }, + { + "loss": 4.649318218231201, + "ce_loss": 4.64793586730957, + "load_loss": 0.1382218301296234, + "step": 6 + }, + { + "loss": 4.678218364715576, + "ce_loss": 4.676529884338379, + "load_loss": 0.16884461045265198, + "step": 6 + }, + { + "loss": 4.805236339569092, + "ce_loss": 4.803460597991943, + "load_loss": 0.1775757074356079, + "step": 6 + }, + { + "loss": 4.835171699523926, + "ce_loss": 4.833616733551025, + "load_loss": 0.15548394620418549, + "step": 6 + }, + { + "loss": 4.718822002410889, + "ce_loss": 4.717070579528809, + "load_loss": 0.17512236535549164, + "step": 6 + }, + { + "loss": 4.74401330947876, + "ce_loss": 4.742424964904785, + "load_loss": 0.15881143510341644, + "step": 6 + }, + { + "loss": 4.729469299316406, + "ce_loss": 4.72845458984375, + "load_loss": 0.10147928446531296, + "step": 6 + }, + { + "loss": 4.9102864265441895, + "ce_loss": 4.908633708953857, + "load_loss": 0.165268674492836, + "step": 6 + }, + { + "loss": 4.620763778686523, + "ce_loss": 4.619132995605469, + "load_loss": 0.163070946931839, + "step": 6 + }, + { + "loss": 4.810704708099365, + "ce_loss": 4.809329032897949, + "load_loss": 0.13755738735198975, + "step": 6 + }, + { + "loss": 4.891191005706787, + "ce_loss": 4.8892927169799805, + "load_loss": 0.18985068798065186, + "step": 6 + }, + { + "loss": 4.754910469055176, + "ce_loss": 4.753417491912842, + "load_loss": 0.14929716289043427, + "step": 6 + }, + { + "loss": 5.136593818664551, + "ce_loss": 5.135116100311279, + "load_loss": 0.14776578545570374, + "step": 6 + }, + { + "loss": 4.768642902374268, + "ce_loss": 4.767439365386963, + "load_loss": 0.12035560607910156, + "step": 6 + }, + { + "loss": 4.862582683563232, + "ce_loss": 4.8604912757873535, + "load_loss": 0.209121435880661, + "step": 6 + }, + { + "loss": 4.87473726272583, + "ce_loss": 4.873154640197754, + "load_loss": 0.15824656188488007, + "step": 6 + }, + { + "loss": 4.773401737213135, + "ce_loss": 4.77182674407959, + "load_loss": 0.1575189232826233, + "step": 6 + }, + { + "loss": 4.8127546310424805, + "ce_loss": 4.811598300933838, + "load_loss": 0.11563317477703094, + "step": 6 + }, + { + "loss": 4.761439323425293, + "ce_loss": 4.75981330871582, + "load_loss": 0.16259893774986267, + "step": 6 + }, + { + "loss": 4.737564563751221, + "ce_loss": 4.736052989959717, + "load_loss": 0.15116219222545624, + "step": 6 + }, + { + "loss": 4.65061616897583, + "ce_loss": 4.649356365203857, + "load_loss": 0.12596507370471954, + "step": 6 + }, + { + "loss": 4.815762996673584, + "ce_loss": 4.814575672149658, + "load_loss": 0.11872799694538116, + "step": 6 + }, + { + "loss": 4.778446197509766, + "ce_loss": 4.776551723480225, + "load_loss": 0.18943612277507782, + "step": 6 + }, + { + "loss": 4.766861438751221, + "ce_loss": 4.765481472015381, + "load_loss": 0.13801074028015137, + "step": 6 + }, + { + "loss": 4.762087821960449, + "ce_loss": 4.76092004776001, + "load_loss": 0.11678732931613922, + "step": 6 + }, + { + "loss": 4.745720386505127, + "ce_loss": 4.744539737701416, + "load_loss": 0.11808222532272339, + "step": 6 + }, + { + "loss": 4.824373245239258, + "ce_loss": 4.8228912353515625, + "load_loss": 0.14818033576011658, + "step": 6 + }, + { + "loss": 4.819917678833008, + "ce_loss": 4.8185133934021, + "load_loss": 0.1404171884059906, + "step": 6 + }, + { + "loss": 4.960516929626465, + "ce_loss": 4.959470748901367, + "load_loss": 0.10462629795074463, + "step": 6 + }, + { + "loss": 4.83809232711792, + "ce_loss": 4.836843013763428, + "load_loss": 0.12493681907653809, + "step": 6 + }, + { + "loss": 4.766984462738037, + "ce_loss": 4.765711307525635, + "load_loss": 0.127317413687706, + "step": 6 + }, + { + "loss": 4.703835964202881, + "ce_loss": 4.702975273132324, + "load_loss": 0.0860913097858429, + "step": 6 + }, + { + "loss": 4.928010940551758, + "ce_loss": 4.926743507385254, + "load_loss": 0.1267501413822174, + "step": 6 + }, + { + "loss": 4.719653606414795, + "ce_loss": 4.717951774597168, + "load_loss": 0.17017494142055511, + "step": 7 + }, + { + "loss": 4.56519889831543, + "ce_loss": 4.563364028930664, + "load_loss": 0.1834704875946045, + "step": 7 + }, + { + "loss": 4.8537726402282715, + "ce_loss": 4.85237979888916, + "load_loss": 0.13929174840450287, + "step": 7 + }, + { + "loss": 4.91811466217041, + "ce_loss": 4.9163994789123535, + "load_loss": 0.17149999737739563, + "step": 7 + }, + { + "loss": 4.750820159912109, + "ce_loss": 4.749937057495117, + "load_loss": 0.08831537514925003, + "step": 7 + }, + { + "loss": 4.673011779785156, + "ce_loss": 4.671802997589111, + "load_loss": 0.1208922266960144, + "step": 7 + }, + { + "loss": 4.751174449920654, + "ce_loss": 4.749674320220947, + "load_loss": 0.15000087022781372, + "step": 7 + }, + { + "loss": 4.588021755218506, + "ce_loss": 4.586489677429199, + "load_loss": 0.1531866490840912, + "step": 7 + }, + { + "loss": 4.814282417297363, + "ce_loss": 4.812992095947266, + "load_loss": 0.12901201844215393, + "step": 7 + }, + { + "loss": 4.5619049072265625, + "ce_loss": 4.560385227203369, + "load_loss": 0.1519664227962494, + "step": 7 + }, + { + "loss": 4.8420586585998535, + "ce_loss": 4.841032028198242, + "load_loss": 0.10266696661710739, + "step": 7 + }, + { + "loss": 4.620840549468994, + "ce_loss": 4.619616985321045, + "load_loss": 0.12234558165073395, + "step": 7 + }, + { + "loss": 4.578613758087158, + "ce_loss": 4.577227592468262, + "load_loss": 0.13863208889961243, + "step": 7 + }, + { + "loss": 4.764087200164795, + "ce_loss": 4.762157917022705, + "load_loss": 0.1929100900888443, + "step": 7 + }, + { + "loss": 4.594468593597412, + "ce_loss": 4.593311786651611, + "load_loss": 0.11569587886333466, + "step": 7 + }, + { + "loss": 4.631911754608154, + "ce_loss": 4.629833221435547, + "load_loss": 0.20784713327884674, + "step": 7 + }, + { + "loss": 4.825191974639893, + "ce_loss": 4.82396936416626, + "load_loss": 0.12223978340625763, + "step": 7 + }, + { + "loss": 4.579054832458496, + "ce_loss": 4.577614784240723, + "load_loss": 0.14401991665363312, + "step": 7 + }, + { + "loss": 4.626672744750977, + "ce_loss": 4.625114917755127, + "load_loss": 0.1557711660861969, + "step": 7 + }, + { + "loss": 4.749643802642822, + "ce_loss": 4.748318672180176, + "load_loss": 0.13249364495277405, + "step": 7 + }, + { + "loss": 4.652554512023926, + "ce_loss": 4.650982856750488, + "load_loss": 0.15715175867080688, + "step": 7 + }, + { + "loss": 4.905162811279297, + "ce_loss": 4.903087139129639, + "load_loss": 0.2075517475605011, + "step": 7 + }, + { + "loss": 4.5943169593811035, + "ce_loss": 4.59273624420166, + "load_loss": 0.15807566046714783, + "step": 7 + }, + { + "loss": 4.763587474822998, + "ce_loss": 4.762064456939697, + "load_loss": 0.15232019126415253, + "step": 7 + }, + { + "loss": 4.584417343139648, + "ce_loss": 4.583102703094482, + "load_loss": 0.13148503005504608, + "step": 7 + }, + { + "loss": 4.720241069793701, + "ce_loss": 4.7183122634887695, + "load_loss": 0.19289717078208923, + "step": 7 + }, + { + "loss": 4.659064769744873, + "ce_loss": 4.657410144805908, + "load_loss": 0.16548171639442444, + "step": 7 + }, + { + "loss": 4.561006546020508, + "ce_loss": 4.5594024658203125, + "load_loss": 0.16042083501815796, + "step": 7 + }, + { + "loss": 4.609738826751709, + "ce_loss": 4.607920169830322, + "load_loss": 0.18187928199768066, + "step": 7 + }, + { + "loss": 5.047382354736328, + "ce_loss": 5.045466899871826, + "load_loss": 0.19154050946235657, + "step": 7 + }, + { + "loss": 4.620100975036621, + "ce_loss": 4.618234157562256, + "load_loss": 0.18669411540031433, + "step": 7 + }, + { + "loss": 4.572187423706055, + "ce_loss": 4.570816516876221, + "load_loss": 0.1371002346277237, + "step": 7 + }, + { + "loss": 5.318172454833984, + "ce_loss": 5.316612720489502, + "load_loss": 0.15596744418144226, + "step": 7 + }, + { + "loss": 4.654269218444824, + "ce_loss": 4.6528849601745605, + "load_loss": 0.13843342661857605, + "step": 7 + }, + { + "loss": 4.705007553100586, + "ce_loss": 4.703812122344971, + "load_loss": 0.11955185234546661, + "step": 7 + }, + { + "loss": 4.792496204376221, + "ce_loss": 4.790971279144287, + "load_loss": 0.1524791121482849, + "step": 7 + }, + { + "loss": 4.697828769683838, + "ce_loss": 4.696099758148193, + "load_loss": 0.17289063334465027, + "step": 7 + }, + { + "loss": 4.623258590698242, + "ce_loss": 4.621745586395264, + "load_loss": 0.15131059288978577, + "step": 7 + }, + { + "loss": 4.634652137756348, + "ce_loss": 4.633242130279541, + "load_loss": 0.14100119471549988, + "step": 7 + }, + { + "loss": 4.69765567779541, + "ce_loss": 4.696142196655273, + "load_loss": 0.1513608694076538, + "step": 7 + }, + { + "loss": 4.727609157562256, + "ce_loss": 4.725805282592773, + "load_loss": 0.18039384484291077, + "step": 7 + }, + { + "loss": 4.5812296867370605, + "ce_loss": 4.579615116119385, + "load_loss": 0.16143617033958435, + "step": 7 + }, + { + "loss": 4.611410617828369, + "ce_loss": 4.609738349914551, + "load_loss": 0.16722898185253143, + "step": 7 + }, + { + "loss": 4.690121173858643, + "ce_loss": 4.688251495361328, + "load_loss": 0.1869703084230423, + "step": 7 + }, + { + "loss": 4.910267353057861, + "ce_loss": 4.908802509307861, + "load_loss": 0.14647182822227478, + "step": 7 + }, + { + "loss": 4.619054317474365, + "ce_loss": 4.617735385894775, + "load_loss": 0.13187995553016663, + "step": 7 + }, + { + "loss": 4.693589210510254, + "ce_loss": 4.692035675048828, + "load_loss": 0.1553681194782257, + "step": 7 + }, + { + "loss": 4.698826789855957, + "ce_loss": 4.697298526763916, + "load_loss": 0.15280798077583313, + "step": 7 + }, + { + "loss": 4.599837303161621, + "ce_loss": 4.598466873168945, + "load_loss": 0.13704469799995422, + "step": 7 + }, + { + "loss": 4.735747814178467, + "ce_loss": 4.733868598937988, + "load_loss": 0.18791669607162476, + "step": 7 + }, + { + "loss": 4.772045135498047, + "ce_loss": 4.770461082458496, + "load_loss": 0.1584131419658661, + "step": 7 + }, + { + "loss": 4.618276596069336, + "ce_loss": 4.61634635925293, + "load_loss": 0.19302639365196228, + "step": 7 + }, + { + "loss": 4.6697821617126465, + "ce_loss": 4.6681976318359375, + "load_loss": 0.1584342122077942, + "step": 7 + }, + { + "loss": 4.587678909301758, + "ce_loss": 4.5865325927734375, + "load_loss": 0.1146484762430191, + "step": 7 + }, + { + "loss": 4.702242851257324, + "ce_loss": 4.700340270996094, + "load_loss": 0.19024178385734558, + "step": 7 + }, + { + "loss": 4.61588191986084, + "ce_loss": 4.614152908325195, + "load_loss": 0.1728973388671875, + "step": 7 + }, + { + "loss": 4.751852989196777, + "ce_loss": 4.750592231750488, + "load_loss": 0.12609432637691498, + "step": 7 + }, + { + "loss": 5.427748203277588, + "ce_loss": 5.426389694213867, + "load_loss": 0.13585655391216278, + "step": 7 + }, + { + "loss": 4.722622394561768, + "ce_loss": 4.7214202880859375, + "load_loss": 0.12018758058547974, + "step": 7 + }, + { + "loss": 4.822697639465332, + "ce_loss": 4.821579456329346, + "load_loss": 0.11181071400642395, + "step": 7 + }, + { + "loss": 4.8774614334106445, + "ce_loss": 4.875921726226807, + "load_loss": 0.1539621502161026, + "step": 7 + }, + { + "loss": 4.664033889770508, + "ce_loss": 4.662491798400879, + "load_loss": 0.154207244515419, + "step": 7 + }, + { + "loss": 4.706447124481201, + "ce_loss": 4.7053022384643555, + "load_loss": 0.11449960619211197, + "step": 7 + }, + { + "loss": 4.691031455993652, + "ce_loss": 4.689380168914795, + "load_loss": 0.16511215269565582, + "step": 7 + }, + { + "loss": 5.15080451965332, + "ce_loss": 5.149381160736084, + "load_loss": 0.14235258102416992, + "step": 7 + }, + { + "loss": 4.595117568969727, + "ce_loss": 4.593714714050293, + "load_loss": 0.1402941644191742, + "step": 7 + }, + { + "loss": 4.672632694244385, + "ce_loss": 4.670848369598389, + "load_loss": 0.17841249704360962, + "step": 7 + }, + { + "loss": 4.687108039855957, + "ce_loss": 4.685398578643799, + "load_loss": 0.17094659805297852, + "step": 7 + }, + { + "loss": 4.937878608703613, + "ce_loss": 4.936484336853027, + "load_loss": 0.13942769169807434, + "step": 7 + }, + { + "loss": 4.609994888305664, + "ce_loss": 4.60813570022583, + "load_loss": 0.18591763079166412, + "step": 7 + }, + { + "loss": 4.526098251342773, + "ce_loss": 4.524715900421143, + "load_loss": 0.13824672996997833, + "step": 7 + }, + { + "loss": 4.606593608856201, + "ce_loss": 4.604963779449463, + "load_loss": 0.1629919707775116, + "step": 7 + }, + { + "loss": 4.615144729614258, + "ce_loss": 4.6135358810424805, + "load_loss": 0.16086314618587494, + "step": 7 + }, + { + "loss": 4.668472766876221, + "ce_loss": 4.666412353515625, + "load_loss": 0.2060289978981018, + "step": 7 + }, + { + "loss": 4.578979969024658, + "ce_loss": 4.577608585357666, + "load_loss": 0.13713470101356506, + "step": 7 + }, + { + "loss": 4.594782829284668, + "ce_loss": 4.593109607696533, + "load_loss": 0.16733334958553314, + "step": 7 + }, + { + "loss": 4.712697505950928, + "ce_loss": 4.711035251617432, + "load_loss": 0.16623234748840332, + "step": 7 + }, + { + "loss": 4.7517900466918945, + "ce_loss": 4.750376224517822, + "load_loss": 0.14137651026248932, + "step": 7 + }, + { + "loss": 4.7150444984436035, + "ce_loss": 4.713601112365723, + "load_loss": 0.14433011412620544, + "step": 7 + }, + { + "loss": 4.639660835266113, + "ce_loss": 4.6378655433654785, + "load_loss": 0.17954367399215698, + "step": 7 + }, + { + "loss": 4.8388166427612305, + "ce_loss": 4.837156772613525, + "load_loss": 0.16597189009189606, + "step": 7 + }, + { + "loss": 4.58594274520874, + "ce_loss": 4.584188938140869, + "load_loss": 0.17539042234420776, + "step": 7 + }, + { + "loss": 4.7419657707214355, + "ce_loss": 4.740464210510254, + "load_loss": 0.15017080307006836, + "step": 7 + }, + { + "loss": 4.554733753204346, + "ce_loss": 4.553150177001953, + "load_loss": 0.15834037959575653, + "step": 7 + }, + { + "loss": 4.60679817199707, + "ce_loss": 4.605113506317139, + "load_loss": 0.168484628200531, + "step": 7 + }, + { + "loss": 4.820178985595703, + "ce_loss": 4.818552494049072, + "load_loss": 0.1626449078321457, + "step": 7 + }, + { + "loss": 4.729384422302246, + "ce_loss": 4.727717399597168, + "load_loss": 0.1666947454214096, + "step": 7 + }, + { + "loss": 5.100430488586426, + "ce_loss": 5.098937511444092, + "load_loss": 0.1493067443370819, + "step": 7 + }, + { + "loss": 4.670891284942627, + "ce_loss": 4.66953706741333, + "load_loss": 0.13542285561561584, + "step": 7 + }, + { + "loss": 4.805309295654297, + "ce_loss": 4.804079055786133, + "load_loss": 0.12300954014062881, + "step": 7 + }, + { + "loss": 4.73900842666626, + "ce_loss": 4.737569332122803, + "load_loss": 0.14393040537834167, + "step": 7 + }, + { + "loss": 4.792140007019043, + "ce_loss": 4.790698051452637, + "load_loss": 0.1441793292760849, + "step": 7 + }, + { + "loss": 4.660822868347168, + "ce_loss": 4.659458637237549, + "load_loss": 0.13643722236156464, + "step": 7 + }, + { + "loss": 4.629177093505859, + "ce_loss": 4.627232074737549, + "load_loss": 0.19450704753398895, + "step": 7 + }, + { + "loss": 4.636930465698242, + "ce_loss": 4.635324478149414, + "load_loss": 0.16059747338294983, + "step": 7 + }, + { + "loss": 4.611499309539795, + "ce_loss": 4.609652042388916, + "load_loss": 0.18470889329910278, + "step": 7 + }, + { + "loss": 4.910333156585693, + "ce_loss": 4.908915042877197, + "load_loss": 0.14181403815746307, + "step": 7 + }, + { + "loss": 4.694431304931641, + "ce_loss": 4.692738056182861, + "load_loss": 0.16932141780853271, + "step": 7 + }, + { + "loss": 4.623430252075195, + "ce_loss": 4.622118949890137, + "load_loss": 0.13110780715942383, + "step": 7 + }, + { + "loss": 4.564480781555176, + "ce_loss": 4.562869548797607, + "load_loss": 0.16113075613975525, + "step": 7 + }, + { + "loss": 4.554691314697266, + "ce_loss": 4.553230285644531, + "load_loss": 0.14610323309898376, + "step": 7 + }, + { + "loss": 4.631114959716797, + "ce_loss": 4.629305362701416, + "load_loss": 0.18095970153808594, + "step": 7 + }, + { + "loss": 4.604038715362549, + "ce_loss": 4.602653980255127, + "load_loss": 0.138463094830513, + "step": 7 + }, + { + "loss": 4.796709060668945, + "ce_loss": 4.795337200164795, + "load_loss": 0.13719214498996735, + "step": 7 + }, + { + "loss": 4.723158836364746, + "ce_loss": 4.721692085266113, + "load_loss": 0.14665615558624268, + "step": 7 + }, + { + "loss": 4.589303493499756, + "ce_loss": 4.58770751953125, + "load_loss": 0.1595783233642578, + "step": 7 + }, + { + "loss": 4.599321365356445, + "ce_loss": 4.5975661277771, + "load_loss": 0.1755005419254303, + "step": 7 + }, + { + "loss": 4.601973056793213, + "ce_loss": 4.600655555725098, + "load_loss": 0.13174544274806976, + "step": 7 + }, + { + "loss": 4.595872402191162, + "ce_loss": 4.594264030456543, + "load_loss": 0.16081863641738892, + "step": 7 + }, + { + "loss": 4.5791449546813965, + "ce_loss": 4.577596664428711, + "load_loss": 0.15480946004390717, + "step": 7 + }, + { + "loss": 4.636533737182617, + "ce_loss": 4.635072708129883, + "load_loss": 0.14611569046974182, + "step": 7 + }, + { + "loss": 4.572009086608887, + "ce_loss": 4.570135593414307, + "load_loss": 0.18737098574638367, + "step": 7 + }, + { + "loss": 4.842492580413818, + "ce_loss": 4.840884685516357, + "load_loss": 0.16078799962997437, + "step": 7 + }, + { + "loss": 4.608424663543701, + "ce_loss": 4.606971263885498, + "load_loss": 0.1453181654214859, + "step": 7 + }, + { + "loss": 4.747304916381836, + "ce_loss": 4.745694637298584, + "load_loss": 0.16102831065654755, + "step": 7 + }, + { + "loss": 4.597240924835205, + "ce_loss": 4.595911979675293, + "load_loss": 0.13288572430610657, + "step": 7 + }, + { + "loss": 4.60433292388916, + "ce_loss": 4.602591037750244, + "load_loss": 0.17416590452194214, + "step": 7 + }, + { + "loss": 4.652182579040527, + "ce_loss": 4.65057373046875, + "load_loss": 0.1608942747116089, + "step": 7 + }, + { + "loss": 4.695618152618408, + "ce_loss": 4.694099426269531, + "load_loss": 0.1518864780664444, + "step": 7 + }, + { + "loss": 4.6272759437561035, + "ce_loss": 4.625590801239014, + "load_loss": 0.16849994659423828, + "step": 7 + }, + { + "loss": 4.735241889953613, + "ce_loss": 4.733664035797119, + "load_loss": 0.1577669084072113, + "step": 7 + }, + { + "loss": 4.696555137634277, + "ce_loss": 4.695301532745361, + "load_loss": 0.12534131109714508, + "step": 7 + }, + { + "loss": 4.522485733032227, + "ce_loss": 4.52081823348999, + "load_loss": 0.16673783957958221, + "step": 7 + }, + { + "loss": 4.667792320251465, + "ce_loss": 4.666574954986572, + "load_loss": 0.12172949314117432, + "step": 7 + }, + { + "loss": 4.790217876434326, + "ce_loss": 4.789135456085205, + "load_loss": 0.1082596704363823, + "step": 7 + }, + { + "loss": 4.564183712005615, + "ce_loss": 4.56264066696167, + "load_loss": 0.1543082445859909, + "step": 8 + }, + { + "loss": 4.611279010772705, + "ce_loss": 4.609615802764893, + "load_loss": 0.16630221903324127, + "step": 8 + }, + { + "loss": 4.50180196762085, + "ce_loss": 4.500031471252441, + "load_loss": 0.17703668773174286, + "step": 8 + }, + { + "loss": 4.838124752044678, + "ce_loss": 4.83656120300293, + "load_loss": 0.15636476874351501, + "step": 8 + }, + { + "loss": 4.801764965057373, + "ce_loss": 4.800063610076904, + "load_loss": 0.17011508345603943, + "step": 8 + }, + { + "loss": 4.585259437561035, + "ce_loss": 4.583858966827393, + "load_loss": 0.14003469049930573, + "step": 8 + }, + { + "loss": 4.8109517097473145, + "ce_loss": 4.80912446975708, + "load_loss": 0.182717964053154, + "step": 8 + }, + { + "loss": 4.55617618560791, + "ce_loss": 4.554617404937744, + "load_loss": 0.15588366985321045, + "step": 8 + }, + { + "loss": 4.602419376373291, + "ce_loss": 4.601103782653809, + "load_loss": 0.13158267736434937, + "step": 8 + }, + { + "loss": 4.535086631774902, + "ce_loss": 4.533388614654541, + "load_loss": 0.16980251669883728, + "step": 8 + }, + { + "loss": 4.498399257659912, + "ce_loss": 4.496716499328613, + "load_loss": 0.16829219460487366, + "step": 8 + }, + { + "loss": 4.599291801452637, + "ce_loss": 4.597559452056885, + "load_loss": 0.17325109243392944, + "step": 8 + }, + { + "loss": 4.6213459968566895, + "ce_loss": 4.619945049285889, + "load_loss": 0.1400720328092575, + "step": 8 + }, + { + "loss": 4.435547828674316, + "ce_loss": 4.433986186981201, + "load_loss": 0.15616707503795624, + "step": 8 + }, + { + "loss": 4.920144557952881, + "ce_loss": 4.918412685394287, + "load_loss": 0.17319317162036896, + "step": 8 + }, + { + "loss": 4.880865097045898, + "ce_loss": 4.879348278045654, + "load_loss": 0.15167251229286194, + "step": 8 + }, + { + "loss": 4.749228477478027, + "ce_loss": 4.747267723083496, + "load_loss": 0.1960834264755249, + "step": 8 + }, + { + "loss": 4.760655403137207, + "ce_loss": 4.758770942687988, + "load_loss": 0.18844377994537354, + "step": 8 + }, + { + "loss": 4.7401347160339355, + "ce_loss": 4.738302230834961, + "load_loss": 0.18324501812458038, + "step": 8 + }, + { + "loss": 4.494149684906006, + "ce_loss": 4.49249792098999, + "load_loss": 0.1651872992515564, + "step": 8 + }, + { + "loss": 5.034966468811035, + "ce_loss": 5.033369064331055, + "load_loss": 0.15976309776306152, + "step": 8 + }, + { + "loss": 4.485203742980957, + "ce_loss": 4.483374118804932, + "load_loss": 0.18295541405677795, + "step": 8 + }, + { + "loss": 4.746823787689209, + "ce_loss": 4.745244026184082, + "load_loss": 0.1579861342906952, + "step": 8 + }, + { + "loss": 4.462760925292969, + "ce_loss": 4.461207389831543, + "load_loss": 0.15537479519844055, + "step": 8 + }, + { + "loss": 4.737006187438965, + "ce_loss": 4.735307693481445, + "load_loss": 0.1698642522096634, + "step": 8 + }, + { + "loss": 4.532962322235107, + "ce_loss": 4.531397342681885, + "load_loss": 0.1564830094575882, + "step": 8 + }, + { + "loss": 4.573707580566406, + "ce_loss": 4.571878433227539, + "load_loss": 0.18292619287967682, + "step": 8 + }, + { + "loss": 4.643583297729492, + "ce_loss": 4.641932487487793, + "load_loss": 0.165068119764328, + "step": 8 + }, + { + "loss": 4.483240604400635, + "ce_loss": 4.481675624847412, + "load_loss": 0.1565007120370865, + "step": 8 + }, + { + "loss": 4.884979724884033, + "ce_loss": 4.883645534515381, + "load_loss": 0.13340750336647034, + "step": 8 + }, + { + "loss": 4.498594284057617, + "ce_loss": 4.497044563293457, + "load_loss": 0.15495353937149048, + "step": 8 + }, + { + "loss": 4.866496562957764, + "ce_loss": 4.865097999572754, + "load_loss": 0.13986045122146606, + "step": 8 + }, + { + "loss": 4.8104095458984375, + "ce_loss": 4.809332847595215, + "load_loss": 0.1076713502407074, + "step": 8 + }, + { + "loss": 5.071938991546631, + "ce_loss": 5.070371150970459, + "load_loss": 0.15680038928985596, + "step": 8 + }, + { + "loss": 4.768524169921875, + "ce_loss": 4.767110347747803, + "load_loss": 0.14140330255031586, + "step": 8 + }, + { + "loss": 4.543979167938232, + "ce_loss": 4.542386531829834, + "load_loss": 0.15926094353199005, + "step": 8 + }, + { + "loss": 4.498645305633545, + "ce_loss": 4.497056007385254, + "load_loss": 0.15891243517398834, + "step": 8 + }, + { + "loss": 4.6829400062561035, + "ce_loss": 4.681360721588135, + "load_loss": 0.1579301357269287, + "step": 8 + }, + { + "loss": 4.698750019073486, + "ce_loss": 4.697086334228516, + "load_loss": 0.16635248064994812, + "step": 8 + }, + { + "loss": 4.860175609588623, + "ce_loss": 4.8585615158081055, + "load_loss": 0.16141080856323242, + "step": 8 + }, + { + "loss": 4.492092132568359, + "ce_loss": 4.49028205871582, + "load_loss": 0.18100468814373016, + "step": 8 + }, + { + "loss": 4.62700891494751, + "ce_loss": 4.62546443939209, + "load_loss": 0.1544269621372223, + "step": 8 + }, + { + "loss": 4.5407633781433105, + "ce_loss": 4.539175987243652, + "load_loss": 0.15875446796417236, + "step": 8 + }, + { + "loss": 4.58378791809082, + "ce_loss": 4.582204341888428, + "load_loss": 0.1583748459815979, + "step": 8 + }, + { + "loss": 4.727247714996338, + "ce_loss": 4.725451469421387, + "load_loss": 0.1796480268239975, + "step": 8 + }, + { + "loss": 4.532161235809326, + "ce_loss": 4.530611038208008, + "load_loss": 0.15503014624118805, + "step": 8 + }, + { + "loss": 4.934046745300293, + "ce_loss": 4.933002471923828, + "load_loss": 0.1044171079993248, + "step": 8 + }, + { + "loss": 4.53216028213501, + "ce_loss": 4.530281066894531, + "load_loss": 0.18794256448745728, + "step": 8 + }, + { + "loss": 4.787412643432617, + "ce_loss": 4.78574800491333, + "load_loss": 0.16646496951580048, + "step": 8 + }, + { + "loss": 4.563728332519531, + "ce_loss": 4.561739921569824, + "load_loss": 0.19883981347084045, + "step": 8 + }, + { + "loss": 4.565825462341309, + "ce_loss": 4.564077854156494, + "load_loss": 0.17475518584251404, + "step": 8 + }, + { + "loss": 4.451100826263428, + "ce_loss": 4.449386119842529, + "load_loss": 0.17147797346115112, + "step": 8 + }, + { + "loss": 4.481180667877197, + "ce_loss": 4.479358673095703, + "load_loss": 0.1822110116481781, + "step": 8 + }, + { + "loss": 4.63729190826416, + "ce_loss": 4.635491371154785, + "load_loss": 0.1800338625907898, + "step": 8 + }, + { + "loss": 4.547484397888184, + "ce_loss": 4.545652389526367, + "load_loss": 0.18319620192050934, + "step": 8 + }, + { + "loss": 5.06574010848999, + "ce_loss": 5.0642313957214355, + "load_loss": 0.15087257325649261, + "step": 8 + }, + { + "loss": 4.520502090454102, + "ce_loss": 4.518734455108643, + "load_loss": 0.17675137519836426, + "step": 8 + }, + { + "loss": 4.59569787979126, + "ce_loss": 4.593988418579102, + "load_loss": 0.17093464732170105, + "step": 8 + }, + { + "loss": 4.430959701538086, + "ce_loss": 4.42954158782959, + "load_loss": 0.14183461666107178, + "step": 8 + }, + { + "loss": 4.689673900604248, + "ce_loss": 4.688210964202881, + "load_loss": 0.1463133990764618, + "step": 8 + }, + { + "loss": 4.511449337005615, + "ce_loss": 4.5100507736206055, + "load_loss": 0.13983269035816193, + "step": 8 + }, + { + "loss": 4.497646331787109, + "ce_loss": 4.4962077140808105, + "load_loss": 0.14385859668254852, + "step": 8 + }, + { + "loss": 4.579916477203369, + "ce_loss": 4.578255653381348, + "load_loss": 0.16607770323753357, + "step": 8 + }, + { + "loss": 4.57789945602417, + "ce_loss": 4.576443195343018, + "load_loss": 0.14563794434070587, + "step": 8 + }, + { + "loss": 4.6810126304626465, + "ce_loss": 4.679560661315918, + "load_loss": 0.1452181190252304, + "step": 8 + }, + { + "loss": 4.698313236236572, + "ce_loss": 4.696773052215576, + "load_loss": 0.15402533113956451, + "step": 8 + }, + { + "loss": 4.524057865142822, + "ce_loss": 4.522525310516357, + "load_loss": 0.15326324105262756, + "step": 8 + }, + { + "loss": 4.827587604522705, + "ce_loss": 4.825892925262451, + "load_loss": 0.1694817692041397, + "step": 8 + }, + { + "loss": 4.660487174987793, + "ce_loss": 4.65886116027832, + "load_loss": 0.16259607672691345, + "step": 8 + }, + { + "loss": 4.590516567230225, + "ce_loss": 4.5888590812683105, + "load_loss": 0.16573207080364227, + "step": 8 + }, + { + "loss": 4.5967817306518555, + "ce_loss": 4.595085620880127, + "load_loss": 0.16963064670562744, + "step": 8 + }, + { + "loss": 4.717798709869385, + "ce_loss": 4.715978622436523, + "load_loss": 0.1820257604122162, + "step": 8 + }, + { + "loss": 4.651412010192871, + "ce_loss": 4.650023937225342, + "load_loss": 0.13879533112049103, + "step": 8 + }, + { + "loss": 4.601981163024902, + "ce_loss": 4.600490093231201, + "load_loss": 0.1490985006093979, + "step": 8 + }, + { + "loss": 5.050583362579346, + "ce_loss": 5.048878192901611, + "load_loss": 0.17052438855171204, + "step": 8 + }, + { + "loss": 4.798221111297607, + "ce_loss": 4.796472549438477, + "load_loss": 0.17485715448856354, + "step": 8 + }, + { + "loss": 4.691749572753906, + "ce_loss": 4.690081596374512, + "load_loss": 0.16680964827537537, + "step": 8 + }, + { + "loss": 4.596169471740723, + "ce_loss": 4.594388008117676, + "load_loss": 0.17816069722175598, + "step": 8 + }, + { + "loss": 4.65920352935791, + "ce_loss": 4.65749454498291, + "load_loss": 0.17091500759124756, + "step": 8 + }, + { + "loss": 5.06365442276001, + "ce_loss": 5.062100410461426, + "load_loss": 0.15541070699691772, + "step": 8 + }, + { + "loss": 4.5500054359436035, + "ce_loss": 4.548675060272217, + "load_loss": 0.13302548229694366, + "step": 8 + }, + { + "loss": 4.539022445678711, + "ce_loss": 4.5373101234436035, + "load_loss": 0.17123766243457794, + "step": 8 + }, + { + "loss": 4.574374198913574, + "ce_loss": 4.572775840759277, + "load_loss": 0.15983346104621887, + "step": 8 + }, + { + "loss": 4.494575023651123, + "ce_loss": 4.492996692657471, + "load_loss": 0.15781429409980774, + "step": 8 + }, + { + "loss": 4.5450053215026855, + "ce_loss": 4.543238162994385, + "load_loss": 0.1767183542251587, + "step": 8 + }, + { + "loss": 4.442013263702393, + "ce_loss": 4.440333843231201, + "load_loss": 0.16792741417884827, + "step": 8 + }, + { + "loss": 4.531535625457764, + "ce_loss": 4.530003547668457, + "load_loss": 0.1531885713338852, + "step": 8 + }, + { + "loss": 4.457118988037109, + "ce_loss": 4.455575466156006, + "load_loss": 0.15436473488807678, + "step": 8 + }, + { + "loss": 4.734434604644775, + "ce_loss": 4.733259677886963, + "load_loss": 0.11750969290733337, + "step": 8 + }, + { + "loss": 4.556101322174072, + "ce_loss": 4.554550647735596, + "load_loss": 0.1550583839416504, + "step": 8 + }, + { + "loss": 4.901827812194824, + "ce_loss": 4.900021553039551, + "load_loss": 0.18061405420303345, + "step": 8 + }, + { + "loss": 4.529775142669678, + "ce_loss": 4.527968406677246, + "load_loss": 0.18067342042922974, + "step": 8 + }, + { + "loss": 4.8250908851623535, + "ce_loss": 4.823431491851807, + "load_loss": 0.16592881083488464, + "step": 8 + }, + { + "loss": 4.576887607574463, + "ce_loss": 4.5752854347229, + "load_loss": 0.16023270785808563, + "step": 8 + }, + { + "loss": 4.574178218841553, + "ce_loss": 4.572418212890625, + "load_loss": 0.17597828805446625, + "step": 8 + }, + { + "loss": 4.632482528686523, + "ce_loss": 4.630932331085205, + "load_loss": 0.1550392359495163, + "step": 8 + }, + { + "loss": 4.645779132843018, + "ce_loss": 4.643946647644043, + "load_loss": 0.18326081335544586, + "step": 8 + }, + { + "loss": 4.493447780609131, + "ce_loss": 4.491526126861572, + "load_loss": 0.19218578934669495, + "step": 8 + }, + { + "loss": 4.593158721923828, + "ce_loss": 4.591472625732422, + "load_loss": 0.16859090328216553, + "step": 8 + }, + { + "loss": 4.539381980895996, + "ce_loss": 4.537477970123291, + "load_loss": 0.19041459262371063, + "step": 8 + }, + { + "loss": 4.6170196533203125, + "ce_loss": 4.615307807922363, + "load_loss": 0.1711902618408203, + "step": 8 + }, + { + "loss": 4.517987251281738, + "ce_loss": 4.516186237335205, + "load_loss": 0.18010568618774414, + "step": 8 + }, + { + "loss": 4.491471767425537, + "ce_loss": 4.489874839782715, + "load_loss": 0.15970422327518463, + "step": 8 + }, + { + "loss": 4.585572242736816, + "ce_loss": 4.584146499633789, + "load_loss": 0.14257949590682983, + "step": 8 + }, + { + "loss": 4.552011013031006, + "ce_loss": 4.550271511077881, + "load_loss": 0.17392750084400177, + "step": 8 + }, + { + "loss": 4.458287715911865, + "ce_loss": 4.456879615783691, + "load_loss": 0.14079152047634125, + "step": 8 + }, + { + "loss": 4.4681077003479, + "ce_loss": 4.4663896560668945, + "load_loss": 0.1718212068080902, + "step": 8 + }, + { + "loss": 4.579757213592529, + "ce_loss": 4.578100204467773, + "load_loss": 0.16570095717906952, + "step": 8 + }, + { + "loss": 5.043086528778076, + "ce_loss": 5.041384696960449, + "load_loss": 0.17017781734466553, + "step": 8 + }, + { + "loss": 4.512306213378906, + "ce_loss": 4.510446548461914, + "load_loss": 0.1859544962644577, + "step": 8 + }, + { + "loss": 4.698381423950195, + "ce_loss": 4.696890830993652, + "load_loss": 0.14907121658325195, + "step": 8 + }, + { + "loss": 4.597009658813477, + "ce_loss": 4.595345973968506, + "load_loss": 0.16638168692588806, + "step": 8 + }, + { + "loss": 4.580239295959473, + "ce_loss": 4.5784382820129395, + "load_loss": 0.18009324371814728, + "step": 8 + }, + { + "loss": 4.670261383056641, + "ce_loss": 4.668701171875, + "load_loss": 0.15600907802581787, + "step": 8 + }, + { + "loss": 4.814944267272949, + "ce_loss": 4.813685417175293, + "load_loss": 0.12588225305080414, + "step": 8 + }, + { + "loss": 4.578847408294678, + "ce_loss": 4.577186107635498, + "load_loss": 0.16615380346775055, + "step": 8 + }, + { + "loss": 4.5628485679626465, + "ce_loss": 4.5607476234436035, + "load_loss": 0.21011283993721008, + "step": 8 + }, + { + "loss": 4.550915241241455, + "ce_loss": 4.549561500549316, + "load_loss": 0.1353505551815033, + "step": 8 + }, + { + "loss": 4.557919502258301, + "ce_loss": 4.556314945220947, + "load_loss": 0.16046679019927979, + "step": 8 + }, + { + "loss": 4.774209499359131, + "ce_loss": 4.772717475891113, + "load_loss": 0.1491846740245819, + "step": 8 + }, + { + "loss": 4.60324764251709, + "ce_loss": 4.602005958557129, + "load_loss": 0.12418380379676819, + "step": 8 + }, + { + "loss": 4.51777458190918, + "ce_loss": 4.5163679122924805, + "load_loss": 0.14065270125865936, + "step": 8 + }, + { + "loss": 4.499476432800293, + "ce_loss": 4.497992515563965, + "load_loss": 0.14839336276054382, + "step": 8 + }, + { + "loss": 4.495580196380615, + "ce_loss": 4.493810176849365, + "load_loss": 0.17700126767158508, + "step": 8 + }, + { + "loss": 4.552156925201416, + "ce_loss": 4.5507402420043945, + "load_loss": 0.14166037738323212, + "step": 8 + }, + { + "loss": 4.570185661315918, + "ce_loss": 4.568483352661133, + "load_loss": 0.17024530470371246, + "step": 9 + }, + { + "loss": 4.486547470092773, + "ce_loss": 4.484549522399902, + "load_loss": 0.19979292154312134, + "step": 9 + }, + { + "loss": 4.367212772369385, + "ce_loss": 4.3655686378479, + "load_loss": 0.1643950492143631, + "step": 9 + }, + { + "loss": 4.501341819763184, + "ce_loss": 4.499776840209961, + "load_loss": 0.15650981664657593, + "step": 9 + }, + { + "loss": 4.513529300689697, + "ce_loss": 4.511865615844727, + "load_loss": 0.16635727882385254, + "step": 9 + }, + { + "loss": 4.487527847290039, + "ce_loss": 4.4857330322265625, + "load_loss": 0.1794843226671219, + "step": 9 + }, + { + "loss": 4.485169410705566, + "ce_loss": 4.483631134033203, + "load_loss": 0.15382331609725952, + "step": 9 + }, + { + "loss": 4.510141849517822, + "ce_loss": 4.508670330047607, + "load_loss": 0.1471712291240692, + "step": 9 + }, + { + "loss": 4.389777183532715, + "ce_loss": 4.3877787590026855, + "load_loss": 0.19983360171318054, + "step": 9 + }, + { + "loss": 4.703469753265381, + "ce_loss": 4.7020463943481445, + "load_loss": 0.14231620728969574, + "step": 9 + }, + { + "loss": 4.353072643280029, + "ce_loss": 4.351524353027344, + "load_loss": 0.1548376977443695, + "step": 9 + }, + { + "loss": 4.553796768188477, + "ce_loss": 4.551846504211426, + "load_loss": 0.195046067237854, + "step": 9 + }, + { + "loss": 4.376445293426514, + "ce_loss": 4.375, + "load_loss": 0.14454792439937592, + "step": 9 + }, + { + "loss": 4.972555637359619, + "ce_loss": 4.971088409423828, + "load_loss": 0.14670976996421814, + "step": 9 + }, + { + "loss": 4.489965438842773, + "ce_loss": 4.488119125366211, + "load_loss": 0.18464331328868866, + "step": 9 + }, + { + "loss": 4.4123148918151855, + "ce_loss": 4.410518169403076, + "load_loss": 0.17967818677425385, + "step": 9 + }, + { + "loss": 4.354409694671631, + "ce_loss": 4.352778911590576, + "load_loss": 0.1630905717611313, + "step": 9 + }, + { + "loss": 4.5832624435424805, + "ce_loss": 4.581306457519531, + "load_loss": 0.19560137391090393, + "step": 9 + }, + { + "loss": 4.402486801147461, + "ce_loss": 4.400864124298096, + "load_loss": 0.1622782051563263, + "step": 9 + }, + { + "loss": 4.493518352508545, + "ce_loss": 4.491552352905273, + "load_loss": 0.1966100037097931, + "step": 9 + }, + { + "loss": 4.432300090789795, + "ce_loss": 4.430467128753662, + "load_loss": 0.18330246210098267, + "step": 9 + }, + { + "loss": 4.495750427246094, + "ce_loss": 4.4938764572143555, + "load_loss": 0.1873987466096878, + "step": 9 + }, + { + "loss": 4.776342391967773, + "ce_loss": 4.774787425994873, + "load_loss": 0.15549448132514954, + "step": 9 + }, + { + "loss": 4.640838623046875, + "ce_loss": 4.639303684234619, + "load_loss": 0.15351024270057678, + "step": 9 + }, + { + "loss": 4.450356483459473, + "ce_loss": 4.4485321044921875, + "load_loss": 0.1824168562889099, + "step": 9 + }, + { + "loss": 4.434298992156982, + "ce_loss": 4.432903289794922, + "load_loss": 0.13955168426036835, + "step": 9 + }, + { + "loss": 4.464273452758789, + "ce_loss": 4.462723255157471, + "load_loss": 0.15503062307834625, + "step": 9 + }, + { + "loss": 4.8900604248046875, + "ce_loss": 4.8884782791137695, + "load_loss": 0.15821734070777893, + "step": 9 + }, + { + "loss": 4.628287315368652, + "ce_loss": 4.626498699188232, + "load_loss": 0.17884045839309692, + "step": 9 + }, + { + "loss": 4.505551338195801, + "ce_loss": 4.503793239593506, + "load_loss": 0.1758274883031845, + "step": 9 + }, + { + "loss": 4.464161396026611, + "ce_loss": 4.4626264572143555, + "load_loss": 0.153512641787529, + "step": 9 + }, + { + "loss": 4.394668102264404, + "ce_loss": 4.393124103546143, + "load_loss": 0.1544121354818344, + "step": 9 + }, + { + "loss": 4.676578521728516, + "ce_loss": 4.675145149230957, + "load_loss": 0.14332769811153412, + "step": 9 + }, + { + "loss": 4.5243988037109375, + "ce_loss": 4.523135662078857, + "load_loss": 0.1263241022825241, + "step": 9 + }, + { + "loss": 4.402472019195557, + "ce_loss": 4.400691509246826, + "load_loss": 0.17803719639778137, + "step": 9 + }, + { + "loss": 4.9150590896606445, + "ce_loss": 4.913350582122803, + "load_loss": 0.17085565626621246, + "step": 9 + }, + { + "loss": 4.672189235687256, + "ce_loss": 4.670803070068359, + "load_loss": 0.1386244297027588, + "step": 9 + }, + { + "loss": 4.837491989135742, + "ce_loss": 4.836182594299316, + "load_loss": 0.130935937166214, + "step": 9 + }, + { + "loss": 4.388063430786133, + "ce_loss": 4.386332035064697, + "load_loss": 0.17315535247325897, + "step": 9 + }, + { + "loss": 4.473698139190674, + "ce_loss": 4.47178840637207, + "load_loss": 0.19099287688732147, + "step": 9 + }, + { + "loss": 4.421807765960693, + "ce_loss": 4.420523166656494, + "load_loss": 0.1284390091896057, + "step": 9 + }, + { + "loss": 4.934109210968018, + "ce_loss": 4.932440757751465, + "load_loss": 0.16686230897903442, + "step": 9 + }, + { + "loss": 4.4393086433410645, + "ce_loss": 4.437413215637207, + "load_loss": 0.18954238295555115, + "step": 9 + }, + { + "loss": 4.443741321563721, + "ce_loss": 4.4422078132629395, + "load_loss": 0.153350830078125, + "step": 9 + }, + { + "loss": 4.788259506225586, + "ce_loss": 4.786574840545654, + "load_loss": 0.16847506165504456, + "step": 9 + }, + { + "loss": 4.6719465255737305, + "ce_loss": 4.6700053215026855, + "load_loss": 0.19412551820278168, + "step": 9 + }, + { + "loss": 4.471473217010498, + "ce_loss": 4.469878673553467, + "load_loss": 0.1594768464565277, + "step": 9 + }, + { + "loss": 4.964576721191406, + "ce_loss": 4.963138580322266, + "load_loss": 0.14380449056625366, + "step": 9 + }, + { + "loss": 4.371495246887207, + "ce_loss": 4.369926929473877, + "load_loss": 0.15685304999351501, + "step": 9 + }, + { + "loss": 4.369771480560303, + "ce_loss": 4.367923736572266, + "load_loss": 0.1847519874572754, + "step": 9 + }, + { + "loss": 4.545703411102295, + "ce_loss": 4.543589115142822, + "load_loss": 0.2114374190568924, + "step": 9 + }, + { + "loss": 4.550317287445068, + "ce_loss": 4.548335552215576, + "load_loss": 0.19816674292087555, + "step": 9 + }, + { + "loss": 4.494417190551758, + "ce_loss": 4.492530822753906, + "load_loss": 0.18861563503742218, + "step": 9 + }, + { + "loss": 4.377195358276367, + "ce_loss": 4.37551736831665, + "load_loss": 0.1677933633327484, + "step": 9 + }, + { + "loss": 4.555685520172119, + "ce_loss": 4.554121017456055, + "load_loss": 0.1564413458108902, + "step": 9 + }, + { + "loss": 4.996828556060791, + "ce_loss": 4.995198726654053, + "load_loss": 0.1629704236984253, + "step": 9 + }, + { + "loss": 4.478908061981201, + "ce_loss": 4.477023124694824, + "load_loss": 0.18850791454315186, + "step": 9 + }, + { + "loss": 4.400085926055908, + "ce_loss": 4.398821830749512, + "load_loss": 0.1264050006866455, + "step": 9 + }, + { + "loss": 4.467526435852051, + "ce_loss": 4.465628623962402, + "load_loss": 0.1897989809513092, + "step": 9 + }, + { + "loss": 4.462507724761963, + "ce_loss": 4.460812091827393, + "load_loss": 0.1695406436920166, + "step": 9 + }, + { + "loss": 4.712759017944336, + "ce_loss": 4.711030006408691, + "load_loss": 0.1728963702917099, + "step": 9 + }, + { + "loss": 4.67330265045166, + "ce_loss": 4.671687126159668, + "load_loss": 0.16154339909553528, + "step": 9 + }, + { + "loss": 4.411342144012451, + "ce_loss": 4.40984582901001, + "load_loss": 0.14963991940021515, + "step": 9 + }, + { + "loss": 4.517206192016602, + "ce_loss": 4.515612602233887, + "load_loss": 0.15933752059936523, + "step": 9 + }, + { + "loss": 4.443175792694092, + "ce_loss": 4.4415717124938965, + "load_loss": 0.1603906750679016, + "step": 9 + }, + { + "loss": 4.687338352203369, + "ce_loss": 4.68583345413208, + "load_loss": 0.15049391984939575, + "step": 9 + }, + { + "loss": 4.404651165008545, + "ce_loss": 4.402957916259766, + "load_loss": 0.16930989921092987, + "step": 9 + }, + { + "loss": 4.509786605834961, + "ce_loss": 4.507684230804443, + "load_loss": 0.21022149920463562, + "step": 9 + }, + { + "loss": 4.446996688842773, + "ce_loss": 4.445230960845947, + "load_loss": 0.17656806111335754, + "step": 9 + }, + { + "loss": 4.4092254638671875, + "ce_loss": 4.40719747543335, + "load_loss": 0.2028159350156784, + "step": 9 + }, + { + "loss": 4.685594081878662, + "ce_loss": 4.683963775634766, + "load_loss": 0.1630139797925949, + "step": 9 + }, + { + "loss": 4.44552755355835, + "ce_loss": 4.443485260009766, + "load_loss": 0.20422810316085815, + "step": 9 + }, + { + "loss": 4.742377281188965, + "ce_loss": 4.740766525268555, + "load_loss": 0.16105224192142487, + "step": 9 + }, + { + "loss": 4.5370259284973145, + "ce_loss": 4.535283088684082, + "load_loss": 0.1743013709783554, + "step": 9 + }, + { + "loss": 4.555706977844238, + "ce_loss": 4.553968906402588, + "load_loss": 0.17378820478916168, + "step": 9 + }, + { + "loss": 4.653775215148926, + "ce_loss": 4.652195930480957, + "load_loss": 0.1579492837190628, + "step": 9 + }, + { + "loss": 4.416654109954834, + "ce_loss": 4.414700984954834, + "load_loss": 0.19533617794513702, + "step": 9 + }, + { + "loss": 4.535888671875, + "ce_loss": 4.534047603607178, + "load_loss": 0.1841220110654831, + "step": 9 + }, + { + "loss": 4.397876262664795, + "ce_loss": 4.396320819854736, + "load_loss": 0.15555813908576965, + "step": 9 + }, + { + "loss": 4.384604454040527, + "ce_loss": 4.38322639465332, + "load_loss": 0.13780489563941956, + "step": 9 + }, + { + "loss": 4.611122131347656, + "ce_loss": 4.609568119049072, + "load_loss": 0.15538102388381958, + "step": 9 + }, + { + "loss": 4.436176776885986, + "ce_loss": 4.434381484985352, + "load_loss": 0.17955181002616882, + "step": 9 + }, + { + "loss": 4.740777969360352, + "ce_loss": 4.73900842666626, + "load_loss": 0.17693090438842773, + "step": 9 + }, + { + "loss": 4.800822734832764, + "ce_loss": 4.799191474914551, + "load_loss": 0.16311882436275482, + "step": 9 + }, + { + "loss": 4.341202735900879, + "ce_loss": 4.339548587799072, + "load_loss": 0.16541802883148193, + "step": 9 + }, + { + "loss": 4.425372123718262, + "ce_loss": 4.423474311828613, + "load_loss": 0.1897774338722229, + "step": 9 + }, + { + "loss": 4.386414051055908, + "ce_loss": 4.384555816650391, + "load_loss": 0.18580946326255798, + "step": 9 + }, + { + "loss": 4.845292568206787, + "ce_loss": 4.843847274780273, + "load_loss": 0.1445436179637909, + "step": 9 + }, + { + "loss": 4.429476737976074, + "ce_loss": 4.4276347160339355, + "load_loss": 0.1841861605644226, + "step": 9 + }, + { + "loss": 4.636216163635254, + "ce_loss": 4.634779453277588, + "load_loss": 0.14368338882923126, + "step": 9 + }, + { + "loss": 4.482416152954102, + "ce_loss": 4.480520248413086, + "load_loss": 0.18956968188285828, + "step": 9 + }, + { + "loss": 4.5338969230651855, + "ce_loss": 4.532465934753418, + "load_loss": 0.1430806964635849, + "step": 9 + }, + { + "loss": 4.515044212341309, + "ce_loss": 4.512965202331543, + "load_loss": 0.20791509747505188, + "step": 9 + }, + { + "loss": 4.3504958152771, + "ce_loss": 4.349167823791504, + "load_loss": 0.1328119933605194, + "step": 9 + }, + { + "loss": 4.397106647491455, + "ce_loss": 4.395364761352539, + "load_loss": 0.17418745160102844, + "step": 9 + }, + { + "loss": 4.463773727416992, + "ce_loss": 4.462365627288818, + "load_loss": 0.14082743227481842, + "step": 9 + }, + { + "loss": 4.390902996063232, + "ce_loss": 4.389556407928467, + "load_loss": 0.13466458022594452, + "step": 9 + }, + { + "loss": 4.696567535400391, + "ce_loss": 4.695411205291748, + "load_loss": 0.11562217026948929, + "step": 9 + }, + { + "loss": 4.466492176055908, + "ce_loss": 4.464819431304932, + "load_loss": 0.1672610640525818, + "step": 9 + }, + { + "loss": 4.651327610015869, + "ce_loss": 4.649980068206787, + "load_loss": 0.13474547863006592, + "step": 9 + }, + { + "loss": 4.756494998931885, + "ce_loss": 4.754746913909912, + "load_loss": 0.17482890188694, + "step": 9 + }, + { + "loss": 4.426702499389648, + "ce_loss": 4.424997329711914, + "load_loss": 0.17052581906318665, + "step": 9 + }, + { + "loss": 4.51123571395874, + "ce_loss": 4.509498119354248, + "load_loss": 0.17376235127449036, + "step": 9 + }, + { + "loss": 4.395541667938232, + "ce_loss": 4.393534183502197, + "load_loss": 0.20072877407073975, + "step": 9 + }, + { + "loss": 4.393453598022461, + "ce_loss": 4.391932487487793, + "load_loss": 0.15210668742656708, + "step": 9 + }, + { + "loss": 4.43089485168457, + "ce_loss": 4.429052829742432, + "load_loss": 0.1841813623905182, + "step": 9 + }, + { + "loss": 4.4771246910095215, + "ce_loss": 4.4754815101623535, + "load_loss": 0.164295956492424, + "step": 9 + }, + { + "loss": 4.7996087074279785, + "ce_loss": 4.79814338684082, + "load_loss": 0.14651541411876678, + "step": 9 + }, + { + "loss": 4.483159065246582, + "ce_loss": 4.4810967445373535, + "load_loss": 0.20622815191745758, + "step": 9 + }, + { + "loss": 4.47341775894165, + "ce_loss": 4.47174596786499, + "load_loss": 0.16718733310699463, + "step": 9 + }, + { + "loss": 4.510718822479248, + "ce_loss": 4.5088934898376465, + "load_loss": 0.1825370192527771, + "step": 9 + }, + { + "loss": 4.440892696380615, + "ce_loss": 4.4392523765563965, + "load_loss": 0.16401351988315582, + "step": 9 + }, + { + "loss": 4.623330116271973, + "ce_loss": 4.621463298797607, + "load_loss": 0.18666872382164001, + "step": 9 + }, + { + "loss": 4.565524101257324, + "ce_loss": 4.563933372497559, + "load_loss": 0.15909577906131744, + "step": 9 + }, + { + "loss": 4.4294633865356445, + "ce_loss": 4.427814960479736, + "load_loss": 0.16485413908958435, + "step": 9 + }, + { + "loss": 4.41305685043335, + "ce_loss": 4.411428451538086, + "load_loss": 0.1628272831439972, + "step": 9 + }, + { + "loss": 4.416673183441162, + "ce_loss": 4.4151291847229, + "load_loss": 0.15441596508026123, + "step": 9 + }, + { + "loss": 4.691522598266602, + "ce_loss": 4.689863204956055, + "load_loss": 0.16594797372817993, + "step": 9 + }, + { + "loss": 4.346898555755615, + "ce_loss": 4.345126152038574, + "load_loss": 0.17726072669029236, + "step": 9 + }, + { + "loss": 4.410984992980957, + "ce_loss": 4.409241676330566, + "load_loss": 0.1743391752243042, + "step": 9 + }, + { + "loss": 4.902798175811768, + "ce_loss": 4.901369571685791, + "load_loss": 0.14284421503543854, + "step": 9 + }, + { + "loss": 4.514629364013672, + "ce_loss": 4.512499809265137, + "load_loss": 0.21295300126075745, + "step": 9 + }, + { + "loss": 4.4243268966674805, + "ce_loss": 4.42225456237793, + "load_loss": 0.20721715688705444, + "step": 9 + }, + { + "loss": 4.592822074890137, + "ce_loss": 4.5908098220825195, + "load_loss": 0.20121322572231293, + "step": 9 + }, + { + "loss": 4.65581750869751, + "ce_loss": 4.654210090637207, + "load_loss": 0.16076359152793884, + "step": 9 + }, + { + "loss": 4.522003173828125, + "ce_loss": 4.5203776359558105, + "load_loss": 0.16255921125411987, + "step": 10 + }, + { + "loss": 4.337252140045166, + "ce_loss": 4.3357744216918945, + "load_loss": 0.1477562040090561, + "step": 10 + }, + { + "loss": 4.478119373321533, + "ce_loss": 4.476452827453613, + "load_loss": 0.16663970053195953, + "step": 10 + }, + { + "loss": 4.343516826629639, + "ce_loss": 4.342116355895996, + "load_loss": 0.1400303840637207, + "step": 10 + }, + { + "loss": 4.5872650146484375, + "ce_loss": 4.58594274520874, + "load_loss": 0.13221457600593567, + "step": 10 + }, + { + "loss": 4.4486002922058105, + "ce_loss": 4.446689128875732, + "load_loss": 0.19112499058246613, + "step": 10 + }, + { + "loss": 4.334053993225098, + "ce_loss": 4.332498073577881, + "load_loss": 0.1556079387664795, + "step": 10 + }, + { + "loss": 5.090190410614014, + "ce_loss": 5.0884013175964355, + "load_loss": 0.17890891432762146, + "step": 10 + }, + { + "loss": 4.468631267547607, + "ce_loss": 4.466922760009766, + "load_loss": 0.17083027958869934, + "step": 10 + }, + { + "loss": 4.54462194442749, + "ce_loss": 4.542961120605469, + "load_loss": 0.1661049872636795, + "step": 10 + }, + { + "loss": 4.653275489807129, + "ce_loss": 4.6511688232421875, + "load_loss": 0.2106676548719406, + "step": 10 + }, + { + "loss": 4.545570373535156, + "ce_loss": 4.543698787689209, + "load_loss": 0.18716657161712646, + "step": 10 + }, + { + "loss": 4.422323226928711, + "ce_loss": 4.420559406280518, + "load_loss": 0.17636746168136597, + "step": 10 + }, + { + "loss": 4.5021538734436035, + "ce_loss": 4.5005083084106445, + "load_loss": 0.16456881165504456, + "step": 10 + }, + { + "loss": 4.401285648345947, + "ce_loss": 4.399391174316406, + "load_loss": 0.18944378197193146, + "step": 10 + }, + { + "loss": 4.411815643310547, + "ce_loss": 4.409893035888672, + "load_loss": 0.192237988114357, + "step": 10 + }, + { + "loss": 4.417019367218018, + "ce_loss": 4.415287017822266, + "load_loss": 0.17321233451366425, + "step": 10 + }, + { + "loss": 4.303189277648926, + "ce_loss": 4.301307678222656, + "load_loss": 0.1881742626428604, + "step": 10 + }, + { + "loss": 4.292294979095459, + "ce_loss": 4.290518760681152, + "load_loss": 0.17760252952575684, + "step": 10 + }, + { + "loss": 4.564502239227295, + "ce_loss": 4.562849521636963, + "load_loss": 0.1652500182390213, + "step": 10 + }, + { + "loss": 4.367251873016357, + "ce_loss": 4.365828990936279, + "load_loss": 0.14228269457817078, + "step": 10 + }, + { + "loss": 4.353029251098633, + "ce_loss": 4.351443767547607, + "load_loss": 0.15856777131557465, + "step": 10 + }, + { + "loss": 5.161331653594971, + "ce_loss": 5.159909725189209, + "load_loss": 0.1421874314546585, + "step": 10 + }, + { + "loss": 4.380423545837402, + "ce_loss": 4.379131317138672, + "load_loss": 0.1292116343975067, + "step": 10 + }, + { + "loss": 5.1947340965271, + "ce_loss": 5.192930221557617, + "load_loss": 0.18037280440330505, + "step": 10 + }, + { + "loss": 4.472927570343018, + "ce_loss": 4.471369743347168, + "load_loss": 0.15576638281345367, + "step": 10 + }, + { + "loss": 4.601015090942383, + "ce_loss": 4.599339008331299, + "load_loss": 0.16761577129364014, + "step": 10 + }, + { + "loss": 4.343294143676758, + "ce_loss": 4.341591835021973, + "load_loss": 0.17022375762462616, + "step": 10 + }, + { + "loss": 4.38454532623291, + "ce_loss": 4.383020877838135, + "load_loss": 0.15246476233005524, + "step": 10 + }, + { + "loss": 4.456377983093262, + "ce_loss": 4.4548234939575195, + "load_loss": 0.1554269790649414, + "step": 10 + }, + { + "loss": 4.436436653137207, + "ce_loss": 4.43495512008667, + "load_loss": 0.14813390374183655, + "step": 10 + }, + { + "loss": 4.50187873840332, + "ce_loss": 4.500225067138672, + "load_loss": 0.16535964608192444, + "step": 10 + }, + { + "loss": 4.515215873718262, + "ce_loss": 4.513073921203613, + "load_loss": 0.21421727538108826, + "step": 10 + }, + { + "loss": 4.649897575378418, + "ce_loss": 4.648240566253662, + "load_loss": 0.16570095717906952, + "step": 10 + }, + { + "loss": 4.337067127227783, + "ce_loss": 4.3357110023498535, + "load_loss": 0.13561145961284637, + "step": 10 + }, + { + "loss": 4.4227142333984375, + "ce_loss": 4.4210309982299805, + "load_loss": 0.16830894351005554, + "step": 10 + }, + { + "loss": 4.25950288772583, + "ce_loss": 4.257874488830566, + "load_loss": 0.1628316044807434, + "step": 10 + }, + { + "loss": 4.386429309844971, + "ce_loss": 4.3847336769104, + "load_loss": 0.16957417130470276, + "step": 10 + }, + { + "loss": 4.7797770500183105, + "ce_loss": 4.778041362762451, + "load_loss": 0.173567533493042, + "step": 10 + }, + { + "loss": 4.3778581619262695, + "ce_loss": 4.376332759857178, + "load_loss": 0.1525394320487976, + "step": 10 + }, + { + "loss": 4.65309476852417, + "ce_loss": 4.651680946350098, + "load_loss": 0.14140379428863525, + "step": 10 + }, + { + "loss": 4.35516357421875, + "ce_loss": 4.353191375732422, + "load_loss": 0.19723519682884216, + "step": 10 + }, + { + "loss": 4.280926704406738, + "ce_loss": 4.27956485748291, + "load_loss": 0.1361681967973709, + "step": 10 + }, + { + "loss": 4.57785701751709, + "ce_loss": 4.5761637687683105, + "load_loss": 0.1693386435508728, + "step": 10 + }, + { + "loss": 4.4349188804626465, + "ce_loss": 4.433090686798096, + "load_loss": 0.18283286690711975, + "step": 10 + }, + { + "loss": 4.365965366363525, + "ce_loss": 4.364137649536133, + "load_loss": 0.18275435268878937, + "step": 10 + }, + { + "loss": 4.85269832611084, + "ce_loss": 4.851057052612305, + "load_loss": 0.16412265598773956, + "step": 10 + }, + { + "loss": 4.398861885070801, + "ce_loss": 4.397269248962402, + "load_loss": 0.15928439795970917, + "step": 10 + }, + { + "loss": 4.416820526123047, + "ce_loss": 4.41493558883667, + "load_loss": 0.188495934009552, + "step": 10 + }, + { + "loss": 4.307016372680664, + "ce_loss": 4.305228233337402, + "load_loss": 0.17880216240882874, + "step": 10 + }, + { + "loss": 4.417165279388428, + "ce_loss": 4.415377616882324, + "load_loss": 0.17878922820091248, + "step": 10 + }, + { + "loss": 4.947488784790039, + "ce_loss": 4.946112155914307, + "load_loss": 0.13766510784626007, + "step": 10 + }, + { + "loss": 4.69696569442749, + "ce_loss": 4.695470809936523, + "load_loss": 0.14948433637619019, + "step": 10 + }, + { + "loss": 4.3391900062561035, + "ce_loss": 4.337735176086426, + "load_loss": 0.145499587059021, + "step": 10 + }, + { + "loss": 4.3508734703063965, + "ce_loss": 4.3491740226745605, + "load_loss": 0.1699293702840805, + "step": 10 + }, + { + "loss": 4.551959991455078, + "ce_loss": 4.5501861572265625, + "load_loss": 0.17739953100681305, + "step": 10 + }, + { + "loss": 4.447351932525635, + "ce_loss": 4.44560432434082, + "load_loss": 0.17478008568286896, + "step": 10 + }, + { + "loss": 4.403700828552246, + "ce_loss": 4.402166366577148, + "load_loss": 0.1534341275691986, + "step": 10 + }, + { + "loss": 4.526284217834473, + "ce_loss": 4.524669647216797, + "load_loss": 0.1614452749490738, + "step": 10 + }, + { + "loss": 4.765143871307373, + "ce_loss": 4.763570785522461, + "load_loss": 0.15732839703559875, + "step": 10 + }, + { + "loss": 4.615752696990967, + "ce_loss": 4.613851070404053, + "load_loss": 0.1901618242263794, + "step": 10 + }, + { + "loss": 4.282208442687988, + "ce_loss": 4.280725955963135, + "load_loss": 0.1482262909412384, + "step": 10 + } +] \ No newline at end of file