diff --git "a/model/trainer_state.json" "b/model/trainer_state.json" new file mode 100644--- /dev/null +++ "b/model/trainer_state.json" @@ -0,0 +1,39882 @@ +{ + "best_global_step": null, + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.4999799269340399, + "eval_steps": 500, + "global_step": 49816, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.00010036532980047372, + "learning_rate": 0.00019998193424063592, + "loss": 1.5103, + "mean_token_accuracy": 0.633021330833435, + "num_tokens": 33810.0, + "step": 10 + }, + { + "epoch": 0.00020073065960094744, + "learning_rate": 0.00019996186117467583, + "loss": 1.2727, + "mean_token_accuracy": 0.677767938375473, + "num_tokens": 68079.0, + "step": 20 + }, + { + "epoch": 0.0003010959894014212, + "learning_rate": 0.00019994178810871574, + "loss": 1.1203, + "mean_token_accuracy": 0.7041535198688507, + "num_tokens": 102274.0, + "step": 30 + }, + { + "epoch": 0.0004014613192018949, + "learning_rate": 0.00019992171504275562, + "loss": 1.0614, + "mean_token_accuracy": 0.7179206430912017, + "num_tokens": 135784.0, + "step": 40 + }, + { + "epoch": 0.0005018266490023686, + "learning_rate": 0.00019990164197679556, + "loss": 1.0812, + "mean_token_accuracy": 0.7120111465454102, + "num_tokens": 169612.0, + "step": 50 + }, + { + "epoch": 0.0006021919788028423, + "learning_rate": 0.00019988156891083544, + "loss": 1.0127, + "mean_token_accuracy": 0.7204696774482727, + "num_tokens": 203734.0, + "step": 60 + }, + { + "epoch": 0.0007025573086033161, + "learning_rate": 0.00019986149584487535, + "loss": 0.9832, + "mean_token_accuracy": 0.7345041453838348, + "num_tokens": 237931.0, + "step": 70 + }, + { + "epoch": 0.0008029226384037898, + "learning_rate": 0.00019984142277891526, + "loss": 0.9677, + "mean_token_accuracy": 0.7350185573101043, + "num_tokens": 272629.0, + "step": 80 + }, + { + "epoch": 0.0009032879682042635, + "learning_rate": 0.00019982134971295516, + "loss": 0.997, + "mean_token_accuracy": 0.7259666502475739, + "num_tokens": 306161.0, + "step": 90 + }, + { + "epoch": 0.0010036532980047372, + "learning_rate": 0.00019980127664699507, + "loss": 1.0068, + "mean_token_accuracy": 0.7253551065921784, + "num_tokens": 339884.0, + "step": 100 + }, + { + "epoch": 0.001104018627805211, + "learning_rate": 0.00019978120358103498, + "loss": 0.9897, + "mean_token_accuracy": 0.7253098130226135, + "num_tokens": 373256.0, + "step": 110 + }, + { + "epoch": 0.0012043839576056847, + "learning_rate": 0.0001997611305150749, + "loss": 0.9673, + "mean_token_accuracy": 0.729346650838852, + "num_tokens": 407123.0, + "step": 120 + }, + { + "epoch": 0.0013047492874061583, + "learning_rate": 0.00019974105744911477, + "loss": 0.9385, + "mean_token_accuracy": 0.7343133509159088, + "num_tokens": 441186.0, + "step": 130 + }, + { + "epoch": 0.0014051146172066322, + "learning_rate": 0.0001997209843831547, + "loss": 0.9334, + "mean_token_accuracy": 0.7334938704967499, + "num_tokens": 476076.0, + "step": 140 + }, + { + "epoch": 0.0015054799470071059, + "learning_rate": 0.0001997009113171946, + "loss": 0.9647, + "mean_token_accuracy": 0.7314290404319763, + "num_tokens": 510012.0, + "step": 150 + }, + { + "epoch": 0.0016058452768075795, + "learning_rate": 0.0001996808382512345, + "loss": 0.9372, + "mean_token_accuracy": 0.7441855669021606, + "num_tokens": 543926.0, + "step": 160 + }, + { + "epoch": 0.0017062106066080534, + "learning_rate": 0.0001996607651852744, + "loss": 0.9317, + "mean_token_accuracy": 0.7420060276985169, + "num_tokens": 577963.0, + "step": 170 + }, + { + "epoch": 0.001806575936408527, + "learning_rate": 0.00019964069211931431, + "loss": 0.9181, + "mean_token_accuracy": 0.7427789747714997, + "num_tokens": 611919.0, + "step": 180 + }, + { + "epoch": 0.0019069412662090007, + "learning_rate": 0.00019962061905335422, + "loss": 0.9343, + "mean_token_accuracy": 0.7363346517086029, + "num_tokens": 645919.0, + "step": 190 + }, + { + "epoch": 0.0020073065960094743, + "learning_rate": 0.00019960054598739413, + "loss": 0.9205, + "mean_token_accuracy": 0.7433876693248749, + "num_tokens": 679456.0, + "step": 200 + }, + { + "epoch": 0.002107671925809948, + "learning_rate": 0.000199580472921434, + "loss": 0.8805, + "mean_token_accuracy": 0.7510487496852875, + "num_tokens": 713397.0, + "step": 210 + }, + { + "epoch": 0.002208037255610422, + "learning_rate": 0.00019956039985547395, + "loss": 0.9355, + "mean_token_accuracy": 0.7372931838035583, + "num_tokens": 746693.0, + "step": 220 + }, + { + "epoch": 0.0023084025854108957, + "learning_rate": 0.00019954032678951386, + "loss": 0.9282, + "mean_token_accuracy": 0.7390501201152802, + "num_tokens": 780480.0, + "step": 230 + }, + { + "epoch": 0.0024087679152113694, + "learning_rate": 0.00019952025372355374, + "loss": 0.8976, + "mean_token_accuracy": 0.7474514424800873, + "num_tokens": 814570.0, + "step": 240 + }, + { + "epoch": 0.002509133245011843, + "learning_rate": 0.00019950018065759367, + "loss": 0.9076, + "mean_token_accuracy": 0.7378260135650635, + "num_tokens": 848776.0, + "step": 250 + }, + { + "epoch": 0.0026094985748123167, + "learning_rate": 0.00019948010759163355, + "loss": 0.9324, + "mean_token_accuracy": 0.7361941576004029, + "num_tokens": 881643.0, + "step": 260 + }, + { + "epoch": 0.0027098639046127903, + "learning_rate": 0.00019946003452567346, + "loss": 0.9155, + "mean_token_accuracy": 0.7408255219459534, + "num_tokens": 915814.0, + "step": 270 + }, + { + "epoch": 0.0028102292344132644, + "learning_rate": 0.00019943996145971337, + "loss": 0.8939, + "mean_token_accuracy": 0.7481561243534088, + "num_tokens": 950660.0, + "step": 280 + }, + { + "epoch": 0.002910594564213738, + "learning_rate": 0.00019941988839375328, + "loss": 0.9425, + "mean_token_accuracy": 0.735199373960495, + "num_tokens": 984112.0, + "step": 290 + }, + { + "epoch": 0.0030109598940142117, + "learning_rate": 0.00019939981532779316, + "loss": 0.899, + "mean_token_accuracy": 0.743339866399765, + "num_tokens": 1018221.0, + "step": 300 + }, + { + "epoch": 0.0031113252238146854, + "learning_rate": 0.0001993797422618331, + "loss": 0.9045, + "mean_token_accuracy": 0.7475386559963226, + "num_tokens": 1051883.0, + "step": 310 + }, + { + "epoch": 0.003211690553615159, + "learning_rate": 0.00019935966919587298, + "loss": 0.9073, + "mean_token_accuracy": 0.7443807065486908, + "num_tokens": 1086327.0, + "step": 320 + }, + { + "epoch": 0.0033120558834156327, + "learning_rate": 0.00019933959612991289, + "loss": 0.9139, + "mean_token_accuracy": 0.7400292158126831, + "num_tokens": 1120924.0, + "step": 330 + }, + { + "epoch": 0.0034124212132161068, + "learning_rate": 0.0001993195230639528, + "loss": 0.8737, + "mean_token_accuracy": 0.7494464218616486, + "num_tokens": 1154916.0, + "step": 340 + }, + { + "epoch": 0.0035127865430165804, + "learning_rate": 0.0001992994499979927, + "loss": 0.8745, + "mean_token_accuracy": 0.7504120409488678, + "num_tokens": 1189348.0, + "step": 350 + }, + { + "epoch": 0.003613151872817054, + "learning_rate": 0.0001992793769320326, + "loss": 0.9187, + "mean_token_accuracy": 0.7410196900367737, + "num_tokens": 1223853.0, + "step": 360 + }, + { + "epoch": 0.0037135172026175277, + "learning_rate": 0.00019925930386607252, + "loss": 0.8834, + "mean_token_accuracy": 0.749067735671997, + "num_tokens": 1257683.0, + "step": 370 + }, + { + "epoch": 0.0038138825324180014, + "learning_rate": 0.00019923923080011243, + "loss": 0.8981, + "mean_token_accuracy": 0.7470409989356994, + "num_tokens": 1292294.0, + "step": 380 + }, + { + "epoch": 0.0039142478622184755, + "learning_rate": 0.0001992191577341523, + "loss": 0.9096, + "mean_token_accuracy": 0.7398540675640106, + "num_tokens": 1326683.0, + "step": 390 + }, + { + "epoch": 0.004014613192018949, + "learning_rate": 0.00019919908466819225, + "loss": 0.8964, + "mean_token_accuracy": 0.7491674959659577, + "num_tokens": 1360379.0, + "step": 400 + }, + { + "epoch": 0.004114978521819423, + "learning_rate": 0.00019917901160223213, + "loss": 0.8677, + "mean_token_accuracy": 0.7554733157157898, + "num_tokens": 1394724.0, + "step": 410 + }, + { + "epoch": 0.004215343851619896, + "learning_rate": 0.00019915893853627203, + "loss": 0.894, + "mean_token_accuracy": 0.7477222561836243, + "num_tokens": 1429795.0, + "step": 420 + }, + { + "epoch": 0.00431570918142037, + "learning_rate": 0.00019913886547031194, + "loss": 0.8876, + "mean_token_accuracy": 0.747435849905014, + "num_tokens": 1463279.0, + "step": 430 + }, + { + "epoch": 0.004416074511220844, + "learning_rate": 0.00019911879240435185, + "loss": 0.9133, + "mean_token_accuracy": 0.7419423460960388, + "num_tokens": 1497656.0, + "step": 440 + }, + { + "epoch": 0.004516439841021317, + "learning_rate": 0.00019909871933839176, + "loss": 0.9105, + "mean_token_accuracy": 0.7445949018001556, + "num_tokens": 1531438.0, + "step": 450 + }, + { + "epoch": 0.0046168051708217915, + "learning_rate": 0.00019907864627243167, + "loss": 0.9147, + "mean_token_accuracy": 0.7372195899486542, + "num_tokens": 1564860.0, + "step": 460 + }, + { + "epoch": 0.004717170500622265, + "learning_rate": 0.00019905857320647158, + "loss": 0.8822, + "mean_token_accuracy": 0.7499520599842071, + "num_tokens": 1598515.0, + "step": 470 + }, + { + "epoch": 0.004817535830422739, + "learning_rate": 0.00019903850014051146, + "loss": 0.886, + "mean_token_accuracy": 0.7500568509101868, + "num_tokens": 1632684.0, + "step": 480 + }, + { + "epoch": 0.004917901160223213, + "learning_rate": 0.0001990184270745514, + "loss": 0.8615, + "mean_token_accuracy": 0.7524400293827057, + "num_tokens": 1666653.0, + "step": 490 + }, + { + "epoch": 0.005018266490023686, + "learning_rate": 0.00019899835400859128, + "loss": 0.8954, + "mean_token_accuracy": 0.7409865975379943, + "num_tokens": 1700533.0, + "step": 500 + }, + { + "epoch": 0.00511863181982416, + "learning_rate": 0.00019897828094263118, + "loss": 0.932, + "mean_token_accuracy": 0.7376771807670593, + "num_tokens": 1734093.0, + "step": 510 + }, + { + "epoch": 0.005218997149624633, + "learning_rate": 0.0001989582078766711, + "loss": 0.8562, + "mean_token_accuracy": 0.7520005285739899, + "num_tokens": 1767804.0, + "step": 520 + }, + { + "epoch": 0.0053193624794251075, + "learning_rate": 0.000198938134810711, + "loss": 0.8675, + "mean_token_accuracy": 0.7533258378505707, + "num_tokens": 1801441.0, + "step": 530 + }, + { + "epoch": 0.005419727809225581, + "learning_rate": 0.00019891806174475088, + "loss": 0.8802, + "mean_token_accuracy": 0.752521938085556, + "num_tokens": 1835240.0, + "step": 540 + }, + { + "epoch": 0.005520093139026055, + "learning_rate": 0.00019889798867879082, + "loss": 0.8772, + "mean_token_accuracy": 0.7515844464302063, + "num_tokens": 1868712.0, + "step": 550 + }, + { + "epoch": 0.005620458468826529, + "learning_rate": 0.0001988779156128307, + "loss": 0.8726, + "mean_token_accuracy": 0.7543687939643859, + "num_tokens": 1902913.0, + "step": 560 + }, + { + "epoch": 0.005720823798627002, + "learning_rate": 0.0001988578425468706, + "loss": 0.8543, + "mean_token_accuracy": 0.7525355458259583, + "num_tokens": 1936217.0, + "step": 570 + }, + { + "epoch": 0.005821189128427476, + "learning_rate": 0.00019883776948091054, + "loss": 0.9133, + "mean_token_accuracy": 0.7481994688510895, + "num_tokens": 1969679.0, + "step": 580 + }, + { + "epoch": 0.005921554458227949, + "learning_rate": 0.00019881769641495042, + "loss": 0.8996, + "mean_token_accuracy": 0.7466781139373779, + "num_tokens": 2003835.0, + "step": 590 + }, + { + "epoch": 0.0060219197880284235, + "learning_rate": 0.00019879762334899033, + "loss": 0.9024, + "mean_token_accuracy": 0.7528743803501129, + "num_tokens": 2037954.0, + "step": 600 + }, + { + "epoch": 0.0061222851178288976, + "learning_rate": 0.00019877755028303024, + "loss": 0.9052, + "mean_token_accuracy": 0.7427110850811005, + "num_tokens": 2072301.0, + "step": 610 + }, + { + "epoch": 0.006222650447629371, + "learning_rate": 0.00019875747721707015, + "loss": 0.886, + "mean_token_accuracy": 0.7461163103580475, + "num_tokens": 2106896.0, + "step": 620 + }, + { + "epoch": 0.006323015777429845, + "learning_rate": 0.00019873740415111003, + "loss": 0.9005, + "mean_token_accuracy": 0.7445556104183197, + "num_tokens": 2140725.0, + "step": 630 + }, + { + "epoch": 0.006423381107230318, + "learning_rate": 0.00019871733108514997, + "loss": 0.8882, + "mean_token_accuracy": 0.7516779065132141, + "num_tokens": 2175119.0, + "step": 640 + }, + { + "epoch": 0.006523746437030792, + "learning_rate": 0.00019869725801918985, + "loss": 0.9102, + "mean_token_accuracy": 0.7461168050765992, + "num_tokens": 2209647.0, + "step": 650 + }, + { + "epoch": 0.006624111766831265, + "learning_rate": 0.00019867718495322976, + "loss": 0.8439, + "mean_token_accuracy": 0.756019902229309, + "num_tokens": 2243954.0, + "step": 660 + }, + { + "epoch": 0.0067244770966317395, + "learning_rate": 0.00019865711188726966, + "loss": 0.8892, + "mean_token_accuracy": 0.7439179301261902, + "num_tokens": 2278114.0, + "step": 670 + }, + { + "epoch": 0.0068248424264322136, + "learning_rate": 0.00019863703882130957, + "loss": 0.9091, + "mean_token_accuracy": 0.744629728794098, + "num_tokens": 2312064.0, + "step": 680 + }, + { + "epoch": 0.006925207756232687, + "learning_rate": 0.00019861696575534948, + "loss": 0.8235, + "mean_token_accuracy": 0.7626911222934722, + "num_tokens": 2345670.0, + "step": 690 + }, + { + "epoch": 0.007025573086033161, + "learning_rate": 0.0001985968926893894, + "loss": 0.8921, + "mean_token_accuracy": 0.7451446413993835, + "num_tokens": 2379617.0, + "step": 700 + }, + { + "epoch": 0.007125938415833634, + "learning_rate": 0.0001985768196234293, + "loss": 0.8448, + "mean_token_accuracy": 0.7558365881443023, + "num_tokens": 2414653.0, + "step": 710 + }, + { + "epoch": 0.007226303745634108, + "learning_rate": 0.00019855674655746918, + "loss": 0.8762, + "mean_token_accuracy": 0.7509781241416931, + "num_tokens": 2448981.0, + "step": 720 + }, + { + "epoch": 0.007326669075434582, + "learning_rate": 0.00019853667349150911, + "loss": 0.8753, + "mean_token_accuracy": 0.7493642330169678, + "num_tokens": 2483413.0, + "step": 730 + }, + { + "epoch": 0.0074270344052350555, + "learning_rate": 0.000198516600425549, + "loss": 0.8811, + "mean_token_accuracy": 0.7473379790782928, + "num_tokens": 2516947.0, + "step": 740 + }, + { + "epoch": 0.0075273997350355296, + "learning_rate": 0.00019849652735958893, + "loss": 0.8589, + "mean_token_accuracy": 0.7478324592113494, + "num_tokens": 2551303.0, + "step": 750 + }, + { + "epoch": 0.007627765064836003, + "learning_rate": 0.0001984764542936288, + "loss": 0.9073, + "mean_token_accuracy": 0.7422046661376953, + "num_tokens": 2585751.0, + "step": 760 + }, + { + "epoch": 0.007728130394636477, + "learning_rate": 0.00019845638122766872, + "loss": 0.8407, + "mean_token_accuracy": 0.7600900292396545, + "num_tokens": 2620871.0, + "step": 770 + }, + { + "epoch": 0.007828495724436951, + "learning_rate": 0.00019843630816170863, + "loss": 0.8666, + "mean_token_accuracy": 0.7502162098884583, + "num_tokens": 2654342.0, + "step": 780 + }, + { + "epoch": 0.007928861054237424, + "learning_rate": 0.00019841623509574854, + "loss": 0.8833, + "mean_token_accuracy": 0.7511953830718994, + "num_tokens": 2689101.0, + "step": 790 + }, + { + "epoch": 0.008029226384037897, + "learning_rate": 0.00019839616202978845, + "loss": 0.8698, + "mean_token_accuracy": 0.7504532694816589, + "num_tokens": 2723619.0, + "step": 800 + }, + { + "epoch": 0.008129591713838372, + "learning_rate": 0.00019837608896382836, + "loss": 0.8612, + "mean_token_accuracy": 0.7555593311786651, + "num_tokens": 2756956.0, + "step": 810 + }, + { + "epoch": 0.008229957043638846, + "learning_rate": 0.00019835601589786826, + "loss": 0.8864, + "mean_token_accuracy": 0.7532445669174195, + "num_tokens": 2790576.0, + "step": 820 + }, + { + "epoch": 0.008330322373439319, + "learning_rate": 0.00019833594283190815, + "loss": 0.8861, + "mean_token_accuracy": 0.7430309534072876, + "num_tokens": 2823827.0, + "step": 830 + }, + { + "epoch": 0.008430687703239792, + "learning_rate": 0.00019831586976594808, + "loss": 0.8871, + "mean_token_accuracy": 0.7462802588939667, + "num_tokens": 2858359.0, + "step": 840 + }, + { + "epoch": 0.008531053033040267, + "learning_rate": 0.00019829579669998796, + "loss": 0.8695, + "mean_token_accuracy": 0.7541916847229004, + "num_tokens": 2892919.0, + "step": 850 + }, + { + "epoch": 0.00863141836284074, + "learning_rate": 0.00019827572363402787, + "loss": 0.8838, + "mean_token_accuracy": 0.7506275475025177, + "num_tokens": 2927106.0, + "step": 860 + }, + { + "epoch": 0.008731783692641213, + "learning_rate": 0.00019825565056806778, + "loss": 0.8475, + "mean_token_accuracy": 0.7548351526260376, + "num_tokens": 2960466.0, + "step": 870 + }, + { + "epoch": 0.008832149022441688, + "learning_rate": 0.0001982355775021077, + "loss": 0.8557, + "mean_token_accuracy": 0.7527715265750885, + "num_tokens": 2993569.0, + "step": 880 + }, + { + "epoch": 0.008932514352242162, + "learning_rate": 0.00019821550443614757, + "loss": 0.8773, + "mean_token_accuracy": 0.7506238102912903, + "num_tokens": 3028181.0, + "step": 890 + }, + { + "epoch": 0.009032879682042635, + "learning_rate": 0.0001981954313701875, + "loss": 0.8718, + "mean_token_accuracy": 0.7520479619503021, + "num_tokens": 3061934.0, + "step": 900 + }, + { + "epoch": 0.00913324501184311, + "learning_rate": 0.00019817535830422739, + "loss": 0.8554, + "mean_token_accuracy": 0.7517975449562073, + "num_tokens": 3095089.0, + "step": 910 + }, + { + "epoch": 0.009233610341643583, + "learning_rate": 0.0001981552852382673, + "loss": 0.8492, + "mean_token_accuracy": 0.7479332447052002, + "num_tokens": 3129099.0, + "step": 920 + }, + { + "epoch": 0.009333975671444056, + "learning_rate": 0.00019813521217230723, + "loss": 0.8679, + "mean_token_accuracy": 0.749633401632309, + "num_tokens": 3162147.0, + "step": 930 + }, + { + "epoch": 0.00943434100124453, + "learning_rate": 0.0001981151391063471, + "loss": 0.8895, + "mean_token_accuracy": 0.7500181376934052, + "num_tokens": 3196315.0, + "step": 940 + }, + { + "epoch": 0.009534706331045004, + "learning_rate": 0.00019809506604038702, + "loss": 0.8793, + "mean_token_accuracy": 0.7507654368877411, + "num_tokens": 3230752.0, + "step": 950 + }, + { + "epoch": 0.009635071660845478, + "learning_rate": 0.00019807499297442693, + "loss": 0.848, + "mean_token_accuracy": 0.7560262858867646, + "num_tokens": 3264343.0, + "step": 960 + }, + { + "epoch": 0.00973543699064595, + "learning_rate": 0.00019805491990846684, + "loss": 0.8647, + "mean_token_accuracy": 0.7528027355670929, + "num_tokens": 3298563.0, + "step": 970 + }, + { + "epoch": 0.009835802320446426, + "learning_rate": 0.00019803484684250672, + "loss": 0.8385, + "mean_token_accuracy": 0.7556717336177826, + "num_tokens": 3332120.0, + "step": 980 + }, + { + "epoch": 0.009936167650246899, + "learning_rate": 0.00019801477377654665, + "loss": 0.8657, + "mean_token_accuracy": 0.7579919815063476, + "num_tokens": 3366253.0, + "step": 990 + }, + { + "epoch": 0.010036532980047372, + "learning_rate": 0.00019799470071058653, + "loss": 0.8592, + "mean_token_accuracy": 0.7515231788158416, + "num_tokens": 3399434.0, + "step": 1000 + }, + { + "epoch": 0.010136898309847845, + "learning_rate": 0.00019797462764462644, + "loss": 0.8361, + "mean_token_accuracy": 0.7587453186511993, + "num_tokens": 3433578.0, + "step": 1010 + }, + { + "epoch": 0.01023726363964832, + "learning_rate": 0.00019795455457866635, + "loss": 0.834, + "mean_token_accuracy": 0.7555178880691529, + "num_tokens": 3467942.0, + "step": 1020 + }, + { + "epoch": 0.010337628969448794, + "learning_rate": 0.00019793448151270626, + "loss": 0.8569, + "mean_token_accuracy": 0.7506053686141968, + "num_tokens": 3502285.0, + "step": 1030 + }, + { + "epoch": 0.010437994299249267, + "learning_rate": 0.00019791440844674617, + "loss": 0.8725, + "mean_token_accuracy": 0.7484077334403991, + "num_tokens": 3536182.0, + "step": 1040 + }, + { + "epoch": 0.010538359629049742, + "learning_rate": 0.00019789433538078608, + "loss": 0.8061, + "mean_token_accuracy": 0.7640980839729309, + "num_tokens": 3570133.0, + "step": 1050 + }, + { + "epoch": 0.010638724958850215, + "learning_rate": 0.00019787426231482598, + "loss": 0.8913, + "mean_token_accuracy": 0.7447064459323883, + "num_tokens": 3604046.0, + "step": 1060 + }, + { + "epoch": 0.010739090288650688, + "learning_rate": 0.00019785418924886587, + "loss": 0.8695, + "mean_token_accuracy": 0.7490169048309326, + "num_tokens": 3638337.0, + "step": 1070 + }, + { + "epoch": 0.010839455618451161, + "learning_rate": 0.0001978341161829058, + "loss": 0.861, + "mean_token_accuracy": 0.7469825208187103, + "num_tokens": 3672695.0, + "step": 1080 + }, + { + "epoch": 0.010939820948251636, + "learning_rate": 0.00019781404311694568, + "loss": 0.8901, + "mean_token_accuracy": 0.7456781506538391, + "num_tokens": 3707086.0, + "step": 1090 + }, + { + "epoch": 0.01104018627805211, + "learning_rate": 0.0001977939700509856, + "loss": 0.8429, + "mean_token_accuracy": 0.7588579893112183, + "num_tokens": 3740519.0, + "step": 1100 + }, + { + "epoch": 0.011140551607852583, + "learning_rate": 0.0001977738969850255, + "loss": 0.8728, + "mean_token_accuracy": 0.7522070944309235, + "num_tokens": 3774450.0, + "step": 1110 + }, + { + "epoch": 0.011240916937653058, + "learning_rate": 0.0001977538239190654, + "loss": 0.8837, + "mean_token_accuracy": 0.7503505706787109, + "num_tokens": 3808768.0, + "step": 1120 + }, + { + "epoch": 0.011341282267453531, + "learning_rate": 0.00019773375085310532, + "loss": 0.8359, + "mean_token_accuracy": 0.7603037297725678, + "num_tokens": 3843046.0, + "step": 1130 + }, + { + "epoch": 0.011441647597254004, + "learning_rate": 0.00019771367778714523, + "loss": 0.8845, + "mean_token_accuracy": 0.7438742220401764, + "num_tokens": 3876186.0, + "step": 1140 + }, + { + "epoch": 0.011542012927054479, + "learning_rate": 0.00019769360472118513, + "loss": 0.8405, + "mean_token_accuracy": 0.7548528850078583, + "num_tokens": 3910140.0, + "step": 1150 + }, + { + "epoch": 0.011642378256854952, + "learning_rate": 0.00019767353165522502, + "loss": 0.8441, + "mean_token_accuracy": 0.7579459309577942, + "num_tokens": 3944252.0, + "step": 1160 + }, + { + "epoch": 0.011742743586655426, + "learning_rate": 0.00019765345858926495, + "loss": 0.8564, + "mean_token_accuracy": 0.7527571260929108, + "num_tokens": 3978821.0, + "step": 1170 + }, + { + "epoch": 0.011843108916455899, + "learning_rate": 0.00019763338552330483, + "loss": 0.8654, + "mean_token_accuracy": 0.7558556854724884, + "num_tokens": 4013127.0, + "step": 1180 + }, + { + "epoch": 0.011943474246256374, + "learning_rate": 0.00019761331245734474, + "loss": 0.8622, + "mean_token_accuracy": 0.7480232536792755, + "num_tokens": 4047220.0, + "step": 1190 + }, + { + "epoch": 0.012043839576056847, + "learning_rate": 0.00019759323939138465, + "loss": 0.8616, + "mean_token_accuracy": 0.7525281727313995, + "num_tokens": 4081046.0, + "step": 1200 + }, + { + "epoch": 0.01214420490585732, + "learning_rate": 0.00019757316632542456, + "loss": 0.867, + "mean_token_accuracy": 0.748983871936798, + "num_tokens": 4115169.0, + "step": 1210 + }, + { + "epoch": 0.012244570235657795, + "learning_rate": 0.00019755309325946444, + "loss": 0.8851, + "mean_token_accuracy": 0.7456744372844696, + "num_tokens": 4149891.0, + "step": 1220 + }, + { + "epoch": 0.012344935565458268, + "learning_rate": 0.00019753302019350437, + "loss": 0.8321, + "mean_token_accuracy": 0.757876992225647, + "num_tokens": 4183258.0, + "step": 1230 + }, + { + "epoch": 0.012445300895258742, + "learning_rate": 0.00019751294712754426, + "loss": 0.8615, + "mean_token_accuracy": 0.7554275155067444, + "num_tokens": 4217359.0, + "step": 1240 + }, + { + "epoch": 0.012545666225059215, + "learning_rate": 0.00019749287406158416, + "loss": 0.856, + "mean_token_accuracy": 0.7524965465068817, + "num_tokens": 4251484.0, + "step": 1250 + }, + { + "epoch": 0.01264603155485969, + "learning_rate": 0.00019747280099562407, + "loss": 0.8659, + "mean_token_accuracy": 0.7591691255569458, + "num_tokens": 4285841.0, + "step": 1260 + }, + { + "epoch": 0.012746396884660163, + "learning_rate": 0.00019745272792966398, + "loss": 0.8621, + "mean_token_accuracy": 0.7493607640266419, + "num_tokens": 4318785.0, + "step": 1270 + }, + { + "epoch": 0.012846762214460636, + "learning_rate": 0.0001974326548637039, + "loss": 0.8471, + "mean_token_accuracy": 0.7562038958072662, + "num_tokens": 4352516.0, + "step": 1280 + }, + { + "epoch": 0.012947127544261111, + "learning_rate": 0.0001974125817977438, + "loss": 0.8829, + "mean_token_accuracy": 0.7481812596321106, + "num_tokens": 4385434.0, + "step": 1290 + }, + { + "epoch": 0.013047492874061584, + "learning_rate": 0.0001973925087317837, + "loss": 0.882, + "mean_token_accuracy": 0.7556095838546752, + "num_tokens": 4419873.0, + "step": 1300 + }, + { + "epoch": 0.013147858203862058, + "learning_rate": 0.00019737243566582361, + "loss": 0.84, + "mean_token_accuracy": 0.7592958688735962, + "num_tokens": 4454568.0, + "step": 1310 + }, + { + "epoch": 0.01324822353366253, + "learning_rate": 0.00019735236259986352, + "loss": 0.8413, + "mean_token_accuracy": 0.7540211915969849, + "num_tokens": 4488603.0, + "step": 1320 + }, + { + "epoch": 0.013348588863463006, + "learning_rate": 0.0001973322895339034, + "loss": 0.8775, + "mean_token_accuracy": 0.7487682044506073, + "num_tokens": 4522062.0, + "step": 1330 + }, + { + "epoch": 0.013448954193263479, + "learning_rate": 0.00019731221646794334, + "loss": 0.8799, + "mean_token_accuracy": 0.7497659981250763, + "num_tokens": 4556010.0, + "step": 1340 + }, + { + "epoch": 0.013549319523063952, + "learning_rate": 0.00019729214340198322, + "loss": 0.8476, + "mean_token_accuracy": 0.7548844814300537, + "num_tokens": 4589180.0, + "step": 1350 + }, + { + "epoch": 0.013649684852864427, + "learning_rate": 0.00019727207033602313, + "loss": 0.8683, + "mean_token_accuracy": 0.7509661138057708, + "num_tokens": 4621813.0, + "step": 1360 + }, + { + "epoch": 0.0137500501826649, + "learning_rate": 0.00019725199727006304, + "loss": 0.8475, + "mean_token_accuracy": 0.7586887240409851, + "num_tokens": 4655223.0, + "step": 1370 + }, + { + "epoch": 0.013850415512465374, + "learning_rate": 0.00019723192420410295, + "loss": 0.8623, + "mean_token_accuracy": 0.7530815541744232, + "num_tokens": 4688942.0, + "step": 1380 + }, + { + "epoch": 0.013950780842265849, + "learning_rate": 0.00019721185113814285, + "loss": 0.8928, + "mean_token_accuracy": 0.7447740018367768, + "num_tokens": 4722711.0, + "step": 1390 + }, + { + "epoch": 0.014051146172066322, + "learning_rate": 0.00019719177807218276, + "loss": 0.8438, + "mean_token_accuracy": 0.7587530732154846, + "num_tokens": 4756986.0, + "step": 1400 + }, + { + "epoch": 0.014151511501866795, + "learning_rate": 0.00019717170500622267, + "loss": 0.8618, + "mean_token_accuracy": 0.7547706186771392, + "num_tokens": 4790634.0, + "step": 1410 + }, + { + "epoch": 0.014251876831667268, + "learning_rate": 0.00019715163194026255, + "loss": 0.8517, + "mean_token_accuracy": 0.7552112579345703, + "num_tokens": 4824610.0, + "step": 1420 + }, + { + "epoch": 0.014352242161467743, + "learning_rate": 0.0001971315588743025, + "loss": 0.8669, + "mean_token_accuracy": 0.7512627184391022, + "num_tokens": 4858592.0, + "step": 1430 + }, + { + "epoch": 0.014452607491268216, + "learning_rate": 0.00019711148580834237, + "loss": 0.8912, + "mean_token_accuracy": 0.743174260854721, + "num_tokens": 4891961.0, + "step": 1440 + }, + { + "epoch": 0.01455297282106869, + "learning_rate": 0.00019709141274238228, + "loss": 0.8344, + "mean_token_accuracy": 0.7583801984786988, + "num_tokens": 4925217.0, + "step": 1450 + }, + { + "epoch": 0.014653338150869165, + "learning_rate": 0.0001970713396764222, + "loss": 0.837, + "mean_token_accuracy": 0.7593223810195923, + "num_tokens": 4958103.0, + "step": 1460 + }, + { + "epoch": 0.014753703480669638, + "learning_rate": 0.0001970512666104621, + "loss": 0.8856, + "mean_token_accuracy": 0.7498394906520843, + "num_tokens": 4991826.0, + "step": 1470 + }, + { + "epoch": 0.014854068810470111, + "learning_rate": 0.000197031193544502, + "loss": 0.8543, + "mean_token_accuracy": 0.7504751682281494, + "num_tokens": 5024795.0, + "step": 1480 + }, + { + "epoch": 0.014954434140270584, + "learning_rate": 0.0001970111204785419, + "loss": 0.8593, + "mean_token_accuracy": 0.7564951300621032, + "num_tokens": 5058977.0, + "step": 1490 + }, + { + "epoch": 0.015054799470071059, + "learning_rate": 0.00019699104741258182, + "loss": 0.8904, + "mean_token_accuracy": 0.7444755256175994, + "num_tokens": 5093915.0, + "step": 1500 + }, + { + "epoch": 0.015155164799871532, + "learning_rate": 0.0001969709743466217, + "loss": 0.8556, + "mean_token_accuracy": 0.7554027199745178, + "num_tokens": 5128235.0, + "step": 1510 + }, + { + "epoch": 0.015255530129672006, + "learning_rate": 0.00019695090128066164, + "loss": 0.8499, + "mean_token_accuracy": 0.7527681648731231, + "num_tokens": 5163167.0, + "step": 1520 + }, + { + "epoch": 0.01535589545947248, + "learning_rate": 0.00019693082821470152, + "loss": 0.8481, + "mean_token_accuracy": 0.7494793772697449, + "num_tokens": 5197445.0, + "step": 1530 + }, + { + "epoch": 0.015456260789272954, + "learning_rate": 0.00019691075514874143, + "loss": 0.8476, + "mean_token_accuracy": 0.7548111736774444, + "num_tokens": 5231705.0, + "step": 1540 + }, + { + "epoch": 0.015556626119073427, + "learning_rate": 0.00019689068208278134, + "loss": 0.8589, + "mean_token_accuracy": 0.7536470830440521, + "num_tokens": 5266220.0, + "step": 1550 + }, + { + "epoch": 0.015656991448873902, + "learning_rate": 0.00019687060901682124, + "loss": 0.8563, + "mean_token_accuracy": 0.753504478931427, + "num_tokens": 5300098.0, + "step": 1560 + }, + { + "epoch": 0.015757356778674375, + "learning_rate": 0.00019685053595086113, + "loss": 0.8322, + "mean_token_accuracy": 0.7565286755561829, + "num_tokens": 5334353.0, + "step": 1570 + }, + { + "epoch": 0.01585772210847485, + "learning_rate": 0.00019683046288490106, + "loss": 0.853, + "mean_token_accuracy": 0.7614298403263092, + "num_tokens": 5368411.0, + "step": 1580 + }, + { + "epoch": 0.01595808743827532, + "learning_rate": 0.00019681038981894094, + "loss": 0.855, + "mean_token_accuracy": 0.755518627166748, + "num_tokens": 5402236.0, + "step": 1590 + }, + { + "epoch": 0.016058452768075795, + "learning_rate": 0.00019679031675298085, + "loss": 0.8521, + "mean_token_accuracy": 0.7516325056552887, + "num_tokens": 5436012.0, + "step": 1600 + }, + { + "epoch": 0.016158818097876268, + "learning_rate": 0.00019677024368702076, + "loss": 0.8508, + "mean_token_accuracy": 0.7498721599578857, + "num_tokens": 5470369.0, + "step": 1610 + }, + { + "epoch": 0.016259183427676745, + "learning_rate": 0.00019675017062106067, + "loss": 0.8265, + "mean_token_accuracy": 0.7556636273860932, + "num_tokens": 5504487.0, + "step": 1620 + }, + { + "epoch": 0.016359548757477218, + "learning_rate": 0.00019673009755510058, + "loss": 0.8231, + "mean_token_accuracy": 0.75765740275383, + "num_tokens": 5538679.0, + "step": 1630 + }, + { + "epoch": 0.01645991408727769, + "learning_rate": 0.00019671002448914048, + "loss": 0.8756, + "mean_token_accuracy": 0.7481065690517426, + "num_tokens": 5573500.0, + "step": 1640 + }, + { + "epoch": 0.016560279417078164, + "learning_rate": 0.0001966899514231804, + "loss": 0.8371, + "mean_token_accuracy": 0.7557444095611572, + "num_tokens": 5607047.0, + "step": 1650 + }, + { + "epoch": 0.016660644746878638, + "learning_rate": 0.00019666987835722027, + "loss": 0.8114, + "mean_token_accuracy": 0.7623445272445679, + "num_tokens": 5641450.0, + "step": 1660 + }, + { + "epoch": 0.01676101007667911, + "learning_rate": 0.0001966498052912602, + "loss": 0.8551, + "mean_token_accuracy": 0.7489903330802917, + "num_tokens": 5674856.0, + "step": 1670 + }, + { + "epoch": 0.016861375406479584, + "learning_rate": 0.0001966297322253001, + "loss": 0.8021, + "mean_token_accuracy": 0.7655105769634247, + "num_tokens": 5708295.0, + "step": 1680 + }, + { + "epoch": 0.01696174073628006, + "learning_rate": 0.00019660965915934, + "loss": 0.8195, + "mean_token_accuracy": 0.7606033682823181, + "num_tokens": 5743318.0, + "step": 1690 + }, + { + "epoch": 0.017062106066080534, + "learning_rate": 0.0001965895860933799, + "loss": 0.8305, + "mean_token_accuracy": 0.7644929349422455, + "num_tokens": 5776744.0, + "step": 1700 + }, + { + "epoch": 0.017162471395881007, + "learning_rate": 0.00019656951302741982, + "loss": 0.8261, + "mean_token_accuracy": 0.7594692170619964, + "num_tokens": 5810694.0, + "step": 1710 + }, + { + "epoch": 0.01726283672568148, + "learning_rate": 0.00019654943996145972, + "loss": 0.8369, + "mean_token_accuracy": 0.7587471783161164, + "num_tokens": 5844392.0, + "step": 1720 + }, + { + "epoch": 0.017363202055481954, + "learning_rate": 0.00019652936689549963, + "loss": 0.8481, + "mean_token_accuracy": 0.7577917516231537, + "num_tokens": 5878431.0, + "step": 1730 + }, + { + "epoch": 0.017463567385282427, + "learning_rate": 0.00019650929382953954, + "loss": 0.8671, + "mean_token_accuracy": 0.7509515821933747, + "num_tokens": 5912731.0, + "step": 1740 + }, + { + "epoch": 0.017563932715082903, + "learning_rate": 0.00019648922076357942, + "loss": 0.8096, + "mean_token_accuracy": 0.7576501190662384, + "num_tokens": 5947053.0, + "step": 1750 + }, + { + "epoch": 0.017664298044883377, + "learning_rate": 0.00019646914769761936, + "loss": 0.8436, + "mean_token_accuracy": 0.7566677570343018, + "num_tokens": 5980908.0, + "step": 1760 + }, + { + "epoch": 0.01776466337468385, + "learning_rate": 0.00019644907463165924, + "loss": 0.8523, + "mean_token_accuracy": 0.7544825732707977, + "num_tokens": 6014535.0, + "step": 1770 + }, + { + "epoch": 0.017865028704484323, + "learning_rate": 0.00019642900156569915, + "loss": 0.8506, + "mean_token_accuracy": 0.7533735692501068, + "num_tokens": 6048756.0, + "step": 1780 + }, + { + "epoch": 0.017965394034284796, + "learning_rate": 0.00019640892849973906, + "loss": 0.8556, + "mean_token_accuracy": 0.752546352148056, + "num_tokens": 6082752.0, + "step": 1790 + }, + { + "epoch": 0.01806575936408527, + "learning_rate": 0.00019638885543377897, + "loss": 0.8173, + "mean_token_accuracy": 0.7617668688297272, + "num_tokens": 6116502.0, + "step": 1800 + }, + { + "epoch": 0.018166124693885743, + "learning_rate": 0.00019636878236781885, + "loss": 0.8204, + "mean_token_accuracy": 0.7598871469497681, + "num_tokens": 6150826.0, + "step": 1810 + }, + { + "epoch": 0.01826649002368622, + "learning_rate": 0.00019634870930185878, + "loss": 0.8139, + "mean_token_accuracy": 0.7583870530128479, + "num_tokens": 6185500.0, + "step": 1820 + }, + { + "epoch": 0.018366855353486693, + "learning_rate": 0.0001963286362358987, + "loss": 0.8235, + "mean_token_accuracy": 0.7577989399433136, + "num_tokens": 6219531.0, + "step": 1830 + }, + { + "epoch": 0.018467220683287166, + "learning_rate": 0.00019630856316993857, + "loss": 0.851, + "mean_token_accuracy": 0.7582792520523072, + "num_tokens": 6253286.0, + "step": 1840 + }, + { + "epoch": 0.01856758601308764, + "learning_rate": 0.0001962884901039785, + "loss": 0.8811, + "mean_token_accuracy": 0.7497155666351318, + "num_tokens": 6287058.0, + "step": 1850 + }, + { + "epoch": 0.018667951342888112, + "learning_rate": 0.0001962684170380184, + "loss": 0.8278, + "mean_token_accuracy": 0.7637346804141998, + "num_tokens": 6321137.0, + "step": 1860 + }, + { + "epoch": 0.018768316672688586, + "learning_rate": 0.0001962483439720583, + "loss": 0.8389, + "mean_token_accuracy": 0.7530131101608276, + "num_tokens": 6355801.0, + "step": 1870 + }, + { + "epoch": 0.01886868200248906, + "learning_rate": 0.0001962282709060982, + "loss": 0.8367, + "mean_token_accuracy": 0.7559464156627655, + "num_tokens": 6388657.0, + "step": 1880 + }, + { + "epoch": 0.018969047332289535, + "learning_rate": 0.00019620819784013811, + "loss": 0.829, + "mean_token_accuracy": 0.7582254111766815, + "num_tokens": 6422783.0, + "step": 1890 + }, + { + "epoch": 0.01906941266209001, + "learning_rate": 0.00019618812477417802, + "loss": 0.8133, + "mean_token_accuracy": 0.7625649392604827, + "num_tokens": 6457489.0, + "step": 1900 + }, + { + "epoch": 0.019169777991890482, + "learning_rate": 0.00019616805170821793, + "loss": 0.8093, + "mean_token_accuracy": 0.7617171883583069, + "num_tokens": 6491382.0, + "step": 1910 + }, + { + "epoch": 0.019270143321690955, + "learning_rate": 0.0001961479786422578, + "loss": 0.8071, + "mean_token_accuracy": 0.7619174361228943, + "num_tokens": 6525576.0, + "step": 1920 + }, + { + "epoch": 0.01937050865149143, + "learning_rate": 0.00019612790557629775, + "loss": 0.8224, + "mean_token_accuracy": 0.7651695072650909, + "num_tokens": 6559225.0, + "step": 1930 + }, + { + "epoch": 0.0194708739812919, + "learning_rate": 0.00019610783251033763, + "loss": 0.855, + "mean_token_accuracy": 0.7547216534614563, + "num_tokens": 6593907.0, + "step": 1940 + }, + { + "epoch": 0.019571239311092375, + "learning_rate": 0.00019608775944437754, + "loss": 0.8261, + "mean_token_accuracy": 0.7579889893531799, + "num_tokens": 6628286.0, + "step": 1950 + }, + { + "epoch": 0.01967160464089285, + "learning_rate": 0.00019606768637841745, + "loss": 0.8517, + "mean_token_accuracy": 0.7559162437915802, + "num_tokens": 6662442.0, + "step": 1960 + }, + { + "epoch": 0.019771969970693325, + "learning_rate": 0.00019604761331245735, + "loss": 0.8528, + "mean_token_accuracy": 0.7507839500904083, + "num_tokens": 6696329.0, + "step": 1970 + }, + { + "epoch": 0.019872335300493798, + "learning_rate": 0.00019602754024649726, + "loss": 0.8579, + "mean_token_accuracy": 0.7551623106002807, + "num_tokens": 6730903.0, + "step": 1980 + }, + { + "epoch": 0.01997270063029427, + "learning_rate": 0.00019600746718053717, + "loss": 0.8307, + "mean_token_accuracy": 0.7526181817054749, + "num_tokens": 6763865.0, + "step": 1990 + }, + { + "epoch": 0.020073065960094744, + "learning_rate": 0.00019598739411457708, + "loss": 0.8469, + "mean_token_accuracy": 0.7611814558506012, + "num_tokens": 6798513.0, + "step": 2000 + }, + { + "epoch": 0.020173431289895218, + "learning_rate": 0.00019596732104861696, + "loss": 0.8208, + "mean_token_accuracy": 0.7589188933372497, + "num_tokens": 6832618.0, + "step": 2010 + }, + { + "epoch": 0.02027379661969569, + "learning_rate": 0.0001959472479826569, + "loss": 0.8369, + "mean_token_accuracy": 0.749679434299469, + "num_tokens": 6866166.0, + "step": 2020 + }, + { + "epoch": 0.020374161949496167, + "learning_rate": 0.00019592717491669678, + "loss": 0.8788, + "mean_token_accuracy": 0.7494403779506683, + "num_tokens": 6899501.0, + "step": 2030 + }, + { + "epoch": 0.02047452727929664, + "learning_rate": 0.00019590710185073669, + "loss": 0.8044, + "mean_token_accuracy": 0.7660996496677399, + "num_tokens": 6933758.0, + "step": 2040 + }, + { + "epoch": 0.020574892609097114, + "learning_rate": 0.0001958870287847766, + "loss": 0.8321, + "mean_token_accuracy": 0.7600698232650757, + "num_tokens": 6967869.0, + "step": 2050 + }, + { + "epoch": 0.020675257938897587, + "learning_rate": 0.0001958669557188165, + "loss": 0.8138, + "mean_token_accuracy": 0.7660489320755005, + "num_tokens": 7002140.0, + "step": 2060 + }, + { + "epoch": 0.02077562326869806, + "learning_rate": 0.0001958468826528564, + "loss": 0.8206, + "mean_token_accuracy": 0.7583360552787781, + "num_tokens": 7035964.0, + "step": 2070 + }, + { + "epoch": 0.020875988598498534, + "learning_rate": 0.00019582680958689632, + "loss": 0.8539, + "mean_token_accuracy": 0.7558043360710144, + "num_tokens": 7069864.0, + "step": 2080 + }, + { + "epoch": 0.020976353928299007, + "learning_rate": 0.00019580673652093623, + "loss": 0.8416, + "mean_token_accuracy": 0.754914653301239, + "num_tokens": 7104474.0, + "step": 2090 + }, + { + "epoch": 0.021076719258099483, + "learning_rate": 0.0001957866634549761, + "loss": 0.8469, + "mean_token_accuracy": 0.75110724568367, + "num_tokens": 7139229.0, + "step": 2100 + }, + { + "epoch": 0.021177084587899957, + "learning_rate": 0.00019576659038901605, + "loss": 0.8357, + "mean_token_accuracy": 0.755988621711731, + "num_tokens": 7173015.0, + "step": 2110 + }, + { + "epoch": 0.02127744991770043, + "learning_rate": 0.00019574651732305593, + "loss": 0.8501, + "mean_token_accuracy": 0.75484619140625, + "num_tokens": 7206350.0, + "step": 2120 + }, + { + "epoch": 0.021377815247500903, + "learning_rate": 0.00019572644425709584, + "loss": 0.8369, + "mean_token_accuracy": 0.7622098982334137, + "num_tokens": 7240468.0, + "step": 2130 + }, + { + "epoch": 0.021478180577301376, + "learning_rate": 0.00019570637119113574, + "loss": 0.8346, + "mean_token_accuracy": 0.7651883065700531, + "num_tokens": 7274498.0, + "step": 2140 + }, + { + "epoch": 0.02157854590710185, + "learning_rate": 0.00019568629812517565, + "loss": 0.8617, + "mean_token_accuracy": 0.7555427491664887, + "num_tokens": 7307634.0, + "step": 2150 + }, + { + "epoch": 0.021678911236902323, + "learning_rate": 0.00019566622505921553, + "loss": 0.8433, + "mean_token_accuracy": 0.7512418270111084, + "num_tokens": 7341779.0, + "step": 2160 + }, + { + "epoch": 0.0217792765667028, + "learning_rate": 0.00019564615199325547, + "loss": 0.8554, + "mean_token_accuracy": 0.753146630525589, + "num_tokens": 7375947.0, + "step": 2170 + }, + { + "epoch": 0.021879641896503273, + "learning_rate": 0.00019562607892729538, + "loss": 0.8531, + "mean_token_accuracy": 0.7535173892974854, + "num_tokens": 7410782.0, + "step": 2180 + }, + { + "epoch": 0.021980007226303746, + "learning_rate": 0.00019560600586133526, + "loss": 0.8368, + "mean_token_accuracy": 0.7546063840389252, + "num_tokens": 7443934.0, + "step": 2190 + }, + { + "epoch": 0.02208037255610422, + "learning_rate": 0.0001955859327953752, + "loss": 0.8564, + "mean_token_accuracy": 0.756107634305954, + "num_tokens": 7478420.0, + "step": 2200 + }, + { + "epoch": 0.022180737885904692, + "learning_rate": 0.00019556585972941508, + "loss": 0.8275, + "mean_token_accuracy": 0.7583844363689423, + "num_tokens": 7512780.0, + "step": 2210 + }, + { + "epoch": 0.022281103215705166, + "learning_rate": 0.00019554578666345498, + "loss": 0.8519, + "mean_token_accuracy": 0.7547212541103363, + "num_tokens": 7547171.0, + "step": 2220 + }, + { + "epoch": 0.022381468545505642, + "learning_rate": 0.0001955257135974949, + "loss": 0.8197, + "mean_token_accuracy": 0.757226973772049, + "num_tokens": 7581359.0, + "step": 2230 + }, + { + "epoch": 0.022481833875306115, + "learning_rate": 0.0001955056405315348, + "loss": 0.8461, + "mean_token_accuracy": 0.7656774163246155, + "num_tokens": 7615372.0, + "step": 2240 + }, + { + "epoch": 0.02258219920510659, + "learning_rate": 0.00019548556746557468, + "loss": 0.8458, + "mean_token_accuracy": 0.7544702410697937, + "num_tokens": 7649479.0, + "step": 2250 + }, + { + "epoch": 0.022682564534907062, + "learning_rate": 0.00019546549439961462, + "loss": 0.8542, + "mean_token_accuracy": 0.7525253236293793, + "num_tokens": 7683870.0, + "step": 2260 + }, + { + "epoch": 0.022782929864707535, + "learning_rate": 0.0001954454213336545, + "loss": 0.8423, + "mean_token_accuracy": 0.7568866968154907, + "num_tokens": 7717550.0, + "step": 2270 + }, + { + "epoch": 0.02288329519450801, + "learning_rate": 0.0001954253482676944, + "loss": 0.822, + "mean_token_accuracy": 0.7563924074172974, + "num_tokens": 7751661.0, + "step": 2280 + }, + { + "epoch": 0.02298366052430848, + "learning_rate": 0.00019540527520173432, + "loss": 0.8308, + "mean_token_accuracy": 0.7572165787220001, + "num_tokens": 7786291.0, + "step": 2290 + }, + { + "epoch": 0.023084025854108958, + "learning_rate": 0.00019538520213577422, + "loss": 0.793, + "mean_token_accuracy": 0.7661900997161866, + "num_tokens": 7820722.0, + "step": 2300 + }, + { + "epoch": 0.02318439118390943, + "learning_rate": 0.00019536512906981413, + "loss": 0.8043, + "mean_token_accuracy": 0.7659907758235931, + "num_tokens": 7855180.0, + "step": 2310 + }, + { + "epoch": 0.023284756513709905, + "learning_rate": 0.00019534505600385404, + "loss": 0.7967, + "mean_token_accuracy": 0.7661457180976867, + "num_tokens": 7888552.0, + "step": 2320 + }, + { + "epoch": 0.023385121843510378, + "learning_rate": 0.00019532498293789395, + "loss": 0.8339, + "mean_token_accuracy": 0.7558695316314697, + "num_tokens": 7921169.0, + "step": 2330 + }, + { + "epoch": 0.02348548717331085, + "learning_rate": 0.00019530490987193383, + "loss": 0.8095, + "mean_token_accuracy": 0.76091068983078, + "num_tokens": 7955024.0, + "step": 2340 + }, + { + "epoch": 0.023585852503111324, + "learning_rate": 0.00019528483680597377, + "loss": 0.8205, + "mean_token_accuracy": 0.7617243111133576, + "num_tokens": 7988653.0, + "step": 2350 + }, + { + "epoch": 0.023686217832911798, + "learning_rate": 0.00019526476374001365, + "loss": 0.826, + "mean_token_accuracy": 0.7584989905357361, + "num_tokens": 8022319.0, + "step": 2360 + }, + { + "epoch": 0.023786583162712274, + "learning_rate": 0.00019524469067405356, + "loss": 0.827, + "mean_token_accuracy": 0.7621460676193237, + "num_tokens": 8055876.0, + "step": 2370 + }, + { + "epoch": 0.023886948492512747, + "learning_rate": 0.00019522461760809346, + "loss": 0.797, + "mean_token_accuracy": 0.7639261364936829, + "num_tokens": 8089693.0, + "step": 2380 + }, + { + "epoch": 0.02398731382231322, + "learning_rate": 0.00019520454454213337, + "loss": 0.8024, + "mean_token_accuracy": 0.7636609375476837, + "num_tokens": 8124115.0, + "step": 2390 + }, + { + "epoch": 0.024087679152113694, + "learning_rate": 0.00019518447147617328, + "loss": 0.8272, + "mean_token_accuracy": 0.7648244261741638, + "num_tokens": 8158023.0, + "step": 2400 + }, + { + "epoch": 0.024188044481914167, + "learning_rate": 0.0001951643984102132, + "loss": 0.8149, + "mean_token_accuracy": 0.7608605980873108, + "num_tokens": 8192278.0, + "step": 2410 + }, + { + "epoch": 0.02428840981171464, + "learning_rate": 0.0001951443253442531, + "loss": 0.8373, + "mean_token_accuracy": 0.755948281288147, + "num_tokens": 8226602.0, + "step": 2420 + }, + { + "epoch": 0.024388775141515114, + "learning_rate": 0.00019512425227829298, + "loss": 0.8351, + "mean_token_accuracy": 0.7608046889305115, + "num_tokens": 8260675.0, + "step": 2430 + }, + { + "epoch": 0.02448914047131559, + "learning_rate": 0.00019510417921233292, + "loss": 0.7979, + "mean_token_accuracy": 0.7635708749294281, + "num_tokens": 8294714.0, + "step": 2440 + }, + { + "epoch": 0.024589505801116063, + "learning_rate": 0.0001950841061463728, + "loss": 0.853, + "mean_token_accuracy": 0.7571332097053528, + "num_tokens": 8328444.0, + "step": 2450 + }, + { + "epoch": 0.024689871130916537, + "learning_rate": 0.00019506403308041273, + "loss": 0.8606, + "mean_token_accuracy": 0.744694834947586, + "num_tokens": 8362891.0, + "step": 2460 + }, + { + "epoch": 0.02479023646071701, + "learning_rate": 0.0001950439600144526, + "loss": 0.8332, + "mean_token_accuracy": 0.7588581085205078, + "num_tokens": 8397433.0, + "step": 2470 + }, + { + "epoch": 0.024890601790517483, + "learning_rate": 0.00019502388694849252, + "loss": 0.8089, + "mean_token_accuracy": 0.7658759117126465, + "num_tokens": 8431278.0, + "step": 2480 + }, + { + "epoch": 0.024990967120317956, + "learning_rate": 0.00019500381388253243, + "loss": 0.8243, + "mean_token_accuracy": 0.759179824590683, + "num_tokens": 8465674.0, + "step": 2490 + }, + { + "epoch": 0.02509133245011843, + "learning_rate": 0.00019498374081657234, + "loss": 0.8507, + "mean_token_accuracy": 0.7583933115005493, + "num_tokens": 8499186.0, + "step": 2500 + }, + { + "epoch": 0.025191697779918906, + "learning_rate": 0.00019496366775061222, + "loss": 0.8371, + "mean_token_accuracy": 0.7609995067119598, + "num_tokens": 8533547.0, + "step": 2510 + }, + { + "epoch": 0.02529206310971938, + "learning_rate": 0.00019494359468465216, + "loss": 0.8217, + "mean_token_accuracy": 0.7622859716415405, + "num_tokens": 8568232.0, + "step": 2520 + }, + { + "epoch": 0.025392428439519853, + "learning_rate": 0.00019492352161869206, + "loss": 0.8346, + "mean_token_accuracy": 0.7621785938739777, + "num_tokens": 8602586.0, + "step": 2530 + }, + { + "epoch": 0.025492793769320326, + "learning_rate": 0.00019490344855273195, + "loss": 0.8109, + "mean_token_accuracy": 0.7586685180664062, + "num_tokens": 8636640.0, + "step": 2540 + }, + { + "epoch": 0.0255931590991208, + "learning_rate": 0.00019488337548677188, + "loss": 0.8157, + "mean_token_accuracy": 0.7647418260574341, + "num_tokens": 8670420.0, + "step": 2550 + }, + { + "epoch": 0.025693524428921272, + "learning_rate": 0.00019486330242081176, + "loss": 0.8071, + "mean_token_accuracy": 0.7660414576530457, + "num_tokens": 8704404.0, + "step": 2560 + }, + { + "epoch": 0.025793889758721746, + "learning_rate": 0.00019484322935485167, + "loss": 0.8118, + "mean_token_accuracy": 0.763026088476181, + "num_tokens": 8738337.0, + "step": 2570 + }, + { + "epoch": 0.025894255088522222, + "learning_rate": 0.00019482315628889158, + "loss": 0.8186, + "mean_token_accuracy": 0.7586533546447753, + "num_tokens": 8772155.0, + "step": 2580 + }, + { + "epoch": 0.025994620418322695, + "learning_rate": 0.0001948030832229315, + "loss": 0.8472, + "mean_token_accuracy": 0.7485378384590149, + "num_tokens": 8805291.0, + "step": 2590 + }, + { + "epoch": 0.02609498574812317, + "learning_rate": 0.00019478301015697137, + "loss": 0.8416, + "mean_token_accuracy": 0.7523237645626069, + "num_tokens": 8838352.0, + "step": 2600 + }, + { + "epoch": 0.026195351077923642, + "learning_rate": 0.0001947629370910113, + "loss": 0.834, + "mean_token_accuracy": 0.7580128014087677, + "num_tokens": 8871752.0, + "step": 2610 + }, + { + "epoch": 0.026295716407724115, + "learning_rate": 0.00019474286402505119, + "loss": 0.8085, + "mean_token_accuracy": 0.7614288806915284, + "num_tokens": 8906014.0, + "step": 2620 + }, + { + "epoch": 0.02639608173752459, + "learning_rate": 0.0001947227909590911, + "loss": 0.8158, + "mean_token_accuracy": 0.7616944968700409, + "num_tokens": 8941204.0, + "step": 2630 + }, + { + "epoch": 0.02649644706732506, + "learning_rate": 0.000194702717893131, + "loss": 0.8104, + "mean_token_accuracy": 0.7650873243808747, + "num_tokens": 8974391.0, + "step": 2640 + }, + { + "epoch": 0.026596812397125538, + "learning_rate": 0.0001946826448271709, + "loss": 0.7893, + "mean_token_accuracy": 0.7691265761852264, + "num_tokens": 9008066.0, + "step": 2650 + }, + { + "epoch": 0.02669717772692601, + "learning_rate": 0.00019466257176121082, + "loss": 0.7948, + "mean_token_accuracy": 0.7700909733772278, + "num_tokens": 9042380.0, + "step": 2660 + }, + { + "epoch": 0.026797543056726485, + "learning_rate": 0.00019464249869525073, + "loss": 0.8391, + "mean_token_accuracy": 0.7572174370288849, + "num_tokens": 9076897.0, + "step": 2670 + }, + { + "epoch": 0.026897908386526958, + "learning_rate": 0.00019462242562929064, + "loss": 0.8382, + "mean_token_accuracy": 0.7565006077289581, + "num_tokens": 9110755.0, + "step": 2680 + }, + { + "epoch": 0.02699827371632743, + "learning_rate": 0.00019460235256333052, + "loss": 0.8443, + "mean_token_accuracy": 0.7534610092639923, + "num_tokens": 9144780.0, + "step": 2690 + }, + { + "epoch": 0.027098639046127904, + "learning_rate": 0.00019458227949737045, + "loss": 0.8376, + "mean_token_accuracy": 0.751280415058136, + "num_tokens": 9178297.0, + "step": 2700 + }, + { + "epoch": 0.02719900437592838, + "learning_rate": 0.00019456220643141033, + "loss": 0.8161, + "mean_token_accuracy": 0.7588511765003204, + "num_tokens": 9212281.0, + "step": 2710 + }, + { + "epoch": 0.027299369705728854, + "learning_rate": 0.00019454213336545024, + "loss": 0.8257, + "mean_token_accuracy": 0.7590669870376587, + "num_tokens": 9246800.0, + "step": 2720 + }, + { + "epoch": 0.027399735035529327, + "learning_rate": 0.00019452206029949015, + "loss": 0.8108, + "mean_token_accuracy": 0.7625915348529816, + "num_tokens": 9280862.0, + "step": 2730 + }, + { + "epoch": 0.0275001003653298, + "learning_rate": 0.00019450198723353006, + "loss": 0.7889, + "mean_token_accuracy": 0.7649468660354615, + "num_tokens": 9316013.0, + "step": 2740 + }, + { + "epoch": 0.027600465695130274, + "learning_rate": 0.00019448191416756997, + "loss": 0.8283, + "mean_token_accuracy": 0.7558753788471222, + "num_tokens": 9349913.0, + "step": 2750 + }, + { + "epoch": 0.027700831024930747, + "learning_rate": 0.00019446184110160988, + "loss": 0.7758, + "mean_token_accuracy": 0.7654128670692444, + "num_tokens": 9384092.0, + "step": 2760 + }, + { + "epoch": 0.02780119635473122, + "learning_rate": 0.00019444176803564979, + "loss": 0.7991, + "mean_token_accuracy": 0.7651127219200134, + "num_tokens": 9418417.0, + "step": 2770 + }, + { + "epoch": 0.027901561684531697, + "learning_rate": 0.00019442169496968967, + "loss": 0.8285, + "mean_token_accuracy": 0.7555812895298004, + "num_tokens": 9453247.0, + "step": 2780 + }, + { + "epoch": 0.02800192701433217, + "learning_rate": 0.0001944016219037296, + "loss": 0.8166, + "mean_token_accuracy": 0.758303964138031, + "num_tokens": 9487349.0, + "step": 2790 + }, + { + "epoch": 0.028102292344132643, + "learning_rate": 0.00019438154883776948, + "loss": 0.7975, + "mean_token_accuracy": 0.7672683656215668, + "num_tokens": 9521217.0, + "step": 2800 + }, + { + "epoch": 0.028202657673933117, + "learning_rate": 0.0001943614757718094, + "loss": 0.8159, + "mean_token_accuracy": 0.7600618541240692, + "num_tokens": 9554836.0, + "step": 2810 + }, + { + "epoch": 0.02830302300373359, + "learning_rate": 0.0001943414027058493, + "loss": 0.8429, + "mean_token_accuracy": 0.7548216879367828, + "num_tokens": 9589253.0, + "step": 2820 + }, + { + "epoch": 0.028403388333534063, + "learning_rate": 0.0001943213296398892, + "loss": 0.8392, + "mean_token_accuracy": 0.7594896078109741, + "num_tokens": 9623090.0, + "step": 2830 + }, + { + "epoch": 0.028503753663334536, + "learning_rate": 0.0001943012565739291, + "loss": 0.8061, + "mean_token_accuracy": 0.7643302738666534, + "num_tokens": 9656910.0, + "step": 2840 + }, + { + "epoch": 0.028604118993135013, + "learning_rate": 0.00019428118350796903, + "loss": 0.8187, + "mean_token_accuracy": 0.7644733011722564, + "num_tokens": 9689992.0, + "step": 2850 + }, + { + "epoch": 0.028704484322935486, + "learning_rate": 0.0001942611104420089, + "loss": 0.8526, + "mean_token_accuracy": 0.7513968527317048, + "num_tokens": 9723413.0, + "step": 2860 + }, + { + "epoch": 0.02880484965273596, + "learning_rate": 0.00019424103737604882, + "loss": 0.8517, + "mean_token_accuracy": 0.7544140577316284, + "num_tokens": 9757325.0, + "step": 2870 + }, + { + "epoch": 0.028905214982536433, + "learning_rate": 0.00019422096431008875, + "loss": 0.8198, + "mean_token_accuracy": 0.7595404148101806, + "num_tokens": 9791668.0, + "step": 2880 + }, + { + "epoch": 0.029005580312336906, + "learning_rate": 0.00019420089124412863, + "loss": 0.8164, + "mean_token_accuracy": 0.7569047451019287, + "num_tokens": 9826222.0, + "step": 2890 + }, + { + "epoch": 0.02910594564213738, + "learning_rate": 0.00019418081817816854, + "loss": 0.8688, + "mean_token_accuracy": 0.7560630202293396, + "num_tokens": 9860177.0, + "step": 2900 + }, + { + "epoch": 0.029206310971937852, + "learning_rate": 0.00019416074511220845, + "loss": 0.8121, + "mean_token_accuracy": 0.7619596660137177, + "num_tokens": 9894213.0, + "step": 2910 + }, + { + "epoch": 0.02930667630173833, + "learning_rate": 0.00019414067204624836, + "loss": 0.7963, + "mean_token_accuracy": 0.7662225306034088, + "num_tokens": 9927913.0, + "step": 2920 + }, + { + "epoch": 0.029407041631538802, + "learning_rate": 0.00019412059898028824, + "loss": 0.829, + "mean_token_accuracy": 0.7606053411960602, + "num_tokens": 9961850.0, + "step": 2930 + }, + { + "epoch": 0.029507406961339275, + "learning_rate": 0.00019410052591432817, + "loss": 0.8381, + "mean_token_accuracy": 0.7542055785655976, + "num_tokens": 9996592.0, + "step": 2940 + }, + { + "epoch": 0.02960777229113975, + "learning_rate": 0.00019408045284836806, + "loss": 0.8097, + "mean_token_accuracy": 0.7627164542675018, + "num_tokens": 10030623.0, + "step": 2950 + }, + { + "epoch": 0.029708137620940222, + "learning_rate": 0.00019406037978240796, + "loss": 0.8179, + "mean_token_accuracy": 0.759533429145813, + "num_tokens": 10065371.0, + "step": 2960 + }, + { + "epoch": 0.029808502950740695, + "learning_rate": 0.00019404030671644787, + "loss": 0.7864, + "mean_token_accuracy": 0.76891188621521, + "num_tokens": 10098693.0, + "step": 2970 + }, + { + "epoch": 0.02990886828054117, + "learning_rate": 0.00019402023365048778, + "loss": 0.8138, + "mean_token_accuracy": 0.7631476044654846, + "num_tokens": 10132077.0, + "step": 2980 + }, + { + "epoch": 0.030009233610341645, + "learning_rate": 0.0001940001605845277, + "loss": 0.8085, + "mean_token_accuracy": 0.7628714203834533, + "num_tokens": 10167034.0, + "step": 2990 + }, + { + "epoch": 0.030109598940142118, + "learning_rate": 0.0001939800875185676, + "loss": 0.8067, + "mean_token_accuracy": 0.76093710064888, + "num_tokens": 10200994.0, + "step": 3000 + }, + { + "epoch": 0.03020996426994259, + "learning_rate": 0.0001939600144526075, + "loss": 0.8056, + "mean_token_accuracy": 0.7656333386898041, + "num_tokens": 10235556.0, + "step": 3010 + }, + { + "epoch": 0.030310329599743065, + "learning_rate": 0.00019393994138664741, + "loss": 0.8413, + "mean_token_accuracy": 0.7463635027408599, + "num_tokens": 10269354.0, + "step": 3020 + }, + { + "epoch": 0.030410694929543538, + "learning_rate": 0.00019391986832068732, + "loss": 0.8107, + "mean_token_accuracy": 0.7647533237934112, + "num_tokens": 10303415.0, + "step": 3030 + }, + { + "epoch": 0.03051106025934401, + "learning_rate": 0.0001938997952547272, + "loss": 0.8596, + "mean_token_accuracy": 0.7526327192783355, + "num_tokens": 10336602.0, + "step": 3040 + }, + { + "epoch": 0.030611425589144484, + "learning_rate": 0.00019387972218876714, + "loss": 0.8229, + "mean_token_accuracy": 0.7578138887882233, + "num_tokens": 10369955.0, + "step": 3050 + }, + { + "epoch": 0.03071179091894496, + "learning_rate": 0.00019385964912280702, + "loss": 0.8348, + "mean_token_accuracy": 0.7555415332317352, + "num_tokens": 10404298.0, + "step": 3060 + }, + { + "epoch": 0.030812156248745434, + "learning_rate": 0.00019383957605684693, + "loss": 0.8314, + "mean_token_accuracy": 0.7591325759887695, + "num_tokens": 10438557.0, + "step": 3070 + }, + { + "epoch": 0.030912521578545907, + "learning_rate": 0.00019381950299088684, + "loss": 0.8409, + "mean_token_accuracy": 0.7593413949012756, + "num_tokens": 10472895.0, + "step": 3080 + }, + { + "epoch": 0.03101288690834638, + "learning_rate": 0.00019379942992492675, + "loss": 0.8414, + "mean_token_accuracy": 0.7592377960681915, + "num_tokens": 10507101.0, + "step": 3090 + }, + { + "epoch": 0.031113252238146854, + "learning_rate": 0.00019377935685896666, + "loss": 0.7824, + "mean_token_accuracy": 0.7731334388256073, + "num_tokens": 10541341.0, + "step": 3100 + }, + { + "epoch": 0.031213617567947327, + "learning_rate": 0.00019375928379300656, + "loss": 0.8333, + "mean_token_accuracy": 0.7570551693439483, + "num_tokens": 10575589.0, + "step": 3110 + }, + { + "epoch": 0.031313982897747804, + "learning_rate": 0.00019373921072704647, + "loss": 0.8084, + "mean_token_accuracy": 0.7645867586135864, + "num_tokens": 10609867.0, + "step": 3120 + }, + { + "epoch": 0.031414348227548274, + "learning_rate": 0.00019371913766108635, + "loss": 0.8437, + "mean_token_accuracy": 0.7533444285392761, + "num_tokens": 10643442.0, + "step": 3130 + }, + { + "epoch": 0.03151471355734875, + "learning_rate": 0.0001936990645951263, + "loss": 0.8101, + "mean_token_accuracy": 0.7585695147514343, + "num_tokens": 10677750.0, + "step": 3140 + }, + { + "epoch": 0.03161507888714922, + "learning_rate": 0.00019367899152916617, + "loss": 0.8215, + "mean_token_accuracy": 0.7583079099655151, + "num_tokens": 10711656.0, + "step": 3150 + }, + { + "epoch": 0.0317154442169497, + "learning_rate": 0.00019365891846320608, + "loss": 0.8354, + "mean_token_accuracy": 0.7559507787227631, + "num_tokens": 10745944.0, + "step": 3160 + }, + { + "epoch": 0.03181580954675017, + "learning_rate": 0.000193638845397246, + "loss": 0.8082, + "mean_token_accuracy": 0.7597402095794678, + "num_tokens": 10780421.0, + "step": 3170 + }, + { + "epoch": 0.03191617487655064, + "learning_rate": 0.0001936187723312859, + "loss": 0.8305, + "mean_token_accuracy": 0.7550306975841522, + "num_tokens": 10813665.0, + "step": 3180 + }, + { + "epoch": 0.03201654020635112, + "learning_rate": 0.00019359869926532578, + "loss": 0.8174, + "mean_token_accuracy": 0.7608563065528869, + "num_tokens": 10848641.0, + "step": 3190 + }, + { + "epoch": 0.03211690553615159, + "learning_rate": 0.0001935786261993657, + "loss": 0.8205, + "mean_token_accuracy": 0.7681922614574432, + "num_tokens": 10883127.0, + "step": 3200 + }, + { + "epoch": 0.032217270865952066, + "learning_rate": 0.0001935585531334056, + "loss": 0.8385, + "mean_token_accuracy": 0.7587725281715393, + "num_tokens": 10916869.0, + "step": 3210 + }, + { + "epoch": 0.032317636195752536, + "learning_rate": 0.0001935384800674455, + "loss": 0.8125, + "mean_token_accuracy": 0.7589336574077606, + "num_tokens": 10951318.0, + "step": 3220 + }, + { + "epoch": 0.03241800152555301, + "learning_rate": 0.00019351840700148544, + "loss": 0.8238, + "mean_token_accuracy": 0.7592109203338623, + "num_tokens": 10985495.0, + "step": 3230 + }, + { + "epoch": 0.03251836685535349, + "learning_rate": 0.00019349833393552532, + "loss": 0.8172, + "mean_token_accuracy": 0.7625975668430328, + "num_tokens": 11018921.0, + "step": 3240 + }, + { + "epoch": 0.03261873218515396, + "learning_rate": 0.00019347826086956523, + "loss": 0.8189, + "mean_token_accuracy": 0.7608864843845368, + "num_tokens": 11053086.0, + "step": 3250 + }, + { + "epoch": 0.032719097514954436, + "learning_rate": 0.00019345818780360514, + "loss": 0.788, + "mean_token_accuracy": 0.7709313690662384, + "num_tokens": 11086654.0, + "step": 3260 + }, + { + "epoch": 0.032819462844754906, + "learning_rate": 0.00019343811473764504, + "loss": 0.8214, + "mean_token_accuracy": 0.7595510005950927, + "num_tokens": 11120931.0, + "step": 3270 + }, + { + "epoch": 0.03291982817455538, + "learning_rate": 0.00019341804167168493, + "loss": 0.8331, + "mean_token_accuracy": 0.75942742228508, + "num_tokens": 11154413.0, + "step": 3280 + }, + { + "epoch": 0.03302019350435585, + "learning_rate": 0.00019339796860572486, + "loss": 0.7951, + "mean_token_accuracy": 0.7642982721328735, + "num_tokens": 11188382.0, + "step": 3290 + }, + { + "epoch": 0.03312055883415633, + "learning_rate": 0.00019337789553976474, + "loss": 0.8003, + "mean_token_accuracy": 0.7682574689388275, + "num_tokens": 11222513.0, + "step": 3300 + }, + { + "epoch": 0.033220924163956805, + "learning_rate": 0.00019335782247380465, + "loss": 0.7966, + "mean_token_accuracy": 0.7670561671257019, + "num_tokens": 11257447.0, + "step": 3310 + }, + { + "epoch": 0.033321289493757275, + "learning_rate": 0.00019333774940784456, + "loss": 0.8133, + "mean_token_accuracy": 0.7631431698799134, + "num_tokens": 11290812.0, + "step": 3320 + }, + { + "epoch": 0.03342165482355775, + "learning_rate": 0.00019331767634188447, + "loss": 0.8435, + "mean_token_accuracy": 0.7573554813861847, + "num_tokens": 11324627.0, + "step": 3330 + }, + { + "epoch": 0.03352202015335822, + "learning_rate": 0.00019329760327592438, + "loss": 0.8221, + "mean_token_accuracy": 0.7549627840518951, + "num_tokens": 11358198.0, + "step": 3340 + }, + { + "epoch": 0.0336223854831587, + "learning_rate": 0.00019327753020996428, + "loss": 0.79, + "mean_token_accuracy": 0.7678623855113983, + "num_tokens": 11392606.0, + "step": 3350 + }, + { + "epoch": 0.03372275081295917, + "learning_rate": 0.0001932574571440042, + "loss": 0.8377, + "mean_token_accuracy": 0.7548870742321014, + "num_tokens": 11427108.0, + "step": 3360 + }, + { + "epoch": 0.033823116142759645, + "learning_rate": 0.00019323738407804407, + "loss": 0.821, + "mean_token_accuracy": 0.7596335887908936, + "num_tokens": 11460882.0, + "step": 3370 + }, + { + "epoch": 0.03392348147256012, + "learning_rate": 0.000193217311012084, + "loss": 0.8233, + "mean_token_accuracy": 0.7633667171001435, + "num_tokens": 11495166.0, + "step": 3380 + }, + { + "epoch": 0.03402384680236059, + "learning_rate": 0.0001931972379461239, + "loss": 0.8403, + "mean_token_accuracy": 0.7576093554496766, + "num_tokens": 11528914.0, + "step": 3390 + }, + { + "epoch": 0.03412421213216107, + "learning_rate": 0.0001931771648801638, + "loss": 0.8033, + "mean_token_accuracy": 0.7655123353004456, + "num_tokens": 11562638.0, + "step": 3400 + }, + { + "epoch": 0.03422457746196154, + "learning_rate": 0.0001931570918142037, + "loss": 0.8692, + "mean_token_accuracy": 0.7498386919498443, + "num_tokens": 11596992.0, + "step": 3410 + }, + { + "epoch": 0.034324942791762014, + "learning_rate": 0.00019313701874824362, + "loss": 0.8059, + "mean_token_accuracy": 0.7620149791240692, + "num_tokens": 11630807.0, + "step": 3420 + }, + { + "epoch": 0.034425308121562484, + "learning_rate": 0.00019311694568228353, + "loss": 0.8336, + "mean_token_accuracy": 0.7583272874355316, + "num_tokens": 11664527.0, + "step": 3430 + }, + { + "epoch": 0.03452567345136296, + "learning_rate": 0.00019309687261632343, + "loss": 0.8161, + "mean_token_accuracy": 0.7626073122024536, + "num_tokens": 11698423.0, + "step": 3440 + }, + { + "epoch": 0.03462603878116344, + "learning_rate": 0.00019307679955036334, + "loss": 0.7976, + "mean_token_accuracy": 0.7633013188838959, + "num_tokens": 11732303.0, + "step": 3450 + }, + { + "epoch": 0.03472640411096391, + "learning_rate": 0.00019305672648440322, + "loss": 0.8361, + "mean_token_accuracy": 0.7670786142349243, + "num_tokens": 11766441.0, + "step": 3460 + }, + { + "epoch": 0.034826769440764384, + "learning_rate": 0.00019303665341844316, + "loss": 0.8558, + "mean_token_accuracy": 0.7520733714103699, + "num_tokens": 11800699.0, + "step": 3470 + }, + { + "epoch": 0.034927134770564854, + "learning_rate": 0.00019301658035248304, + "loss": 0.8169, + "mean_token_accuracy": 0.7605992496013642, + "num_tokens": 11834888.0, + "step": 3480 + }, + { + "epoch": 0.03502750010036533, + "learning_rate": 0.00019299650728652295, + "loss": 0.8118, + "mean_token_accuracy": 0.7634969353675842, + "num_tokens": 11869188.0, + "step": 3490 + }, + { + "epoch": 0.03512786543016581, + "learning_rate": 0.00019297643422056286, + "loss": 0.8435, + "mean_token_accuracy": 0.7566763997077942, + "num_tokens": 11903158.0, + "step": 3500 + }, + { + "epoch": 0.03522823075996628, + "learning_rate": 0.00019295636115460277, + "loss": 0.8218, + "mean_token_accuracy": 0.7639656007289887, + "num_tokens": 11936631.0, + "step": 3510 + }, + { + "epoch": 0.03532859608976675, + "learning_rate": 0.00019293628808864265, + "loss": 0.8302, + "mean_token_accuracy": 0.7581159353256226, + "num_tokens": 11971564.0, + "step": 3520 + }, + { + "epoch": 0.03542896141956722, + "learning_rate": 0.00019291621502268258, + "loss": 0.7918, + "mean_token_accuracy": 0.771466726064682, + "num_tokens": 12005548.0, + "step": 3530 + }, + { + "epoch": 0.0355293267493677, + "learning_rate": 0.00019289614195672246, + "loss": 0.8442, + "mean_token_accuracy": 0.7578944623470306, + "num_tokens": 12039494.0, + "step": 3540 + }, + { + "epoch": 0.03562969207916817, + "learning_rate": 0.00019287606889076237, + "loss": 0.8083, + "mean_token_accuracy": 0.7562072098255157, + "num_tokens": 12073597.0, + "step": 3550 + }, + { + "epoch": 0.035730057408968646, + "learning_rate": 0.00019285599582480228, + "loss": 0.7956, + "mean_token_accuracy": 0.769059157371521, + "num_tokens": 12107546.0, + "step": 3560 + }, + { + "epoch": 0.03583042273876912, + "learning_rate": 0.0001928359227588422, + "loss": 0.8408, + "mean_token_accuracy": 0.7596532464027405, + "num_tokens": 12141065.0, + "step": 3570 + }, + { + "epoch": 0.03593078806856959, + "learning_rate": 0.0001928158496928821, + "loss": 0.8233, + "mean_token_accuracy": 0.7560832560062408, + "num_tokens": 12174410.0, + "step": 3580 + }, + { + "epoch": 0.03603115339837007, + "learning_rate": 0.000192795776626922, + "loss": 0.8252, + "mean_token_accuracy": 0.7569872558116912, + "num_tokens": 12207748.0, + "step": 3590 + }, + { + "epoch": 0.03613151872817054, + "learning_rate": 0.00019277570356096191, + "loss": 0.8257, + "mean_token_accuracy": 0.7610264837741851, + "num_tokens": 12241312.0, + "step": 3600 + }, + { + "epoch": 0.036231884057971016, + "learning_rate": 0.00019275563049500182, + "loss": 0.8012, + "mean_token_accuracy": 0.7594651341438293, + "num_tokens": 12274973.0, + "step": 3610 + }, + { + "epoch": 0.036332249387771486, + "learning_rate": 0.00019273555742904173, + "loss": 0.8264, + "mean_token_accuracy": 0.7608615458011627, + "num_tokens": 12308354.0, + "step": 3620 + }, + { + "epoch": 0.03643261471757196, + "learning_rate": 0.0001927154843630816, + "loss": 0.8471, + "mean_token_accuracy": 0.7569738268852234, + "num_tokens": 12341595.0, + "step": 3630 + }, + { + "epoch": 0.03653298004737244, + "learning_rate": 0.00019269541129712155, + "loss": 0.8124, + "mean_token_accuracy": 0.7671969056129455, + "num_tokens": 12375909.0, + "step": 3640 + }, + { + "epoch": 0.03663334537717291, + "learning_rate": 0.00019267533823116143, + "loss": 0.83, + "mean_token_accuracy": 0.7595268547534942, + "num_tokens": 12409430.0, + "step": 3650 + }, + { + "epoch": 0.036733710706973385, + "learning_rate": 0.00019265526516520134, + "loss": 0.8292, + "mean_token_accuracy": 0.7604560315608978, + "num_tokens": 12443177.0, + "step": 3660 + }, + { + "epoch": 0.036834076036773855, + "learning_rate": 0.00019263519209924125, + "loss": 0.811, + "mean_token_accuracy": 0.7625544607639313, + "num_tokens": 12477266.0, + "step": 3670 + }, + { + "epoch": 0.03693444136657433, + "learning_rate": 0.00019261511903328115, + "loss": 0.8131, + "mean_token_accuracy": 0.7592061042785645, + "num_tokens": 12510949.0, + "step": 3680 + }, + { + "epoch": 0.0370348066963748, + "learning_rate": 0.00019259504596732106, + "loss": 0.8476, + "mean_token_accuracy": 0.7568705081939697, + "num_tokens": 12544909.0, + "step": 3690 + }, + { + "epoch": 0.03713517202617528, + "learning_rate": 0.00019257497290136097, + "loss": 0.8184, + "mean_token_accuracy": 0.7610429286956787, + "num_tokens": 12578295.0, + "step": 3700 + }, + { + "epoch": 0.037235537355975755, + "learning_rate": 0.00019255489983540088, + "loss": 0.8185, + "mean_token_accuracy": 0.7600680828094483, + "num_tokens": 12612334.0, + "step": 3710 + }, + { + "epoch": 0.037335902685776225, + "learning_rate": 0.00019253482676944076, + "loss": 0.7809, + "mean_token_accuracy": 0.7732314109802246, + "num_tokens": 12646883.0, + "step": 3720 + }, + { + "epoch": 0.0374362680155767, + "learning_rate": 0.0001925147537034807, + "loss": 0.8161, + "mean_token_accuracy": 0.7603020191192627, + "num_tokens": 12681201.0, + "step": 3730 + }, + { + "epoch": 0.03753663334537717, + "learning_rate": 0.00019249468063752058, + "loss": 0.8437, + "mean_token_accuracy": 0.755571311712265, + "num_tokens": 12714592.0, + "step": 3740 + }, + { + "epoch": 0.03763699867517765, + "learning_rate": 0.0001924746075715605, + "loss": 0.8964, + "mean_token_accuracy": 0.7415451884269715, + "num_tokens": 12748583.0, + "step": 3750 + }, + { + "epoch": 0.03773736400497812, + "learning_rate": 0.0001924545345056004, + "loss": 0.8537, + "mean_token_accuracy": 0.7552414834499359, + "num_tokens": 12781649.0, + "step": 3760 + }, + { + "epoch": 0.037837729334778594, + "learning_rate": 0.0001924344614396403, + "loss": 0.8194, + "mean_token_accuracy": 0.7623369455337524, + "num_tokens": 12814395.0, + "step": 3770 + }, + { + "epoch": 0.03793809466457907, + "learning_rate": 0.0001924143883736802, + "loss": 0.8169, + "mean_token_accuracy": 0.7644883871078492, + "num_tokens": 12847968.0, + "step": 3780 + }, + { + "epoch": 0.03803845999437954, + "learning_rate": 0.00019239431530772012, + "loss": 0.8128, + "mean_token_accuracy": 0.7627908825874329, + "num_tokens": 12882042.0, + "step": 3790 + }, + { + "epoch": 0.03813882532418002, + "learning_rate": 0.00019237424224176003, + "loss": 0.8135, + "mean_token_accuracy": 0.7674229919910431, + "num_tokens": 12915962.0, + "step": 3800 + }, + { + "epoch": 0.03823919065398049, + "learning_rate": 0.0001923541691757999, + "loss": 0.8152, + "mean_token_accuracy": 0.7644250571727753, + "num_tokens": 12950108.0, + "step": 3810 + }, + { + "epoch": 0.038339555983780964, + "learning_rate": 0.00019233409610983985, + "loss": 0.8407, + "mean_token_accuracy": 0.7574917793273925, + "num_tokens": 12983602.0, + "step": 3820 + }, + { + "epoch": 0.038439921313581434, + "learning_rate": 0.00019231402304387973, + "loss": 0.8331, + "mean_token_accuracy": 0.7552855551242829, + "num_tokens": 13017565.0, + "step": 3830 + }, + { + "epoch": 0.03854028664338191, + "learning_rate": 0.00019229394997791964, + "loss": 0.8185, + "mean_token_accuracy": 0.7646740972995758, + "num_tokens": 13051376.0, + "step": 3840 + }, + { + "epoch": 0.03864065197318239, + "learning_rate": 0.00019227387691195954, + "loss": 0.8064, + "mean_token_accuracy": 0.762885594367981, + "num_tokens": 13085818.0, + "step": 3850 + }, + { + "epoch": 0.03874101730298286, + "learning_rate": 0.00019225380384599945, + "loss": 0.79, + "mean_token_accuracy": 0.7621721744537353, + "num_tokens": 13119886.0, + "step": 3860 + }, + { + "epoch": 0.03884138263278333, + "learning_rate": 0.00019223373078003933, + "loss": 0.8072, + "mean_token_accuracy": 0.7587761878967285, + "num_tokens": 13154493.0, + "step": 3870 + }, + { + "epoch": 0.0389417479625838, + "learning_rate": 0.00019221365771407927, + "loss": 0.7764, + "mean_token_accuracy": 0.7698749780654908, + "num_tokens": 13188706.0, + "step": 3880 + }, + { + "epoch": 0.03904211329238428, + "learning_rate": 0.00019219358464811915, + "loss": 0.8168, + "mean_token_accuracy": 0.7628201723098755, + "num_tokens": 13222666.0, + "step": 3890 + }, + { + "epoch": 0.03914247862218475, + "learning_rate": 0.00019217351158215906, + "loss": 0.8126, + "mean_token_accuracy": 0.7653783857822418, + "num_tokens": 13256982.0, + "step": 3900 + }, + { + "epoch": 0.039242843951985226, + "learning_rate": 0.00019215343851619897, + "loss": 0.811, + "mean_token_accuracy": 0.7596830606460572, + "num_tokens": 13290715.0, + "step": 3910 + }, + { + "epoch": 0.0393432092817857, + "learning_rate": 0.00019213336545023888, + "loss": 0.8311, + "mean_token_accuracy": 0.758405339717865, + "num_tokens": 13325075.0, + "step": 3920 + }, + { + "epoch": 0.03944357461158617, + "learning_rate": 0.00019211329238427878, + "loss": 0.812, + "mean_token_accuracy": 0.7626287162303924, + "num_tokens": 13358187.0, + "step": 3930 + }, + { + "epoch": 0.03954393994138665, + "learning_rate": 0.0001920932193183187, + "loss": 0.8166, + "mean_token_accuracy": 0.7628508031368255, + "num_tokens": 13392473.0, + "step": 3940 + }, + { + "epoch": 0.03964430527118712, + "learning_rate": 0.0001920731462523586, + "loss": 0.8274, + "mean_token_accuracy": 0.7561886072158813, + "num_tokens": 13426117.0, + "step": 3950 + }, + { + "epoch": 0.039744670600987596, + "learning_rate": 0.00019205307318639848, + "loss": 0.8141, + "mean_token_accuracy": 0.7664759397506714, + "num_tokens": 13459599.0, + "step": 3960 + }, + { + "epoch": 0.039845035930788066, + "learning_rate": 0.00019203300012043842, + "loss": 0.809, + "mean_token_accuracy": 0.7616986215114594, + "num_tokens": 13493007.0, + "step": 3970 + }, + { + "epoch": 0.03994540126058854, + "learning_rate": 0.0001920129270544783, + "loss": 0.7988, + "mean_token_accuracy": 0.7667593657970428, + "num_tokens": 13526790.0, + "step": 3980 + }, + { + "epoch": 0.04004576659038902, + "learning_rate": 0.0001919928539885182, + "loss": 0.805, + "mean_token_accuracy": 0.7676305174827576, + "num_tokens": 13560353.0, + "step": 3990 + }, + { + "epoch": 0.04014613192018949, + "learning_rate": 0.00019197278092255812, + "loss": 0.8011, + "mean_token_accuracy": 0.7701820015907288, + "num_tokens": 13594409.0, + "step": 4000 + }, + { + "epoch": 0.040246497249989965, + "learning_rate": 0.00019195270785659802, + "loss": 0.8209, + "mean_token_accuracy": 0.7571946740150451, + "num_tokens": 13628492.0, + "step": 4010 + }, + { + "epoch": 0.040346862579790435, + "learning_rate": 0.00019193263479063793, + "loss": 0.8245, + "mean_token_accuracy": 0.7589803755283355, + "num_tokens": 13661763.0, + "step": 4020 + }, + { + "epoch": 0.04044722790959091, + "learning_rate": 0.00019191256172467784, + "loss": 0.814, + "mean_token_accuracy": 0.7596362948417663, + "num_tokens": 13695269.0, + "step": 4030 + }, + { + "epoch": 0.04054759323939138, + "learning_rate": 0.00019189248865871775, + "loss": 0.7936, + "mean_token_accuracy": 0.7661742925643921, + "num_tokens": 13728774.0, + "step": 4040 + }, + { + "epoch": 0.04064795856919186, + "learning_rate": 0.00019187241559275763, + "loss": 0.7932, + "mean_token_accuracy": 0.7682706117630005, + "num_tokens": 13762389.0, + "step": 4050 + }, + { + "epoch": 0.040748323898992335, + "learning_rate": 0.00019185234252679757, + "loss": 0.8024, + "mean_token_accuracy": 0.7650616884231567, + "num_tokens": 13796268.0, + "step": 4060 + }, + { + "epoch": 0.040848689228792805, + "learning_rate": 0.00019183226946083745, + "loss": 0.8043, + "mean_token_accuracy": 0.7669219195842742, + "num_tokens": 13829749.0, + "step": 4070 + }, + { + "epoch": 0.04094905455859328, + "learning_rate": 0.00019181219639487736, + "loss": 0.8131, + "mean_token_accuracy": 0.7608605742454528, + "num_tokens": 13863689.0, + "step": 4080 + }, + { + "epoch": 0.04104941988839375, + "learning_rate": 0.00019179212332891727, + "loss": 0.7973, + "mean_token_accuracy": 0.7637056112289429, + "num_tokens": 13897105.0, + "step": 4090 + }, + { + "epoch": 0.04114978521819423, + "learning_rate": 0.00019177205026295717, + "loss": 0.8293, + "mean_token_accuracy": 0.7573158740997314, + "num_tokens": 13930387.0, + "step": 4100 + }, + { + "epoch": 0.0412501505479947, + "learning_rate": 0.00019175197719699705, + "loss": 0.804, + "mean_token_accuracy": 0.7686714947223663, + "num_tokens": 13964275.0, + "step": 4110 + }, + { + "epoch": 0.041350515877795174, + "learning_rate": 0.000191731904131037, + "loss": 0.7523, + "mean_token_accuracy": 0.7722469091415405, + "num_tokens": 13998231.0, + "step": 4120 + }, + { + "epoch": 0.04145088120759565, + "learning_rate": 0.0001917118310650769, + "loss": 0.7834, + "mean_token_accuracy": 0.7652732789516449, + "num_tokens": 14032704.0, + "step": 4130 + }, + { + "epoch": 0.04155124653739612, + "learning_rate": 0.00019169175799911678, + "loss": 0.7995, + "mean_token_accuracy": 0.7662194430828094, + "num_tokens": 14066622.0, + "step": 4140 + }, + { + "epoch": 0.0416516118671966, + "learning_rate": 0.00019167168493315672, + "loss": 0.8139, + "mean_token_accuracy": 0.7601560235023499, + "num_tokens": 14101121.0, + "step": 4150 + }, + { + "epoch": 0.04175197719699707, + "learning_rate": 0.0001916516118671966, + "loss": 0.8401, + "mean_token_accuracy": 0.7569827854633331, + "num_tokens": 14135345.0, + "step": 4160 + }, + { + "epoch": 0.041852342526797544, + "learning_rate": 0.00019163153880123653, + "loss": 0.7911, + "mean_token_accuracy": 0.7664677023887634, + "num_tokens": 14169416.0, + "step": 4170 + }, + { + "epoch": 0.041952707856598014, + "learning_rate": 0.00019161146573527641, + "loss": 0.7994, + "mean_token_accuracy": 0.7639586329460144, + "num_tokens": 14204283.0, + "step": 4180 + }, + { + "epoch": 0.04205307318639849, + "learning_rate": 0.00019159139266931632, + "loss": 0.7728, + "mean_token_accuracy": 0.7709622740745544, + "num_tokens": 14239003.0, + "step": 4190 + }, + { + "epoch": 0.04215343851619897, + "learning_rate": 0.00019157131960335623, + "loss": 0.8221, + "mean_token_accuracy": 0.758518660068512, + "num_tokens": 14272386.0, + "step": 4200 + }, + { + "epoch": 0.04225380384599944, + "learning_rate": 0.00019155124653739614, + "loss": 0.8204, + "mean_token_accuracy": 0.7598104774951935, + "num_tokens": 14305825.0, + "step": 4210 + }, + { + "epoch": 0.04235416917579991, + "learning_rate": 0.00019153117347143602, + "loss": 0.8086, + "mean_token_accuracy": 0.7655596077442169, + "num_tokens": 14340525.0, + "step": 4220 + }, + { + "epoch": 0.04245453450560038, + "learning_rate": 0.00019151110040547596, + "loss": 0.8273, + "mean_token_accuracy": 0.7571021318435669, + "num_tokens": 14374981.0, + "step": 4230 + }, + { + "epoch": 0.04255489983540086, + "learning_rate": 0.00019149102733951584, + "loss": 0.7844, + "mean_token_accuracy": 0.7691513001918793, + "num_tokens": 14408364.0, + "step": 4240 + }, + { + "epoch": 0.04265526516520133, + "learning_rate": 0.00019147095427355575, + "loss": 0.8186, + "mean_token_accuracy": 0.7621715486049652, + "num_tokens": 14441851.0, + "step": 4250 + }, + { + "epoch": 0.042755630495001806, + "learning_rate": 0.00019145088120759565, + "loss": 0.8229, + "mean_token_accuracy": 0.762150514125824, + "num_tokens": 14475783.0, + "step": 4260 + }, + { + "epoch": 0.04285599582480228, + "learning_rate": 0.00019143080814163556, + "loss": 0.8216, + "mean_token_accuracy": 0.7614712715148926, + "num_tokens": 14509383.0, + "step": 4270 + }, + { + "epoch": 0.04295636115460275, + "learning_rate": 0.00019141073507567547, + "loss": 0.8182, + "mean_token_accuracy": 0.7644801437854767, + "num_tokens": 14543595.0, + "step": 4280 + }, + { + "epoch": 0.04305672648440323, + "learning_rate": 0.00019139066200971538, + "loss": 0.7619, + "mean_token_accuracy": 0.781198114156723, + "num_tokens": 14577480.0, + "step": 4290 + }, + { + "epoch": 0.0431570918142037, + "learning_rate": 0.0001913705889437553, + "loss": 0.7718, + "mean_token_accuracy": 0.7747524976730347, + "num_tokens": 14612021.0, + "step": 4300 + }, + { + "epoch": 0.043257457144004176, + "learning_rate": 0.00019135051587779517, + "loss": 0.8136, + "mean_token_accuracy": 0.7664998054504395, + "num_tokens": 14646010.0, + "step": 4310 + }, + { + "epoch": 0.043357822473804646, + "learning_rate": 0.0001913304428118351, + "loss": 0.7982, + "mean_token_accuracy": 0.7697717070579528, + "num_tokens": 14679159.0, + "step": 4320 + }, + { + "epoch": 0.04345818780360512, + "learning_rate": 0.00019131036974587499, + "loss": 0.8073, + "mean_token_accuracy": 0.7655534505844116, + "num_tokens": 14712845.0, + "step": 4330 + }, + { + "epoch": 0.0435585531334056, + "learning_rate": 0.0001912902966799149, + "loss": 0.8319, + "mean_token_accuracy": 0.760830146074295, + "num_tokens": 14747070.0, + "step": 4340 + }, + { + "epoch": 0.04365891846320607, + "learning_rate": 0.0001912702236139548, + "loss": 0.8218, + "mean_token_accuracy": 0.7607136905193329, + "num_tokens": 14780892.0, + "step": 4350 + }, + { + "epoch": 0.043759283793006545, + "learning_rate": 0.0001912501505479947, + "loss": 0.821, + "mean_token_accuracy": 0.7604890406131745, + "num_tokens": 14814844.0, + "step": 4360 + }, + { + "epoch": 0.043859649122807015, + "learning_rate": 0.00019123007748203462, + "loss": 0.8344, + "mean_token_accuracy": 0.7620271623134613, + "num_tokens": 14849397.0, + "step": 4370 + }, + { + "epoch": 0.04396001445260749, + "learning_rate": 0.00019121000441607453, + "loss": 0.8168, + "mean_token_accuracy": 0.7646451532840729, + "num_tokens": 14884507.0, + "step": 4380 + }, + { + "epoch": 0.04406037978240796, + "learning_rate": 0.00019118993135011444, + "loss": 0.8326, + "mean_token_accuracy": 0.7582274377346039, + "num_tokens": 14917952.0, + "step": 4390 + }, + { + "epoch": 0.04416074511220844, + "learning_rate": 0.00019116985828415432, + "loss": 0.7943, + "mean_token_accuracy": 0.7630038142204285, + "num_tokens": 14951593.0, + "step": 4400 + }, + { + "epoch": 0.044261110442008915, + "learning_rate": 0.00019114978521819425, + "loss": 0.8004, + "mean_token_accuracy": 0.7646883130073547, + "num_tokens": 14986092.0, + "step": 4410 + }, + { + "epoch": 0.044361475771809385, + "learning_rate": 0.00019112971215223414, + "loss": 0.7422, + "mean_token_accuracy": 0.7789775013923645, + "num_tokens": 15020485.0, + "step": 4420 + }, + { + "epoch": 0.04446184110160986, + "learning_rate": 0.00019110963908627404, + "loss": 0.8134, + "mean_token_accuracy": 0.7608291804790497, + "num_tokens": 15054328.0, + "step": 4430 + }, + { + "epoch": 0.04456220643141033, + "learning_rate": 0.00019108956602031395, + "loss": 0.8157, + "mean_token_accuracy": 0.7607727348804474, + "num_tokens": 15088045.0, + "step": 4440 + }, + { + "epoch": 0.04466257176121081, + "learning_rate": 0.00019106949295435386, + "loss": 0.8194, + "mean_token_accuracy": 0.7610091507434845, + "num_tokens": 15120903.0, + "step": 4450 + }, + { + "epoch": 0.044762937091011284, + "learning_rate": 0.00019104941988839374, + "loss": 0.8549, + "mean_token_accuracy": 0.7528641760349274, + "num_tokens": 15154821.0, + "step": 4460 + }, + { + "epoch": 0.044863302420811754, + "learning_rate": 0.00019102934682243368, + "loss": 0.7874, + "mean_token_accuracy": 0.7704406261444092, + "num_tokens": 15188544.0, + "step": 4470 + }, + { + "epoch": 0.04496366775061223, + "learning_rate": 0.00019100927375647359, + "loss": 0.8244, + "mean_token_accuracy": 0.7597645819187164, + "num_tokens": 15222804.0, + "step": 4480 + }, + { + "epoch": 0.0450640330804127, + "learning_rate": 0.00019098920069051347, + "loss": 0.7967, + "mean_token_accuracy": 0.7645935952663422, + "num_tokens": 15257498.0, + "step": 4490 + }, + { + "epoch": 0.04516439841021318, + "learning_rate": 0.0001909691276245534, + "loss": 0.7711, + "mean_token_accuracy": 0.7738887727260589, + "num_tokens": 15291150.0, + "step": 4500 + }, + { + "epoch": 0.04526476374001365, + "learning_rate": 0.00019094905455859328, + "loss": 0.8196, + "mean_token_accuracy": 0.7628287553787232, + "num_tokens": 15325608.0, + "step": 4510 + }, + { + "epoch": 0.045365129069814124, + "learning_rate": 0.0001909289814926332, + "loss": 0.8097, + "mean_token_accuracy": 0.7615756452083587, + "num_tokens": 15359817.0, + "step": 4520 + }, + { + "epoch": 0.0454654943996146, + "learning_rate": 0.0001909089084266731, + "loss": 0.7865, + "mean_token_accuracy": 0.7654139697551727, + "num_tokens": 15393899.0, + "step": 4530 + }, + { + "epoch": 0.04556585972941507, + "learning_rate": 0.000190888835360713, + "loss": 0.8154, + "mean_token_accuracy": 0.7623386085033417, + "num_tokens": 15427234.0, + "step": 4540 + }, + { + "epoch": 0.04566622505921555, + "learning_rate": 0.0001908687622947529, + "loss": 0.8044, + "mean_token_accuracy": 0.7596213340759277, + "num_tokens": 15460609.0, + "step": 4550 + }, + { + "epoch": 0.04576659038901602, + "learning_rate": 0.00019084868922879283, + "loss": 0.7949, + "mean_token_accuracy": 0.7677416563034057, + "num_tokens": 15494983.0, + "step": 4560 + }, + { + "epoch": 0.04586695571881649, + "learning_rate": 0.0001908286161628327, + "loss": 0.7998, + "mean_token_accuracy": 0.759462857246399, + "num_tokens": 15527836.0, + "step": 4570 + }, + { + "epoch": 0.04596732104861696, + "learning_rate": 0.00019080854309687262, + "loss": 0.8461, + "mean_token_accuracy": 0.7568655669689178, + "num_tokens": 15561348.0, + "step": 4580 + }, + { + "epoch": 0.04606768637841744, + "learning_rate": 0.00019078847003091252, + "loss": 0.8358, + "mean_token_accuracy": 0.7562499463558197, + "num_tokens": 15595890.0, + "step": 4590 + }, + { + "epoch": 0.046168051708217916, + "learning_rate": 0.00019076839696495243, + "loss": 0.841, + "mean_token_accuracy": 0.7540477454662323, + "num_tokens": 15630814.0, + "step": 4600 + }, + { + "epoch": 0.046268417038018386, + "learning_rate": 0.00019074832389899234, + "loss": 0.8379, + "mean_token_accuracy": 0.7596671104431152, + "num_tokens": 15665342.0, + "step": 4610 + }, + { + "epoch": 0.04636878236781886, + "learning_rate": 0.00019072825083303225, + "loss": 0.7917, + "mean_token_accuracy": 0.7665965020656585, + "num_tokens": 15699006.0, + "step": 4620 + }, + { + "epoch": 0.04646914769761933, + "learning_rate": 0.00019070817776707216, + "loss": 0.806, + "mean_token_accuracy": 0.7658841371536255, + "num_tokens": 15733812.0, + "step": 4630 + }, + { + "epoch": 0.04656951302741981, + "learning_rate": 0.00019068810470111204, + "loss": 0.7696, + "mean_token_accuracy": 0.7712407052516937, + "num_tokens": 15768185.0, + "step": 4640 + }, + { + "epoch": 0.04666987835722028, + "learning_rate": 0.00019066803163515197, + "loss": 0.7868, + "mean_token_accuracy": 0.7670133650302887, + "num_tokens": 15802046.0, + "step": 4650 + }, + { + "epoch": 0.046770243687020756, + "learning_rate": 0.00019064795856919186, + "loss": 0.8039, + "mean_token_accuracy": 0.7610798418521881, + "num_tokens": 15836439.0, + "step": 4660 + }, + { + "epoch": 0.04687060901682123, + "learning_rate": 0.00019062788550323176, + "loss": 0.7943, + "mean_token_accuracy": 0.7643402874469757, + "num_tokens": 15869996.0, + "step": 4670 + }, + { + "epoch": 0.0469709743466217, + "learning_rate": 0.00019060781243727167, + "loss": 0.826, + "mean_token_accuracy": 0.7603221535682678, + "num_tokens": 15903732.0, + "step": 4680 + }, + { + "epoch": 0.04707133967642218, + "learning_rate": 0.00019058773937131158, + "loss": 0.7764, + "mean_token_accuracy": 0.7736131608486175, + "num_tokens": 15938228.0, + "step": 4690 + }, + { + "epoch": 0.04717170500622265, + "learning_rate": 0.0001905676663053515, + "loss": 0.8019, + "mean_token_accuracy": 0.7617711782455444, + "num_tokens": 15971639.0, + "step": 4700 + }, + { + "epoch": 0.047272070336023125, + "learning_rate": 0.0001905475932393914, + "loss": 0.8024, + "mean_token_accuracy": 0.765626859664917, + "num_tokens": 16005456.0, + "step": 4710 + }, + { + "epoch": 0.047372435665823595, + "learning_rate": 0.0001905275201734313, + "loss": 0.8245, + "mean_token_accuracy": 0.7578832507133484, + "num_tokens": 16039943.0, + "step": 4720 + }, + { + "epoch": 0.04747280099562407, + "learning_rate": 0.00019050744710747122, + "loss": 0.8159, + "mean_token_accuracy": 0.7593542397022247, + "num_tokens": 16073997.0, + "step": 4730 + }, + { + "epoch": 0.04757316632542455, + "learning_rate": 0.00019048737404151112, + "loss": 0.8401, + "mean_token_accuracy": 0.7576812863349914, + "num_tokens": 16108978.0, + "step": 4740 + }, + { + "epoch": 0.04767353165522502, + "learning_rate": 0.000190467300975551, + "loss": 0.802, + "mean_token_accuracy": 0.7665064334869385, + "num_tokens": 16143274.0, + "step": 4750 + }, + { + "epoch": 0.047773896985025495, + "learning_rate": 0.00019044722790959094, + "loss": 0.7668, + "mean_token_accuracy": 0.7717243552207946, + "num_tokens": 16177844.0, + "step": 4760 + }, + { + "epoch": 0.047874262314825965, + "learning_rate": 0.00019042715484363082, + "loss": 0.8272, + "mean_token_accuracy": 0.7543803930282593, + "num_tokens": 16212293.0, + "step": 4770 + }, + { + "epoch": 0.04797462764462644, + "learning_rate": 0.00019040708177767073, + "loss": 0.7838, + "mean_token_accuracy": 0.766845291852951, + "num_tokens": 16246046.0, + "step": 4780 + }, + { + "epoch": 0.04807499297442691, + "learning_rate": 0.00019038700871171064, + "loss": 0.7978, + "mean_token_accuracy": 0.764685869216919, + "num_tokens": 16279922.0, + "step": 4790 + }, + { + "epoch": 0.04817535830422739, + "learning_rate": 0.00019036693564575055, + "loss": 0.8131, + "mean_token_accuracy": 0.762106591463089, + "num_tokens": 16313301.0, + "step": 4800 + }, + { + "epoch": 0.048275723634027864, + "learning_rate": 0.00019034686257979043, + "loss": 0.7785, + "mean_token_accuracy": 0.762081903219223, + "num_tokens": 16347030.0, + "step": 4810 + }, + { + "epoch": 0.048376088963828334, + "learning_rate": 0.00019032678951383036, + "loss": 0.8192, + "mean_token_accuracy": 0.7583778619766235, + "num_tokens": 16380294.0, + "step": 4820 + }, + { + "epoch": 0.04847645429362881, + "learning_rate": 0.00019030671644787027, + "loss": 0.8274, + "mean_token_accuracy": 0.7571999251842498, + "num_tokens": 16414833.0, + "step": 4830 + }, + { + "epoch": 0.04857681962342928, + "learning_rate": 0.00019028664338191015, + "loss": 0.808, + "mean_token_accuracy": 0.7681930124759674, + "num_tokens": 16448628.0, + "step": 4840 + }, + { + "epoch": 0.04867718495322976, + "learning_rate": 0.0001902665703159501, + "loss": 0.7956, + "mean_token_accuracy": 0.7681915581226348, + "num_tokens": 16482605.0, + "step": 4850 + }, + { + "epoch": 0.04877755028303023, + "learning_rate": 0.00019024649724998997, + "loss": 0.7698, + "mean_token_accuracy": 0.7775806069374085, + "num_tokens": 16516846.0, + "step": 4860 + }, + { + "epoch": 0.048877915612830704, + "learning_rate": 0.00019022642418402988, + "loss": 0.8486, + "mean_token_accuracy": 0.7511551916599274, + "num_tokens": 16550932.0, + "step": 4870 + }, + { + "epoch": 0.04897828094263118, + "learning_rate": 0.0001902063511180698, + "loss": 0.785, + "mean_token_accuracy": 0.7689824163913727, + "num_tokens": 16585156.0, + "step": 4880 + }, + { + "epoch": 0.04907864627243165, + "learning_rate": 0.0001901862780521097, + "loss": 0.8578, + "mean_token_accuracy": 0.7557364404201508, + "num_tokens": 16619347.0, + "step": 4890 + }, + { + "epoch": 0.04917901160223213, + "learning_rate": 0.00019016620498614958, + "loss": 0.7943, + "mean_token_accuracy": 0.7654554963111877, + "num_tokens": 16652773.0, + "step": 4900 + }, + { + "epoch": 0.0492793769320326, + "learning_rate": 0.0001901461319201895, + "loss": 0.8235, + "mean_token_accuracy": 0.7565623998641968, + "num_tokens": 16686677.0, + "step": 4910 + }, + { + "epoch": 0.04937974226183307, + "learning_rate": 0.0001901260588542294, + "loss": 0.7759, + "mean_token_accuracy": 0.7688578844070435, + "num_tokens": 16720701.0, + "step": 4920 + }, + { + "epoch": 0.04948010759163354, + "learning_rate": 0.0001901059857882693, + "loss": 0.8117, + "mean_token_accuracy": 0.761589401960373, + "num_tokens": 16754870.0, + "step": 4930 + }, + { + "epoch": 0.04958047292143402, + "learning_rate": 0.0001900859127223092, + "loss": 0.8042, + "mean_token_accuracy": 0.7648223102092743, + "num_tokens": 16789281.0, + "step": 4940 + }, + { + "epoch": 0.049680838251234496, + "learning_rate": 0.00019006583965634912, + "loss": 0.8184, + "mean_token_accuracy": 0.7596215605735779, + "num_tokens": 16823379.0, + "step": 4950 + }, + { + "epoch": 0.049781203581034966, + "learning_rate": 0.00019004576659038903, + "loss": 0.8424, + "mean_token_accuracy": 0.7572415292263031, + "num_tokens": 16856561.0, + "step": 4960 + }, + { + "epoch": 0.04988156891083544, + "learning_rate": 0.00019002569352442894, + "loss": 0.8194, + "mean_token_accuracy": 0.7631000757217408, + "num_tokens": 16889736.0, + "step": 4970 + }, + { + "epoch": 0.04998193424063591, + "learning_rate": 0.00019000562045846884, + "loss": 0.811, + "mean_token_accuracy": 0.7635967433452606, + "num_tokens": 16922931.0, + "step": 4980 + }, + { + "epoch": 0.05008229957043639, + "learning_rate": 0.00018998554739250873, + "loss": 0.7788, + "mean_token_accuracy": 0.7682659387588501, + "num_tokens": 16957466.0, + "step": 4990 + }, + { + "epoch": 0.05018266490023686, + "learning_rate": 0.00018996547432654866, + "loss": 0.7996, + "mean_token_accuracy": 0.7649333596229553, + "num_tokens": 16991761.0, + "step": 5000 + }, + { + "epoch": 0.050283030230037336, + "learning_rate": 0.00018994540126058854, + "loss": 0.8438, + "mean_token_accuracy": 0.7554546117782592, + "num_tokens": 17026294.0, + "step": 5010 + }, + { + "epoch": 0.05038339555983781, + "learning_rate": 0.00018992532819462845, + "loss": 0.8006, + "mean_token_accuracy": 0.7630142390727996, + "num_tokens": 17060231.0, + "step": 5020 + }, + { + "epoch": 0.05048376088963828, + "learning_rate": 0.00018990525512866836, + "loss": 0.7855, + "mean_token_accuracy": 0.7714180409908294, + "num_tokens": 17095013.0, + "step": 5030 + }, + { + "epoch": 0.05058412621943876, + "learning_rate": 0.00018988518206270827, + "loss": 0.821, + "mean_token_accuracy": 0.7537748515605927, + "num_tokens": 17128747.0, + "step": 5040 + }, + { + "epoch": 0.05068449154923923, + "learning_rate": 0.00018986510899674818, + "loss": 0.8498, + "mean_token_accuracy": 0.7544196486473084, + "num_tokens": 17162701.0, + "step": 5050 + }, + { + "epoch": 0.050784856879039705, + "learning_rate": 0.00018984503593078809, + "loss": 0.7982, + "mean_token_accuracy": 0.7683187246322631, + "num_tokens": 17196760.0, + "step": 5060 + }, + { + "epoch": 0.050885222208840175, + "learning_rate": 0.000189824962864828, + "loss": 0.8024, + "mean_token_accuracy": 0.7660270392894745, + "num_tokens": 17230284.0, + "step": 5070 + }, + { + "epoch": 0.05098558753864065, + "learning_rate": 0.00018980488979886787, + "loss": 0.821, + "mean_token_accuracy": 0.7614680528640747, + "num_tokens": 17264549.0, + "step": 5080 + }, + { + "epoch": 0.05108595286844113, + "learning_rate": 0.0001897848167329078, + "loss": 0.8164, + "mean_token_accuracy": 0.7596682369709015, + "num_tokens": 17298632.0, + "step": 5090 + }, + { + "epoch": 0.0511863181982416, + "learning_rate": 0.0001897647436669477, + "loss": 0.8164, + "mean_token_accuracy": 0.7643806874752045, + "num_tokens": 17332557.0, + "step": 5100 + }, + { + "epoch": 0.051286683528042075, + "learning_rate": 0.0001897446706009876, + "loss": 0.8234, + "mean_token_accuracy": 0.7651040554046631, + "num_tokens": 17365809.0, + "step": 5110 + }, + { + "epoch": 0.051387048857842545, + "learning_rate": 0.0001897245975350275, + "loss": 0.8118, + "mean_token_accuracy": 0.7640089511871337, + "num_tokens": 17400122.0, + "step": 5120 + }, + { + "epoch": 0.05148741418764302, + "learning_rate": 0.00018970452446906742, + "loss": 0.7918, + "mean_token_accuracy": 0.7671834468841553, + "num_tokens": 17434037.0, + "step": 5130 + }, + { + "epoch": 0.05158777951744349, + "learning_rate": 0.0001896844514031073, + "loss": 0.7833, + "mean_token_accuracy": 0.7701202273368836, + "num_tokens": 17467825.0, + "step": 5140 + }, + { + "epoch": 0.05168814484724397, + "learning_rate": 0.00018966437833714723, + "loss": 0.7972, + "mean_token_accuracy": 0.7589609801769257, + "num_tokens": 17501028.0, + "step": 5150 + }, + { + "epoch": 0.051788510177044444, + "learning_rate": 0.00018964430527118712, + "loss": 0.8106, + "mean_token_accuracy": 0.7608213603496552, + "num_tokens": 17535782.0, + "step": 5160 + }, + { + "epoch": 0.051888875506844914, + "learning_rate": 0.00018962423220522702, + "loss": 0.8292, + "mean_token_accuracy": 0.7518568873405457, + "num_tokens": 17569420.0, + "step": 5170 + }, + { + "epoch": 0.05198924083664539, + "learning_rate": 0.00018960415913926696, + "loss": 0.8025, + "mean_token_accuracy": 0.7592430770397186, + "num_tokens": 17603583.0, + "step": 5180 + }, + { + "epoch": 0.05208960616644586, + "learning_rate": 0.00018958408607330684, + "loss": 0.8245, + "mean_token_accuracy": 0.7620608747005463, + "num_tokens": 17637921.0, + "step": 5190 + }, + { + "epoch": 0.05218997149624634, + "learning_rate": 0.00018956401300734675, + "loss": 0.8265, + "mean_token_accuracy": 0.7579002261161805, + "num_tokens": 17671881.0, + "step": 5200 + }, + { + "epoch": 0.05229033682604681, + "learning_rate": 0.00018954393994138666, + "loss": 0.7723, + "mean_token_accuracy": 0.776001226902008, + "num_tokens": 17705190.0, + "step": 5210 + }, + { + "epoch": 0.052390702155847284, + "learning_rate": 0.00018952386687542657, + "loss": 0.8015, + "mean_token_accuracy": 0.7666917979717255, + "num_tokens": 17738155.0, + "step": 5220 + }, + { + "epoch": 0.05249106748564776, + "learning_rate": 0.00018950379380946645, + "loss": 0.7992, + "mean_token_accuracy": 0.7608095228672027, + "num_tokens": 17772226.0, + "step": 5230 + }, + { + "epoch": 0.05259143281544823, + "learning_rate": 0.00018948372074350638, + "loss": 0.7702, + "mean_token_accuracy": 0.777134358882904, + "num_tokens": 17805812.0, + "step": 5240 + }, + { + "epoch": 0.05269179814524871, + "learning_rate": 0.00018946364767754626, + "loss": 0.8004, + "mean_token_accuracy": 0.7648840487003327, + "num_tokens": 17841031.0, + "step": 5250 + }, + { + "epoch": 0.05279216347504918, + "learning_rate": 0.00018944357461158617, + "loss": 0.8193, + "mean_token_accuracy": 0.7593564450740814, + "num_tokens": 17875531.0, + "step": 5260 + }, + { + "epoch": 0.05289252880484965, + "learning_rate": 0.00018942350154562608, + "loss": 0.8054, + "mean_token_accuracy": 0.7660769641399383, + "num_tokens": 17909494.0, + "step": 5270 + }, + { + "epoch": 0.05299289413465012, + "learning_rate": 0.000189403428479666, + "loss": 0.8046, + "mean_token_accuracy": 0.7677799701690674, + "num_tokens": 17944588.0, + "step": 5280 + }, + { + "epoch": 0.0530932594644506, + "learning_rate": 0.0001893833554137059, + "loss": 0.8204, + "mean_token_accuracy": 0.7590183019638062, + "num_tokens": 17978905.0, + "step": 5290 + }, + { + "epoch": 0.053193624794251076, + "learning_rate": 0.0001893632823477458, + "loss": 0.8164, + "mean_token_accuracy": 0.7615972459316254, + "num_tokens": 18013101.0, + "step": 5300 + }, + { + "epoch": 0.053293990124051546, + "learning_rate": 0.00018934320928178571, + "loss": 0.8286, + "mean_token_accuracy": 0.7581937134265899, + "num_tokens": 18046969.0, + "step": 5310 + }, + { + "epoch": 0.05339435545385202, + "learning_rate": 0.00018932313621582562, + "loss": 0.8018, + "mean_token_accuracy": 0.7623614311218262, + "num_tokens": 18079866.0, + "step": 5320 + }, + { + "epoch": 0.05349472078365249, + "learning_rate": 0.00018930306314986553, + "loss": 0.8099, + "mean_token_accuracy": 0.7652176499366761, + "num_tokens": 18114087.0, + "step": 5330 + }, + { + "epoch": 0.05359508611345297, + "learning_rate": 0.0001892829900839054, + "loss": 0.7845, + "mean_token_accuracy": 0.7658193945884705, + "num_tokens": 18147960.0, + "step": 5340 + }, + { + "epoch": 0.05369545144325344, + "learning_rate": 0.00018926291701794535, + "loss": 0.8017, + "mean_token_accuracy": 0.7609344720840454, + "num_tokens": 18181170.0, + "step": 5350 + }, + { + "epoch": 0.053795816773053916, + "learning_rate": 0.00018924284395198523, + "loss": 0.8241, + "mean_token_accuracy": 0.761503380537033, + "num_tokens": 18216036.0, + "step": 5360 + }, + { + "epoch": 0.05389618210285439, + "learning_rate": 0.00018922277088602514, + "loss": 0.7819, + "mean_token_accuracy": 0.7689382612705231, + "num_tokens": 18249563.0, + "step": 5370 + }, + { + "epoch": 0.05399654743265486, + "learning_rate": 0.00018920269782006505, + "loss": 0.7923, + "mean_token_accuracy": 0.7651596367359161, + "num_tokens": 18282234.0, + "step": 5380 + }, + { + "epoch": 0.05409691276245534, + "learning_rate": 0.00018918262475410496, + "loss": 0.8435, + "mean_token_accuracy": 0.7542744994163513, + "num_tokens": 18315301.0, + "step": 5390 + }, + { + "epoch": 0.05419727809225581, + "learning_rate": 0.00018916255168814486, + "loss": 0.805, + "mean_token_accuracy": 0.7645738780498504, + "num_tokens": 18349370.0, + "step": 5400 + }, + { + "epoch": 0.054297643422056285, + "learning_rate": 0.00018914247862218477, + "loss": 0.837, + "mean_token_accuracy": 0.7534904599189758, + "num_tokens": 18383501.0, + "step": 5410 + }, + { + "epoch": 0.05439800875185676, + "learning_rate": 0.00018912240555622468, + "loss": 0.7729, + "mean_token_accuracy": 0.7718036055564881, + "num_tokens": 18417804.0, + "step": 5420 + }, + { + "epoch": 0.05449837408165723, + "learning_rate": 0.00018910233249026456, + "loss": 0.8023, + "mean_token_accuracy": 0.7666881501674652, + "num_tokens": 18450802.0, + "step": 5430 + }, + { + "epoch": 0.05459873941145771, + "learning_rate": 0.0001890822594243045, + "loss": 0.8038, + "mean_token_accuracy": 0.7667160868644715, + "num_tokens": 18485355.0, + "step": 5440 + }, + { + "epoch": 0.05469910474125818, + "learning_rate": 0.00018906218635834438, + "loss": 0.8123, + "mean_token_accuracy": 0.761625474691391, + "num_tokens": 18519045.0, + "step": 5450 + }, + { + "epoch": 0.054799470071058655, + "learning_rate": 0.0001890421132923843, + "loss": 0.8261, + "mean_token_accuracy": 0.7566151797771454, + "num_tokens": 18553858.0, + "step": 5460 + }, + { + "epoch": 0.054899835400859125, + "learning_rate": 0.0001890220402264242, + "loss": 0.8256, + "mean_token_accuracy": 0.7587904393672943, + "num_tokens": 18587941.0, + "step": 5470 + }, + { + "epoch": 0.0550002007306596, + "learning_rate": 0.0001890019671604641, + "loss": 0.829, + "mean_token_accuracy": 0.7643349528312683, + "num_tokens": 18621442.0, + "step": 5480 + }, + { + "epoch": 0.05510056606046008, + "learning_rate": 0.00018898189409450399, + "loss": 0.7805, + "mean_token_accuracy": 0.7764574468135834, + "num_tokens": 18655346.0, + "step": 5490 + }, + { + "epoch": 0.05520093139026055, + "learning_rate": 0.00018896182102854392, + "loss": 0.7657, + "mean_token_accuracy": 0.7703535377979278, + "num_tokens": 18689412.0, + "step": 5500 + }, + { + "epoch": 0.055301296720061024, + "learning_rate": 0.0001889417479625838, + "loss": 0.7821, + "mean_token_accuracy": 0.763988482952118, + "num_tokens": 18722288.0, + "step": 5510 + }, + { + "epoch": 0.055401662049861494, + "learning_rate": 0.0001889216748966237, + "loss": 0.7861, + "mean_token_accuracy": 0.7680335581302643, + "num_tokens": 18756723.0, + "step": 5520 + }, + { + "epoch": 0.05550202737966197, + "learning_rate": 0.00018890160183066365, + "loss": 0.8263, + "mean_token_accuracy": 0.7613557398319244, + "num_tokens": 18791263.0, + "step": 5530 + }, + { + "epoch": 0.05560239270946244, + "learning_rate": 0.00018888152876470353, + "loss": 0.8333, + "mean_token_accuracy": 0.7546876013278961, + "num_tokens": 18825148.0, + "step": 5540 + }, + { + "epoch": 0.05570275803926292, + "learning_rate": 0.00018886145569874344, + "loss": 0.8102, + "mean_token_accuracy": 0.7602154076099396, + "num_tokens": 18859192.0, + "step": 5550 + }, + { + "epoch": 0.055803123369063394, + "learning_rate": 0.00018884138263278334, + "loss": 0.8232, + "mean_token_accuracy": 0.7617478847503663, + "num_tokens": 18893079.0, + "step": 5560 + }, + { + "epoch": 0.055903488698863864, + "learning_rate": 0.00018882130956682325, + "loss": 0.8078, + "mean_token_accuracy": 0.7636166334152221, + "num_tokens": 18927014.0, + "step": 5570 + }, + { + "epoch": 0.05600385402866434, + "learning_rate": 0.00018880123650086313, + "loss": 0.8533, + "mean_token_accuracy": 0.7467453896999359, + "num_tokens": 18962129.0, + "step": 5580 + }, + { + "epoch": 0.05610421935846481, + "learning_rate": 0.00018878116343490307, + "loss": 0.7834, + "mean_token_accuracy": 0.7670481979846955, + "num_tokens": 18995617.0, + "step": 5590 + }, + { + "epoch": 0.05620458468826529, + "learning_rate": 0.00018876109036894295, + "loss": 0.7936, + "mean_token_accuracy": 0.7654320299625397, + "num_tokens": 19029412.0, + "step": 5600 + }, + { + "epoch": 0.05630495001806576, + "learning_rate": 0.00018874101730298286, + "loss": 0.7918, + "mean_token_accuracy": 0.7685347139835358, + "num_tokens": 19063413.0, + "step": 5610 + }, + { + "epoch": 0.05640531534786623, + "learning_rate": 0.00018872094423702277, + "loss": 0.7651, + "mean_token_accuracy": 0.7734270513057708, + "num_tokens": 19097359.0, + "step": 5620 + }, + { + "epoch": 0.05650568067766671, + "learning_rate": 0.00018870087117106268, + "loss": 0.7928, + "mean_token_accuracy": 0.7665821790695191, + "num_tokens": 19131252.0, + "step": 5630 + }, + { + "epoch": 0.05660604600746718, + "learning_rate": 0.00018868079810510258, + "loss": 0.7886, + "mean_token_accuracy": 0.7623964071273803, + "num_tokens": 19165014.0, + "step": 5640 + }, + { + "epoch": 0.056706411337267656, + "learning_rate": 0.0001886607250391425, + "loss": 0.767, + "mean_token_accuracy": 0.7693248212337493, + "num_tokens": 19198196.0, + "step": 5650 + }, + { + "epoch": 0.056806776667068126, + "learning_rate": 0.0001886406519731824, + "loss": 0.8134, + "mean_token_accuracy": 0.7667059004306793, + "num_tokens": 19231774.0, + "step": 5660 + }, + { + "epoch": 0.0569071419968686, + "learning_rate": 0.00018862057890722228, + "loss": 0.7965, + "mean_token_accuracy": 0.7676830589771271, + "num_tokens": 19266436.0, + "step": 5670 + }, + { + "epoch": 0.05700750732666907, + "learning_rate": 0.00018860050584126222, + "loss": 0.7978, + "mean_token_accuracy": 0.7694530487060547, + "num_tokens": 19299446.0, + "step": 5680 + }, + { + "epoch": 0.05710787265646955, + "learning_rate": 0.0001885804327753021, + "loss": 0.8187, + "mean_token_accuracy": 0.7586834967136383, + "num_tokens": 19333807.0, + "step": 5690 + }, + { + "epoch": 0.057208237986270026, + "learning_rate": 0.000188560359709342, + "loss": 0.772, + "mean_token_accuracy": 0.7735353410243988, + "num_tokens": 19368038.0, + "step": 5700 + }, + { + "epoch": 0.057308603316070496, + "learning_rate": 0.00018854028664338192, + "loss": 0.8039, + "mean_token_accuracy": 0.7609234035015107, + "num_tokens": 19402947.0, + "step": 5710 + }, + { + "epoch": 0.05740896864587097, + "learning_rate": 0.00018852021357742183, + "loss": 0.7999, + "mean_token_accuracy": 0.7657185137271881, + "num_tokens": 19437044.0, + "step": 5720 + }, + { + "epoch": 0.05750933397567144, + "learning_rate": 0.00018850014051146173, + "loss": 0.7695, + "mean_token_accuracy": 0.7703326880931854, + "num_tokens": 19470934.0, + "step": 5730 + }, + { + "epoch": 0.05760969930547192, + "learning_rate": 0.00018848006744550164, + "loss": 0.8243, + "mean_token_accuracy": 0.7622361481189728, + "num_tokens": 19503986.0, + "step": 5740 + }, + { + "epoch": 0.05771006463527239, + "learning_rate": 0.00018845999437954155, + "loss": 0.8077, + "mean_token_accuracy": 0.768898606300354, + "num_tokens": 19538084.0, + "step": 5750 + }, + { + "epoch": 0.057810429965072865, + "learning_rate": 0.00018843992131358143, + "loss": 0.7856, + "mean_token_accuracy": 0.7670232474803924, + "num_tokens": 19572080.0, + "step": 5760 + }, + { + "epoch": 0.05791079529487334, + "learning_rate": 0.00018841984824762137, + "loss": 0.8298, + "mean_token_accuracy": 0.7527221262454986, + "num_tokens": 19606159.0, + "step": 5770 + }, + { + "epoch": 0.05801116062467381, + "learning_rate": 0.00018839977518166125, + "loss": 0.8162, + "mean_token_accuracy": 0.7591395795345306, + "num_tokens": 19640673.0, + "step": 5780 + }, + { + "epoch": 0.05811152595447429, + "learning_rate": 0.00018837970211570116, + "loss": 0.7917, + "mean_token_accuracy": 0.7707108378410339, + "num_tokens": 19674604.0, + "step": 5790 + }, + { + "epoch": 0.05821189128427476, + "learning_rate": 0.00018835962904974107, + "loss": 0.8416, + "mean_token_accuracy": 0.7613542258739472, + "num_tokens": 19707873.0, + "step": 5800 + }, + { + "epoch": 0.058312256614075235, + "learning_rate": 0.00018833955598378097, + "loss": 0.8096, + "mean_token_accuracy": 0.75683753490448, + "num_tokens": 19742363.0, + "step": 5810 + }, + { + "epoch": 0.058412621943875705, + "learning_rate": 0.00018831948291782086, + "loss": 0.81, + "mean_token_accuracy": 0.7634640634059906, + "num_tokens": 19776866.0, + "step": 5820 + }, + { + "epoch": 0.05851298727367618, + "learning_rate": 0.0001882994098518608, + "loss": 0.7921, + "mean_token_accuracy": 0.7701465368270874, + "num_tokens": 19810644.0, + "step": 5830 + }, + { + "epoch": 0.05861335260347666, + "learning_rate": 0.00018827933678590067, + "loss": 0.7958, + "mean_token_accuracy": 0.7674748599529266, + "num_tokens": 19845030.0, + "step": 5840 + }, + { + "epoch": 0.05871371793327713, + "learning_rate": 0.00018825926371994058, + "loss": 0.7968, + "mean_token_accuracy": 0.7612373232841492, + "num_tokens": 19878641.0, + "step": 5850 + }, + { + "epoch": 0.058814083263077604, + "learning_rate": 0.0001882391906539805, + "loss": 0.8012, + "mean_token_accuracy": 0.7664192676544189, + "num_tokens": 19912612.0, + "step": 5860 + }, + { + "epoch": 0.058914448592878074, + "learning_rate": 0.0001882191175880204, + "loss": 0.8111, + "mean_token_accuracy": 0.7672783672809601, + "num_tokens": 19946931.0, + "step": 5870 + }, + { + "epoch": 0.05901481392267855, + "learning_rate": 0.0001881990445220603, + "loss": 0.7656, + "mean_token_accuracy": 0.7663740038871765, + "num_tokens": 19980517.0, + "step": 5880 + }, + { + "epoch": 0.05911517925247902, + "learning_rate": 0.00018817897145610021, + "loss": 0.814, + "mean_token_accuracy": 0.7602796375751495, + "num_tokens": 20014767.0, + "step": 5890 + }, + { + "epoch": 0.0592155445822795, + "learning_rate": 0.00018815889839014012, + "loss": 0.7862, + "mean_token_accuracy": 0.768184608221054, + "num_tokens": 20049856.0, + "step": 5900 + }, + { + "epoch": 0.059315909912079974, + "learning_rate": 0.00018813882532418003, + "loss": 0.811, + "mean_token_accuracy": 0.762929767370224, + "num_tokens": 20084071.0, + "step": 5910 + }, + { + "epoch": 0.059416275241880444, + "learning_rate": 0.00018811875225821994, + "loss": 0.8411, + "mean_token_accuracy": 0.7571568787097931, + "num_tokens": 20117537.0, + "step": 5920 + }, + { + "epoch": 0.05951664057168092, + "learning_rate": 0.00018809867919225982, + "loss": 0.7808, + "mean_token_accuracy": 0.7661379158496857, + "num_tokens": 20151452.0, + "step": 5930 + }, + { + "epoch": 0.05961700590148139, + "learning_rate": 0.00018807860612629976, + "loss": 0.8045, + "mean_token_accuracy": 0.7613177597522736, + "num_tokens": 20186055.0, + "step": 5940 + }, + { + "epoch": 0.05971737123128187, + "learning_rate": 0.00018805853306033964, + "loss": 0.8308, + "mean_token_accuracy": 0.7547689199447631, + "num_tokens": 20219685.0, + "step": 5950 + }, + { + "epoch": 0.05981773656108234, + "learning_rate": 0.00018803845999437955, + "loss": 0.7782, + "mean_token_accuracy": 0.7654559493064881, + "num_tokens": 20252861.0, + "step": 5960 + }, + { + "epoch": 0.05991810189088281, + "learning_rate": 0.00018801838692841945, + "loss": 0.8142, + "mean_token_accuracy": 0.7605828762054443, + "num_tokens": 20287153.0, + "step": 5970 + }, + { + "epoch": 0.06001846722068329, + "learning_rate": 0.00018799831386245936, + "loss": 0.7865, + "mean_token_accuracy": 0.7667762041091919, + "num_tokens": 20320973.0, + "step": 5980 + }, + { + "epoch": 0.06011883255048376, + "learning_rate": 0.00018797824079649927, + "loss": 0.8286, + "mean_token_accuracy": 0.760528302192688, + "num_tokens": 20355336.0, + "step": 5990 + }, + { + "epoch": 0.060219197880284236, + "learning_rate": 0.00018795816773053918, + "loss": 0.7953, + "mean_token_accuracy": 0.7689983487129212, + "num_tokens": 20389318.0, + "step": 6000 + }, + { + "epoch": 0.060319563210084706, + "learning_rate": 0.0001879380946645791, + "loss": 0.7804, + "mean_token_accuracy": 0.7755901873111725, + "num_tokens": 20423818.0, + "step": 6010 + }, + { + "epoch": 0.06041992853988518, + "learning_rate": 0.00018791802159861897, + "loss": 0.842, + "mean_token_accuracy": 0.7587439954280853, + "num_tokens": 20457672.0, + "step": 6020 + }, + { + "epoch": 0.06052029386968565, + "learning_rate": 0.0001878979485326589, + "loss": 0.8397, + "mean_token_accuracy": 0.7565126895904541, + "num_tokens": 20491344.0, + "step": 6030 + }, + { + "epoch": 0.06062065919948613, + "learning_rate": 0.0001878778754666988, + "loss": 0.7981, + "mean_token_accuracy": 0.7695219695568085, + "num_tokens": 20526064.0, + "step": 6040 + }, + { + "epoch": 0.060721024529286606, + "learning_rate": 0.0001878578024007387, + "loss": 0.7987, + "mean_token_accuracy": 0.7648639619350434, + "num_tokens": 20559452.0, + "step": 6050 + }, + { + "epoch": 0.060821389859087076, + "learning_rate": 0.0001878377293347786, + "loss": 0.809, + "mean_token_accuracy": 0.7631817996501923, + "num_tokens": 20593229.0, + "step": 6060 + }, + { + "epoch": 0.06092175518888755, + "learning_rate": 0.0001878176562688185, + "loss": 0.7956, + "mean_token_accuracy": 0.7655171811580658, + "num_tokens": 20626658.0, + "step": 6070 + }, + { + "epoch": 0.06102212051868802, + "learning_rate": 0.00018779758320285842, + "loss": 0.815, + "mean_token_accuracy": 0.76067014336586, + "num_tokens": 20660950.0, + "step": 6080 + }, + { + "epoch": 0.0611224858484885, + "learning_rate": 0.00018777751013689833, + "loss": 0.7855, + "mean_token_accuracy": 0.7704148888587952, + "num_tokens": 20695240.0, + "step": 6090 + }, + { + "epoch": 0.06122285117828897, + "learning_rate": 0.00018775743707093824, + "loss": 0.777, + "mean_token_accuracy": 0.7698096513748169, + "num_tokens": 20729588.0, + "step": 6100 + }, + { + "epoch": 0.061323216508089445, + "learning_rate": 0.00018773736400497812, + "loss": 0.8143, + "mean_token_accuracy": 0.7658511698246002, + "num_tokens": 20763084.0, + "step": 6110 + }, + { + "epoch": 0.06142358183788992, + "learning_rate": 0.00018771729093901805, + "loss": 0.7913, + "mean_token_accuracy": 0.7673853039741516, + "num_tokens": 20797083.0, + "step": 6120 + }, + { + "epoch": 0.06152394716769039, + "learning_rate": 0.00018769721787305794, + "loss": 0.7981, + "mean_token_accuracy": 0.7638794362545014, + "num_tokens": 20831358.0, + "step": 6130 + }, + { + "epoch": 0.06162431249749087, + "learning_rate": 0.00018767714480709784, + "loss": 0.8172, + "mean_token_accuracy": 0.7574215590953827, + "num_tokens": 20866454.0, + "step": 6140 + }, + { + "epoch": 0.06172467782729134, + "learning_rate": 0.00018765707174113775, + "loss": 0.7934, + "mean_token_accuracy": 0.768745094537735, + "num_tokens": 20899962.0, + "step": 6150 + }, + { + "epoch": 0.061825043157091815, + "learning_rate": 0.00018763699867517766, + "loss": 0.8202, + "mean_token_accuracy": 0.7607693433761596, + "num_tokens": 20933697.0, + "step": 6160 + }, + { + "epoch": 0.061925408486892285, + "learning_rate": 0.00018761692560921754, + "loss": 0.7861, + "mean_token_accuracy": 0.7652881443500519, + "num_tokens": 20968060.0, + "step": 6170 + }, + { + "epoch": 0.06202577381669276, + "learning_rate": 0.00018759685254325748, + "loss": 0.7731, + "mean_token_accuracy": 0.7703279852867126, + "num_tokens": 21001696.0, + "step": 6180 + }, + { + "epoch": 0.06212613914649324, + "learning_rate": 0.00018757677947729736, + "loss": 0.8066, + "mean_token_accuracy": 0.7638004124164581, + "num_tokens": 21035406.0, + "step": 6190 + }, + { + "epoch": 0.06222650447629371, + "learning_rate": 0.00018755670641133727, + "loss": 0.8317, + "mean_token_accuracy": 0.7551860272884369, + "num_tokens": 21069683.0, + "step": 6200 + }, + { + "epoch": 0.062326869806094184, + "learning_rate": 0.00018753663334537718, + "loss": 0.7973, + "mean_token_accuracy": 0.7640761077404022, + "num_tokens": 21103087.0, + "step": 6210 + }, + { + "epoch": 0.062427235135894654, + "learning_rate": 0.00018751656027941708, + "loss": 0.8224, + "mean_token_accuracy": 0.7616025328636169, + "num_tokens": 21137491.0, + "step": 6220 + }, + { + "epoch": 0.06252760046569512, + "learning_rate": 0.000187496487213457, + "loss": 0.7994, + "mean_token_accuracy": 0.7634743452072144, + "num_tokens": 21170793.0, + "step": 6230 + }, + { + "epoch": 0.06262796579549561, + "learning_rate": 0.0001874764141474969, + "loss": 0.7774, + "mean_token_accuracy": 0.7705293118953704, + "num_tokens": 21204817.0, + "step": 6240 + }, + { + "epoch": 0.06272833112529608, + "learning_rate": 0.0001874563410815368, + "loss": 0.7837, + "mean_token_accuracy": 0.7658221244812011, + "num_tokens": 21238410.0, + "step": 6250 + }, + { + "epoch": 0.06282869645509655, + "learning_rate": 0.0001874362680155767, + "loss": 0.7713, + "mean_token_accuracy": 0.7699131309986115, + "num_tokens": 21272207.0, + "step": 6260 + }, + { + "epoch": 0.06292906178489703, + "learning_rate": 0.00018741619494961663, + "loss": 0.8096, + "mean_token_accuracy": 0.7599456548690796, + "num_tokens": 21306565.0, + "step": 6270 + }, + { + "epoch": 0.0630294271146975, + "learning_rate": 0.0001873961218836565, + "loss": 0.8294, + "mean_token_accuracy": 0.7624841749668121, + "num_tokens": 21340759.0, + "step": 6280 + }, + { + "epoch": 0.06312979244449797, + "learning_rate": 0.00018737604881769642, + "loss": 0.7795, + "mean_token_accuracy": 0.7709579408168793, + "num_tokens": 21374808.0, + "step": 6290 + }, + { + "epoch": 0.06323015777429844, + "learning_rate": 0.00018735597575173632, + "loss": 0.8122, + "mean_token_accuracy": 0.768221527338028, + "num_tokens": 21408934.0, + "step": 6300 + }, + { + "epoch": 0.06333052310409892, + "learning_rate": 0.00018733590268577623, + "loss": 0.7999, + "mean_token_accuracy": 0.7624027013778687, + "num_tokens": 21443766.0, + "step": 6310 + }, + { + "epoch": 0.0634308884338994, + "learning_rate": 0.00018731582961981614, + "loss": 0.8013, + "mean_token_accuracy": 0.7636422693729401, + "num_tokens": 21476818.0, + "step": 6320 + }, + { + "epoch": 0.06353125376369986, + "learning_rate": 0.00018729575655385605, + "loss": 0.8473, + "mean_token_accuracy": 0.7541101336479187, + "num_tokens": 21510554.0, + "step": 6330 + }, + { + "epoch": 0.06363161909350035, + "learning_rate": 0.00018727568348789596, + "loss": 0.7798, + "mean_token_accuracy": 0.7720778703689575, + "num_tokens": 21544946.0, + "step": 6340 + }, + { + "epoch": 0.06373198442330082, + "learning_rate": 0.00018725561042193584, + "loss": 0.8102, + "mean_token_accuracy": 0.7652732551097869, + "num_tokens": 21578855.0, + "step": 6350 + }, + { + "epoch": 0.06383234975310129, + "learning_rate": 0.00018723553735597578, + "loss": 0.8019, + "mean_token_accuracy": 0.7628812253475189, + "num_tokens": 21612750.0, + "step": 6360 + }, + { + "epoch": 0.06393271508290176, + "learning_rate": 0.00018721546429001566, + "loss": 0.8047, + "mean_token_accuracy": 0.7649907410144806, + "num_tokens": 21646545.0, + "step": 6370 + }, + { + "epoch": 0.06403308041270224, + "learning_rate": 0.00018719539122405556, + "loss": 0.7387, + "mean_token_accuracy": 0.7732436716556549, + "num_tokens": 21679576.0, + "step": 6380 + }, + { + "epoch": 0.06413344574250271, + "learning_rate": 0.00018717531815809547, + "loss": 0.7835, + "mean_token_accuracy": 0.7719547331333161, + "num_tokens": 21713415.0, + "step": 6390 + }, + { + "epoch": 0.06423381107230318, + "learning_rate": 0.00018715524509213538, + "loss": 0.8116, + "mean_token_accuracy": 0.7636037707328797, + "num_tokens": 21748100.0, + "step": 6400 + }, + { + "epoch": 0.06433417640210366, + "learning_rate": 0.00018713517202617526, + "loss": 0.8141, + "mean_token_accuracy": 0.7599149942398071, + "num_tokens": 21782455.0, + "step": 6410 + }, + { + "epoch": 0.06443454173190413, + "learning_rate": 0.0001871150989602152, + "loss": 0.7932, + "mean_token_accuracy": 0.7646901726722717, + "num_tokens": 21815891.0, + "step": 6420 + }, + { + "epoch": 0.0645349070617046, + "learning_rate": 0.0001870950258942551, + "loss": 0.8204, + "mean_token_accuracy": 0.7630632758140564, + "num_tokens": 21850242.0, + "step": 6430 + }, + { + "epoch": 0.06463527239150507, + "learning_rate": 0.00018707495282829502, + "loss": 0.8234, + "mean_token_accuracy": 0.7595869898796082, + "num_tokens": 21884118.0, + "step": 6440 + }, + { + "epoch": 0.06473563772130556, + "learning_rate": 0.00018705487976233492, + "loss": 0.8086, + "mean_token_accuracy": 0.7603508055210113, + "num_tokens": 21918370.0, + "step": 6450 + }, + { + "epoch": 0.06483600305110603, + "learning_rate": 0.0001870348066963748, + "loss": 0.8086, + "mean_token_accuracy": 0.7649601578712464, + "num_tokens": 21952680.0, + "step": 6460 + }, + { + "epoch": 0.0649363683809065, + "learning_rate": 0.00018701473363041474, + "loss": 0.7808, + "mean_token_accuracy": 0.7692488193511963, + "num_tokens": 21986556.0, + "step": 6470 + }, + { + "epoch": 0.06503673371070698, + "learning_rate": 0.00018699466056445462, + "loss": 0.7904, + "mean_token_accuracy": 0.7678544044494628, + "num_tokens": 22020264.0, + "step": 6480 + }, + { + "epoch": 0.06513709904050745, + "learning_rate": 0.00018697458749849453, + "loss": 0.8102, + "mean_token_accuracy": 0.757061505317688, + "num_tokens": 22054571.0, + "step": 6490 + }, + { + "epoch": 0.06523746437030792, + "learning_rate": 0.00018695451443253444, + "loss": 0.8058, + "mean_token_accuracy": 0.7630744695663452, + "num_tokens": 22088121.0, + "step": 6500 + }, + { + "epoch": 0.06533782970010839, + "learning_rate": 0.00018693444136657435, + "loss": 0.7819, + "mean_token_accuracy": 0.7664906919002533, + "num_tokens": 22121552.0, + "step": 6510 + }, + { + "epoch": 0.06543819502990887, + "learning_rate": 0.00018691436830061423, + "loss": 0.8029, + "mean_token_accuracy": 0.7638392865657806, + "num_tokens": 22155401.0, + "step": 6520 + }, + { + "epoch": 0.06553856035970934, + "learning_rate": 0.00018689429523465416, + "loss": 0.8128, + "mean_token_accuracy": 0.7656901359558106, + "num_tokens": 22190370.0, + "step": 6530 + }, + { + "epoch": 0.06563892568950981, + "learning_rate": 0.00018687422216869405, + "loss": 0.7885, + "mean_token_accuracy": 0.7664203882217407, + "num_tokens": 22224623.0, + "step": 6540 + }, + { + "epoch": 0.0657392910193103, + "learning_rate": 0.00018685414910273395, + "loss": 0.8051, + "mean_token_accuracy": 0.7663968801498413, + "num_tokens": 22257909.0, + "step": 6550 + }, + { + "epoch": 0.06583965634911076, + "learning_rate": 0.00018683407603677386, + "loss": 0.7753, + "mean_token_accuracy": 0.7702917993068695, + "num_tokens": 22292308.0, + "step": 6560 + }, + { + "epoch": 0.06594002167891123, + "learning_rate": 0.00018681400297081377, + "loss": 0.8258, + "mean_token_accuracy": 0.7632131099700927, + "num_tokens": 22326205.0, + "step": 6570 + }, + { + "epoch": 0.0660403870087117, + "learning_rate": 0.00018679392990485368, + "loss": 0.7981, + "mean_token_accuracy": 0.7664714992046356, + "num_tokens": 22360295.0, + "step": 6580 + }, + { + "epoch": 0.06614075233851219, + "learning_rate": 0.0001867738568388936, + "loss": 0.8162, + "mean_token_accuracy": 0.7592804372310639, + "num_tokens": 22393878.0, + "step": 6590 + }, + { + "epoch": 0.06624111766831266, + "learning_rate": 0.0001867537837729335, + "loss": 0.7815, + "mean_token_accuracy": 0.7708893895149231, + "num_tokens": 22427401.0, + "step": 6600 + }, + { + "epoch": 0.06634148299811313, + "learning_rate": 0.00018673371070697338, + "loss": 0.7533, + "mean_token_accuracy": 0.7742358803749084, + "num_tokens": 22461573.0, + "step": 6610 + }, + { + "epoch": 0.06644184832791361, + "learning_rate": 0.0001867136376410133, + "loss": 0.7825, + "mean_token_accuracy": 0.7690136432647705, + "num_tokens": 22495932.0, + "step": 6620 + }, + { + "epoch": 0.06654221365771408, + "learning_rate": 0.0001866935645750532, + "loss": 0.7695, + "mean_token_accuracy": 0.772958654165268, + "num_tokens": 22530271.0, + "step": 6630 + }, + { + "epoch": 0.06664257898751455, + "learning_rate": 0.0001866734915090931, + "loss": 0.7696, + "mean_token_accuracy": 0.7698410391807556, + "num_tokens": 22564450.0, + "step": 6640 + }, + { + "epoch": 0.06674294431731502, + "learning_rate": 0.000186653418443133, + "loss": 0.7832, + "mean_token_accuracy": 0.7672110676765442, + "num_tokens": 22598384.0, + "step": 6650 + }, + { + "epoch": 0.0668433096471155, + "learning_rate": 0.00018663334537717292, + "loss": 0.8045, + "mean_token_accuracy": 0.7631735801696777, + "num_tokens": 22632404.0, + "step": 6660 + }, + { + "epoch": 0.06694367497691597, + "learning_rate": 0.00018661327231121283, + "loss": 0.8113, + "mean_token_accuracy": 0.7584132015705108, + "num_tokens": 22666582.0, + "step": 6670 + }, + { + "epoch": 0.06704404030671644, + "learning_rate": 0.00018659319924525274, + "loss": 0.8197, + "mean_token_accuracy": 0.7588787019252777, + "num_tokens": 22700042.0, + "step": 6680 + }, + { + "epoch": 0.06714440563651693, + "learning_rate": 0.00018657312617929265, + "loss": 0.7848, + "mean_token_accuracy": 0.7639056861400604, + "num_tokens": 22734093.0, + "step": 6690 + }, + { + "epoch": 0.0672447709663174, + "learning_rate": 0.00018655305311333253, + "loss": 0.7943, + "mean_token_accuracy": 0.768567031621933, + "num_tokens": 22768710.0, + "step": 6700 + }, + { + "epoch": 0.06734513629611787, + "learning_rate": 0.00018653298004737246, + "loss": 0.7933, + "mean_token_accuracy": 0.77075697183609, + "num_tokens": 22802873.0, + "step": 6710 + }, + { + "epoch": 0.06744550162591834, + "learning_rate": 0.00018651290698141234, + "loss": 0.7788, + "mean_token_accuracy": 0.7654812693595886, + "num_tokens": 22837076.0, + "step": 6720 + }, + { + "epoch": 0.06754586695571882, + "learning_rate": 0.00018649283391545225, + "loss": 0.7879, + "mean_token_accuracy": 0.767909950017929, + "num_tokens": 22870632.0, + "step": 6730 + }, + { + "epoch": 0.06764623228551929, + "learning_rate": 0.00018647276084949216, + "loss": 0.8248, + "mean_token_accuracy": 0.7626499176025391, + "num_tokens": 22904468.0, + "step": 6740 + }, + { + "epoch": 0.06774659761531976, + "learning_rate": 0.00018645268778353207, + "loss": 0.8024, + "mean_token_accuracy": 0.7642915844917297, + "num_tokens": 22938185.0, + "step": 6750 + }, + { + "epoch": 0.06784696294512024, + "learning_rate": 0.00018643261471757195, + "loss": 0.8006, + "mean_token_accuracy": 0.7666011452674866, + "num_tokens": 22971572.0, + "step": 6760 + }, + { + "epoch": 0.06794732827492071, + "learning_rate": 0.00018641254165161189, + "loss": 0.8288, + "mean_token_accuracy": 0.7597508609294892, + "num_tokens": 23005463.0, + "step": 6770 + }, + { + "epoch": 0.06804769360472118, + "learning_rate": 0.0001863924685856518, + "loss": 0.8122, + "mean_token_accuracy": 0.7596763968467712, + "num_tokens": 23040406.0, + "step": 6780 + }, + { + "epoch": 0.06814805893452165, + "learning_rate": 0.00018637239551969168, + "loss": 0.8016, + "mean_token_accuracy": 0.7657992899417877, + "num_tokens": 23074368.0, + "step": 6790 + }, + { + "epoch": 0.06824842426432214, + "learning_rate": 0.0001863523224537316, + "loss": 0.7887, + "mean_token_accuracy": 0.7637387990951539, + "num_tokens": 23108197.0, + "step": 6800 + }, + { + "epoch": 0.0683487895941226, + "learning_rate": 0.0001863322493877715, + "loss": 0.7786, + "mean_token_accuracy": 0.7647190570831299, + "num_tokens": 23142110.0, + "step": 6810 + }, + { + "epoch": 0.06844915492392308, + "learning_rate": 0.0001863121763218114, + "loss": 0.7971, + "mean_token_accuracy": 0.7630793511867523, + "num_tokens": 23176423.0, + "step": 6820 + }, + { + "epoch": 0.06854952025372356, + "learning_rate": 0.0001862921032558513, + "loss": 0.8011, + "mean_token_accuracy": 0.7649743497371674, + "num_tokens": 23210845.0, + "step": 6830 + }, + { + "epoch": 0.06864988558352403, + "learning_rate": 0.00018627203018989122, + "loss": 0.7749, + "mean_token_accuracy": 0.7704343676567078, + "num_tokens": 23244552.0, + "step": 6840 + }, + { + "epoch": 0.0687502509133245, + "learning_rate": 0.0001862519571239311, + "loss": 0.7721, + "mean_token_accuracy": 0.7698425590991974, + "num_tokens": 23277814.0, + "step": 6850 + }, + { + "epoch": 0.06885061624312497, + "learning_rate": 0.00018623188405797103, + "loss": 0.7882, + "mean_token_accuracy": 0.7701736092567444, + "num_tokens": 23312519.0, + "step": 6860 + }, + { + "epoch": 0.06895098157292545, + "learning_rate": 0.00018621181099201092, + "loss": 0.7998, + "mean_token_accuracy": 0.7650366485118866, + "num_tokens": 23345465.0, + "step": 6870 + }, + { + "epoch": 0.06905134690272592, + "learning_rate": 0.00018619173792605082, + "loss": 0.812, + "mean_token_accuracy": 0.7643380880355835, + "num_tokens": 23379659.0, + "step": 6880 + }, + { + "epoch": 0.06915171223252639, + "learning_rate": 0.00018617166486009073, + "loss": 0.7994, + "mean_token_accuracy": 0.7671465694904327, + "num_tokens": 23413846.0, + "step": 6890 + }, + { + "epoch": 0.06925207756232687, + "learning_rate": 0.00018615159179413064, + "loss": 0.7822, + "mean_token_accuracy": 0.7706863880157471, + "num_tokens": 23448483.0, + "step": 6900 + }, + { + "epoch": 0.06935244289212734, + "learning_rate": 0.00018613151872817055, + "loss": 0.8162, + "mean_token_accuracy": 0.7635308921337127, + "num_tokens": 23482708.0, + "step": 6910 + }, + { + "epoch": 0.06945280822192781, + "learning_rate": 0.00018611144566221046, + "loss": 0.795, + "mean_token_accuracy": 0.7642087519168854, + "num_tokens": 23516631.0, + "step": 6920 + }, + { + "epoch": 0.0695531735517283, + "learning_rate": 0.00018609137259625037, + "loss": 0.7962, + "mean_token_accuracy": 0.7656026661396027, + "num_tokens": 23549636.0, + "step": 6930 + }, + { + "epoch": 0.06965353888152877, + "learning_rate": 0.00018607129953029025, + "loss": 0.7884, + "mean_token_accuracy": 0.7681177496910095, + "num_tokens": 23583937.0, + "step": 6940 + }, + { + "epoch": 0.06975390421132924, + "learning_rate": 0.00018605122646433018, + "loss": 0.7803, + "mean_token_accuracy": 0.7695082247257232, + "num_tokens": 23617720.0, + "step": 6950 + }, + { + "epoch": 0.06985426954112971, + "learning_rate": 0.00018603115339837006, + "loss": 0.8068, + "mean_token_accuracy": 0.7647221088409424, + "num_tokens": 23652403.0, + "step": 6960 + }, + { + "epoch": 0.06995463487093019, + "learning_rate": 0.00018601108033240997, + "loss": 0.804, + "mean_token_accuracy": 0.7643355369567871, + "num_tokens": 23686213.0, + "step": 6970 + }, + { + "epoch": 0.07005500020073066, + "learning_rate": 0.00018599100726644988, + "loss": 0.7881, + "mean_token_accuracy": 0.7634240865707398, + "num_tokens": 23720434.0, + "step": 6980 + }, + { + "epoch": 0.07015536553053113, + "learning_rate": 0.0001859709342004898, + "loss": 0.7431, + "mean_token_accuracy": 0.7756571233272552, + "num_tokens": 23754142.0, + "step": 6990 + }, + { + "epoch": 0.07025573086033161, + "learning_rate": 0.0001859508611345297, + "loss": 0.7755, + "mean_token_accuracy": 0.7678376853466033, + "num_tokens": 23788474.0, + "step": 7000 + }, + { + "epoch": 0.07035609619013208, + "learning_rate": 0.0001859307880685696, + "loss": 0.7939, + "mean_token_accuracy": 0.7618476390838623, + "num_tokens": 23822495.0, + "step": 7010 + }, + { + "epoch": 0.07045646151993255, + "learning_rate": 0.00018591071500260952, + "loss": 0.7935, + "mean_token_accuracy": 0.7679507672786713, + "num_tokens": 23856653.0, + "step": 7020 + }, + { + "epoch": 0.07055682684973302, + "learning_rate": 0.00018589064193664942, + "loss": 0.8062, + "mean_token_accuracy": 0.7621446549892426, + "num_tokens": 23889845.0, + "step": 7030 + }, + { + "epoch": 0.0706571921795335, + "learning_rate": 0.00018587056887068933, + "loss": 0.7955, + "mean_token_accuracy": 0.7612752199172974, + "num_tokens": 23923933.0, + "step": 7040 + }, + { + "epoch": 0.07075755750933398, + "learning_rate": 0.0001858504958047292, + "loss": 0.8045, + "mean_token_accuracy": 0.7675998091697693, + "num_tokens": 23958128.0, + "step": 7050 + }, + { + "epoch": 0.07085792283913445, + "learning_rate": 0.00018583042273876915, + "loss": 0.7695, + "mean_token_accuracy": 0.7677767932415008, + "num_tokens": 23991852.0, + "step": 7060 + }, + { + "epoch": 0.07095828816893493, + "learning_rate": 0.00018581034967280903, + "loss": 0.7968, + "mean_token_accuracy": 0.7666783332824707, + "num_tokens": 24025509.0, + "step": 7070 + }, + { + "epoch": 0.0710586534987354, + "learning_rate": 0.00018579027660684894, + "loss": 0.7608, + "mean_token_accuracy": 0.7742595195770263, + "num_tokens": 24059977.0, + "step": 7080 + }, + { + "epoch": 0.07115901882853587, + "learning_rate": 0.00018577020354088885, + "loss": 0.8159, + "mean_token_accuracy": 0.7611697912216187, + "num_tokens": 24094490.0, + "step": 7090 + }, + { + "epoch": 0.07125938415833634, + "learning_rate": 0.00018575013047492876, + "loss": 0.7988, + "mean_token_accuracy": 0.7634016036987304, + "num_tokens": 24127862.0, + "step": 7100 + }, + { + "epoch": 0.07135974948813682, + "learning_rate": 0.00018573005740896864, + "loss": 0.8365, + "mean_token_accuracy": 0.75287726521492, + "num_tokens": 24162831.0, + "step": 7110 + }, + { + "epoch": 0.07146011481793729, + "learning_rate": 0.00018570998434300857, + "loss": 0.7845, + "mean_token_accuracy": 0.7638778507709503, + "num_tokens": 24196205.0, + "step": 7120 + }, + { + "epoch": 0.07156048014773776, + "learning_rate": 0.00018568991127704848, + "loss": 0.816, + "mean_token_accuracy": 0.7571133255958558, + "num_tokens": 24230360.0, + "step": 7130 + }, + { + "epoch": 0.07166084547753825, + "learning_rate": 0.00018566983821108836, + "loss": 0.8029, + "mean_token_accuracy": 0.7698984265327453, + "num_tokens": 24264184.0, + "step": 7140 + }, + { + "epoch": 0.07176121080733872, + "learning_rate": 0.0001856497651451283, + "loss": 0.8, + "mean_token_accuracy": 0.7596933901309967, + "num_tokens": 24298488.0, + "step": 7150 + }, + { + "epoch": 0.07186157613713919, + "learning_rate": 0.00018562969207916818, + "loss": 0.7838, + "mean_token_accuracy": 0.7674479365348816, + "num_tokens": 24332168.0, + "step": 7160 + }, + { + "epoch": 0.07196194146693966, + "learning_rate": 0.0001856096190132081, + "loss": 0.7817, + "mean_token_accuracy": 0.7701567053794861, + "num_tokens": 24367218.0, + "step": 7170 + }, + { + "epoch": 0.07206230679674014, + "learning_rate": 0.000185589545947248, + "loss": 0.8054, + "mean_token_accuracy": 0.7614714801311493, + "num_tokens": 24401414.0, + "step": 7180 + }, + { + "epoch": 0.07216267212654061, + "learning_rate": 0.0001855694728812879, + "loss": 0.8169, + "mean_token_accuracy": 0.7615014910697937, + "num_tokens": 24434667.0, + "step": 7190 + }, + { + "epoch": 0.07226303745634108, + "learning_rate": 0.00018554939981532779, + "loss": 0.8453, + "mean_token_accuracy": 0.7534982144832612, + "num_tokens": 24467459.0, + "step": 7200 + }, + { + "epoch": 0.07236340278614156, + "learning_rate": 0.00018552932674936772, + "loss": 0.825, + "mean_token_accuracy": 0.7568074822425842, + "num_tokens": 24501863.0, + "step": 7210 + }, + { + "epoch": 0.07246376811594203, + "learning_rate": 0.0001855092536834076, + "loss": 0.8232, + "mean_token_accuracy": 0.7650467276573181, + "num_tokens": 24536523.0, + "step": 7220 + }, + { + "epoch": 0.0725641334457425, + "learning_rate": 0.0001854891806174475, + "loss": 0.7662, + "mean_token_accuracy": 0.7714950680732727, + "num_tokens": 24569789.0, + "step": 7230 + }, + { + "epoch": 0.07266449877554297, + "learning_rate": 0.00018546910755148742, + "loss": 0.7812, + "mean_token_accuracy": 0.7700926840305329, + "num_tokens": 24603356.0, + "step": 7240 + }, + { + "epoch": 0.07276486410534345, + "learning_rate": 0.00018544903448552733, + "loss": 0.8097, + "mean_token_accuracy": 0.7624179661273957, + "num_tokens": 24636880.0, + "step": 7250 + }, + { + "epoch": 0.07286522943514392, + "learning_rate": 0.00018542896141956724, + "loss": 0.7745, + "mean_token_accuracy": 0.7721749603748321, + "num_tokens": 24670012.0, + "step": 7260 + }, + { + "epoch": 0.0729655947649444, + "learning_rate": 0.00018540888835360714, + "loss": 0.7861, + "mean_token_accuracy": 0.7649307548999786, + "num_tokens": 24705021.0, + "step": 7270 + }, + { + "epoch": 0.07306596009474488, + "learning_rate": 0.00018538881528764705, + "loss": 0.8028, + "mean_token_accuracy": 0.7616039216518402, + "num_tokens": 24739152.0, + "step": 7280 + }, + { + "epoch": 0.07316632542454535, + "learning_rate": 0.00018536874222168693, + "loss": 0.7838, + "mean_token_accuracy": 0.7636917471885681, + "num_tokens": 24772941.0, + "step": 7290 + }, + { + "epoch": 0.07326669075434582, + "learning_rate": 0.00018534866915572687, + "loss": 0.7688, + "mean_token_accuracy": 0.7758508145809173, + "num_tokens": 24807079.0, + "step": 7300 + }, + { + "epoch": 0.07336705608414629, + "learning_rate": 0.00018532859608976675, + "loss": 0.7727, + "mean_token_accuracy": 0.7693508982658386, + "num_tokens": 24841006.0, + "step": 7310 + }, + { + "epoch": 0.07346742141394677, + "learning_rate": 0.00018530852302380666, + "loss": 0.8136, + "mean_token_accuracy": 0.7646665930747986, + "num_tokens": 24874708.0, + "step": 7320 + }, + { + "epoch": 0.07356778674374724, + "learning_rate": 0.00018528844995784657, + "loss": 0.7939, + "mean_token_accuracy": 0.7661986827850342, + "num_tokens": 24907841.0, + "step": 7330 + }, + { + "epoch": 0.07366815207354771, + "learning_rate": 0.00018526837689188648, + "loss": 0.8078, + "mean_token_accuracy": 0.76460902094841, + "num_tokens": 24941688.0, + "step": 7340 + }, + { + "epoch": 0.0737685174033482, + "learning_rate": 0.00018524830382592639, + "loss": 0.7928, + "mean_token_accuracy": 0.7639065086841583, + "num_tokens": 24975598.0, + "step": 7350 + }, + { + "epoch": 0.07386888273314866, + "learning_rate": 0.0001852282307599663, + "loss": 0.7972, + "mean_token_accuracy": 0.7660596668720245, + "num_tokens": 25009904.0, + "step": 7360 + }, + { + "epoch": 0.07396924806294913, + "learning_rate": 0.0001852081576940062, + "loss": 0.8195, + "mean_token_accuracy": 0.761925333738327, + "num_tokens": 25044157.0, + "step": 7370 + }, + { + "epoch": 0.0740696133927496, + "learning_rate": 0.00018518808462804608, + "loss": 0.8299, + "mean_token_accuracy": 0.7579504311084747, + "num_tokens": 25078167.0, + "step": 7380 + }, + { + "epoch": 0.07416997872255009, + "learning_rate": 0.00018516801156208602, + "loss": 0.8098, + "mean_token_accuracy": 0.7582357406616211, + "num_tokens": 25113228.0, + "step": 7390 + }, + { + "epoch": 0.07427034405235056, + "learning_rate": 0.0001851479384961259, + "loss": 0.8331, + "mean_token_accuracy": 0.7541563868522644, + "num_tokens": 25146882.0, + "step": 7400 + }, + { + "epoch": 0.07437070938215103, + "learning_rate": 0.0001851278654301658, + "loss": 0.8157, + "mean_token_accuracy": 0.7633441150188446, + "num_tokens": 25181415.0, + "step": 7410 + }, + { + "epoch": 0.07447107471195151, + "learning_rate": 0.00018510779236420572, + "loss": 0.7911, + "mean_token_accuracy": 0.7619963705539703, + "num_tokens": 25214350.0, + "step": 7420 + }, + { + "epoch": 0.07457144004175198, + "learning_rate": 0.00018508771929824563, + "loss": 0.8051, + "mean_token_accuracy": 0.7647240459918976, + "num_tokens": 25247448.0, + "step": 7430 + }, + { + "epoch": 0.07467180537155245, + "learning_rate": 0.0001850676462322855, + "loss": 0.7904, + "mean_token_accuracy": 0.76084805727005, + "num_tokens": 25281821.0, + "step": 7440 + }, + { + "epoch": 0.07477217070135292, + "learning_rate": 0.00018504757316632544, + "loss": 0.7992, + "mean_token_accuracy": 0.7663967788219452, + "num_tokens": 25315809.0, + "step": 7450 + }, + { + "epoch": 0.0748725360311534, + "learning_rate": 0.00018502750010036532, + "loss": 0.7854, + "mean_token_accuracy": 0.7667467296123505, + "num_tokens": 25349531.0, + "step": 7460 + }, + { + "epoch": 0.07497290136095387, + "learning_rate": 0.00018500742703440523, + "loss": 0.7869, + "mean_token_accuracy": 0.7643426060676575, + "num_tokens": 25384776.0, + "step": 7470 + }, + { + "epoch": 0.07507326669075434, + "learning_rate": 0.00018498735396844514, + "loss": 0.8214, + "mean_token_accuracy": 0.7597658336162567, + "num_tokens": 25418496.0, + "step": 7480 + }, + { + "epoch": 0.07517363202055483, + "learning_rate": 0.00018496728090248505, + "loss": 0.795, + "mean_token_accuracy": 0.7658503949642181, + "num_tokens": 25452606.0, + "step": 7490 + }, + { + "epoch": 0.0752739973503553, + "learning_rate": 0.00018494720783652496, + "loss": 0.8209, + "mean_token_accuracy": 0.7629762351512909, + "num_tokens": 25487228.0, + "step": 7500 + }, + { + "epoch": 0.07537436268015577, + "learning_rate": 0.00018492713477056487, + "loss": 0.8016, + "mean_token_accuracy": 0.7633273899555206, + "num_tokens": 25521640.0, + "step": 7510 + }, + { + "epoch": 0.07547472800995624, + "learning_rate": 0.00018490706170460477, + "loss": 0.7946, + "mean_token_accuracy": 0.768276309967041, + "num_tokens": 25555665.0, + "step": 7520 + }, + { + "epoch": 0.07557509333975672, + "learning_rate": 0.00018488698863864466, + "loss": 0.7937, + "mean_token_accuracy": 0.7652099788188934, + "num_tokens": 25589412.0, + "step": 7530 + }, + { + "epoch": 0.07567545866955719, + "learning_rate": 0.0001848669155726846, + "loss": 0.8144, + "mean_token_accuracy": 0.764784699678421, + "num_tokens": 25623812.0, + "step": 7540 + }, + { + "epoch": 0.07577582399935766, + "learning_rate": 0.00018484684250672447, + "loss": 0.7747, + "mean_token_accuracy": 0.7708411574363708, + "num_tokens": 25657610.0, + "step": 7550 + }, + { + "epoch": 0.07587618932915814, + "learning_rate": 0.00018482676944076438, + "loss": 0.7728, + "mean_token_accuracy": 0.7676181554794311, + "num_tokens": 25692063.0, + "step": 7560 + }, + { + "epoch": 0.07597655465895861, + "learning_rate": 0.0001848066963748043, + "loss": 0.7648, + "mean_token_accuracy": 0.7707294762134552, + "num_tokens": 25726717.0, + "step": 7570 + }, + { + "epoch": 0.07607691998875908, + "learning_rate": 0.0001847866233088442, + "loss": 0.8065, + "mean_token_accuracy": 0.7685012996196747, + "num_tokens": 25760066.0, + "step": 7580 + }, + { + "epoch": 0.07617728531855955, + "learning_rate": 0.0001847665502428841, + "loss": 0.8118, + "mean_token_accuracy": 0.7668388724327088, + "num_tokens": 25794087.0, + "step": 7590 + }, + { + "epoch": 0.07627765064836003, + "learning_rate": 0.00018474647717692401, + "loss": 0.8276, + "mean_token_accuracy": 0.7590035438537598, + "num_tokens": 25827788.0, + "step": 7600 + }, + { + "epoch": 0.0763780159781605, + "learning_rate": 0.00018472640411096392, + "loss": 0.7972, + "mean_token_accuracy": 0.7652108430862427, + "num_tokens": 25861486.0, + "step": 7610 + }, + { + "epoch": 0.07647838130796097, + "learning_rate": 0.00018470633104500383, + "loss": 0.7782, + "mean_token_accuracy": 0.7683241486549377, + "num_tokens": 25896175.0, + "step": 7620 + }, + { + "epoch": 0.07657874663776146, + "learning_rate": 0.00018468625797904374, + "loss": 0.7888, + "mean_token_accuracy": 0.7642484068870544, + "num_tokens": 25930565.0, + "step": 7630 + }, + { + "epoch": 0.07667911196756193, + "learning_rate": 0.00018466618491308362, + "loss": 0.8218, + "mean_token_accuracy": 0.7603274822235108, + "num_tokens": 25964200.0, + "step": 7640 + }, + { + "epoch": 0.0767794772973624, + "learning_rate": 0.00018464611184712356, + "loss": 0.7992, + "mean_token_accuracy": 0.7627223074436188, + "num_tokens": 25998157.0, + "step": 7650 + }, + { + "epoch": 0.07687984262716287, + "learning_rate": 0.00018462603878116344, + "loss": 0.8036, + "mean_token_accuracy": 0.7680601716041565, + "num_tokens": 26032645.0, + "step": 7660 + }, + { + "epoch": 0.07698020795696335, + "learning_rate": 0.00018460596571520335, + "loss": 0.7804, + "mean_token_accuracy": 0.7695116221904754, + "num_tokens": 26066749.0, + "step": 7670 + }, + { + "epoch": 0.07708057328676382, + "learning_rate": 0.00018458589264924325, + "loss": 0.8028, + "mean_token_accuracy": 0.7702985823154449, + "num_tokens": 26100853.0, + "step": 7680 + }, + { + "epoch": 0.07718093861656429, + "learning_rate": 0.00018456581958328316, + "loss": 0.7806, + "mean_token_accuracy": 0.7728835463523864, + "num_tokens": 26134719.0, + "step": 7690 + }, + { + "epoch": 0.07728130394636477, + "learning_rate": 0.00018454574651732307, + "loss": 0.7949, + "mean_token_accuracy": 0.7665352702140809, + "num_tokens": 26169126.0, + "step": 7700 + }, + { + "epoch": 0.07738166927616524, + "learning_rate": 0.00018452567345136298, + "loss": 0.7926, + "mean_token_accuracy": 0.7647746622562408, + "num_tokens": 26202249.0, + "step": 7710 + }, + { + "epoch": 0.07748203460596571, + "learning_rate": 0.0001845056003854029, + "loss": 0.8082, + "mean_token_accuracy": 0.7587997853755951, + "num_tokens": 26236838.0, + "step": 7720 + }, + { + "epoch": 0.07758239993576618, + "learning_rate": 0.00018448552731944277, + "loss": 0.7877, + "mean_token_accuracy": 0.7682729542255402, + "num_tokens": 26271047.0, + "step": 7730 + }, + { + "epoch": 0.07768276526556667, + "learning_rate": 0.0001844654542534827, + "loss": 0.825, + "mean_token_accuracy": 0.7565823674201966, + "num_tokens": 26305741.0, + "step": 7740 + }, + { + "epoch": 0.07778313059536714, + "learning_rate": 0.0001844453811875226, + "loss": 0.826, + "mean_token_accuracy": 0.7599569141864777, + "num_tokens": 26339915.0, + "step": 7750 + }, + { + "epoch": 0.0778834959251676, + "learning_rate": 0.0001844253081215625, + "loss": 0.7724, + "mean_token_accuracy": 0.7702906250953674, + "num_tokens": 26374166.0, + "step": 7760 + }, + { + "epoch": 0.07798386125496809, + "learning_rate": 0.0001844052350556024, + "loss": 0.7858, + "mean_token_accuracy": 0.769506961107254, + "num_tokens": 26407465.0, + "step": 7770 + }, + { + "epoch": 0.07808422658476856, + "learning_rate": 0.0001843851619896423, + "loss": 0.8037, + "mean_token_accuracy": 0.7590090334415436, + "num_tokens": 26441910.0, + "step": 7780 + }, + { + "epoch": 0.07818459191456903, + "learning_rate": 0.0001843650889236822, + "loss": 0.8069, + "mean_token_accuracy": 0.7618598759174346, + "num_tokens": 26475249.0, + "step": 7790 + }, + { + "epoch": 0.0782849572443695, + "learning_rate": 0.00018434501585772213, + "loss": 0.7804, + "mean_token_accuracy": 0.7672445714473725, + "num_tokens": 26510028.0, + "step": 7800 + }, + { + "epoch": 0.07838532257416998, + "learning_rate": 0.000184324942791762, + "loss": 0.821, + "mean_token_accuracy": 0.764594703912735, + "num_tokens": 26543386.0, + "step": 7810 + }, + { + "epoch": 0.07848568790397045, + "learning_rate": 0.00018430486972580192, + "loss": 0.8064, + "mean_token_accuracy": 0.7608125746250153, + "num_tokens": 26576560.0, + "step": 7820 + }, + { + "epoch": 0.07858605323377092, + "learning_rate": 0.00018428479665984183, + "loss": 0.8145, + "mean_token_accuracy": 0.7621243953704834, + "num_tokens": 26609899.0, + "step": 7830 + }, + { + "epoch": 0.0786864185635714, + "learning_rate": 0.00018426472359388174, + "loss": 0.7989, + "mean_token_accuracy": 0.7658592283725738, + "num_tokens": 26644506.0, + "step": 7840 + }, + { + "epoch": 0.07878678389337188, + "learning_rate": 0.00018424465052792164, + "loss": 0.7831, + "mean_token_accuracy": 0.7703222453594207, + "num_tokens": 26678803.0, + "step": 7850 + }, + { + "epoch": 0.07888714922317235, + "learning_rate": 0.00018422457746196155, + "loss": 0.7862, + "mean_token_accuracy": 0.7615216493606567, + "num_tokens": 26712506.0, + "step": 7860 + }, + { + "epoch": 0.07898751455297282, + "learning_rate": 0.00018420450439600146, + "loss": 0.7728, + "mean_token_accuracy": 0.7699089527130127, + "num_tokens": 26746081.0, + "step": 7870 + }, + { + "epoch": 0.0790878798827733, + "learning_rate": 0.00018418443133004134, + "loss": 0.7888, + "mean_token_accuracy": 0.7717827081680297, + "num_tokens": 26779973.0, + "step": 7880 + }, + { + "epoch": 0.07918824521257377, + "learning_rate": 0.00018416435826408128, + "loss": 0.8071, + "mean_token_accuracy": 0.7643128275871277, + "num_tokens": 26814769.0, + "step": 7890 + }, + { + "epoch": 0.07928861054237424, + "learning_rate": 0.00018414428519812116, + "loss": 0.7867, + "mean_token_accuracy": 0.7633980870246887, + "num_tokens": 26848312.0, + "step": 7900 + }, + { + "epoch": 0.07938897587217472, + "learning_rate": 0.00018412421213216107, + "loss": 0.8387, + "mean_token_accuracy": 0.7578362107276917, + "num_tokens": 26881942.0, + "step": 7910 + }, + { + "epoch": 0.07948934120197519, + "learning_rate": 0.00018410413906620098, + "loss": 0.8043, + "mean_token_accuracy": 0.7660013616085053, + "num_tokens": 26916642.0, + "step": 7920 + }, + { + "epoch": 0.07958970653177566, + "learning_rate": 0.00018408406600024088, + "loss": 0.7709, + "mean_token_accuracy": 0.7725791335105896, + "num_tokens": 26950942.0, + "step": 7930 + }, + { + "epoch": 0.07969007186157613, + "learning_rate": 0.0001840639929342808, + "loss": 0.8346, + "mean_token_accuracy": 0.7565326988697052, + "num_tokens": 26985030.0, + "step": 7940 + }, + { + "epoch": 0.07979043719137661, + "learning_rate": 0.0001840439198683207, + "loss": 0.781, + "mean_token_accuracy": 0.7720654487609864, + "num_tokens": 27018067.0, + "step": 7950 + }, + { + "epoch": 0.07989080252117708, + "learning_rate": 0.0001840238468023606, + "loss": 0.8246, + "mean_token_accuracy": 0.75545853972435, + "num_tokens": 27051615.0, + "step": 7960 + }, + { + "epoch": 0.07999116785097755, + "learning_rate": 0.0001840037737364005, + "loss": 0.8261, + "mean_token_accuracy": 0.7600622177124023, + "num_tokens": 27085181.0, + "step": 7970 + }, + { + "epoch": 0.08009153318077804, + "learning_rate": 0.00018398370067044043, + "loss": 0.814, + "mean_token_accuracy": 0.7612695872783661, + "num_tokens": 27119116.0, + "step": 7980 + }, + { + "epoch": 0.08019189851057851, + "learning_rate": 0.0001839636276044803, + "loss": 0.8058, + "mean_token_accuracy": 0.7696108520030975, + "num_tokens": 27154478.0, + "step": 7990 + }, + { + "epoch": 0.08029226384037898, + "learning_rate": 0.00018394355453852022, + "loss": 0.811, + "mean_token_accuracy": 0.7640083312988282, + "num_tokens": 27188890.0, + "step": 8000 + }, + { + "epoch": 0.08039262917017945, + "learning_rate": 0.00018392348147256012, + "loss": 0.8061, + "mean_token_accuracy": 0.7589396297931671, + "num_tokens": 27222650.0, + "step": 8010 + }, + { + "epoch": 0.08049299449997993, + "learning_rate": 0.00018390340840660003, + "loss": 0.8015, + "mean_token_accuracy": 0.7603662014007568, + "num_tokens": 27256163.0, + "step": 8020 + }, + { + "epoch": 0.0805933598297804, + "learning_rate": 0.00018388333534063994, + "loss": 0.8024, + "mean_token_accuracy": 0.766388326883316, + "num_tokens": 27289939.0, + "step": 8030 + }, + { + "epoch": 0.08069372515958087, + "learning_rate": 0.00018386326227467985, + "loss": 0.7853, + "mean_token_accuracy": 0.7673959374427796, + "num_tokens": 27324482.0, + "step": 8040 + }, + { + "epoch": 0.08079409048938135, + "learning_rate": 0.00018384318920871976, + "loss": 0.8211, + "mean_token_accuracy": 0.7607272922992706, + "num_tokens": 27358513.0, + "step": 8050 + }, + { + "epoch": 0.08089445581918182, + "learning_rate": 0.00018382311614275964, + "loss": 0.801, + "mean_token_accuracy": 0.7661828458309173, + "num_tokens": 27392044.0, + "step": 8060 + }, + { + "epoch": 0.0809948211489823, + "learning_rate": 0.00018380304307679958, + "loss": 0.8001, + "mean_token_accuracy": 0.7657620906829834, + "num_tokens": 27425618.0, + "step": 8070 + }, + { + "epoch": 0.08109518647878276, + "learning_rate": 0.00018378297001083946, + "loss": 0.7737, + "mean_token_accuracy": 0.773236620426178, + "num_tokens": 27460506.0, + "step": 8080 + }, + { + "epoch": 0.08119555180858325, + "learning_rate": 0.00018376289694487937, + "loss": 0.7914, + "mean_token_accuracy": 0.7647178828716278, + "num_tokens": 27494448.0, + "step": 8090 + }, + { + "epoch": 0.08129591713838372, + "learning_rate": 0.00018374282387891927, + "loss": 0.8235, + "mean_token_accuracy": 0.7590629518032074, + "num_tokens": 27529463.0, + "step": 8100 + }, + { + "epoch": 0.08139628246818419, + "learning_rate": 0.00018372275081295918, + "loss": 0.7411, + "mean_token_accuracy": 0.7821636378765107, + "num_tokens": 27564132.0, + "step": 8110 + }, + { + "epoch": 0.08149664779798467, + "learning_rate": 0.00018370267774699906, + "loss": 0.8074, + "mean_token_accuracy": 0.7685580670833587, + "num_tokens": 27597888.0, + "step": 8120 + }, + { + "epoch": 0.08159701312778514, + "learning_rate": 0.000183682604681039, + "loss": 0.8054, + "mean_token_accuracy": 0.765894103050232, + "num_tokens": 27631531.0, + "step": 8130 + }, + { + "epoch": 0.08169737845758561, + "learning_rate": 0.00018366253161507888, + "loss": 0.7771, + "mean_token_accuracy": 0.7699494779109954, + "num_tokens": 27665523.0, + "step": 8140 + }, + { + "epoch": 0.08179774378738608, + "learning_rate": 0.00018364245854911882, + "loss": 0.7586, + "mean_token_accuracy": 0.773178231716156, + "num_tokens": 27699754.0, + "step": 8150 + }, + { + "epoch": 0.08189810911718656, + "learning_rate": 0.0001836223854831587, + "loss": 0.7507, + "mean_token_accuracy": 0.7754209101200104, + "num_tokens": 27733210.0, + "step": 8160 + }, + { + "epoch": 0.08199847444698703, + "learning_rate": 0.0001836023124171986, + "loss": 0.7712, + "mean_token_accuracy": 0.7670442402362824, + "num_tokens": 27767777.0, + "step": 8170 + }, + { + "epoch": 0.0820988397767875, + "learning_rate": 0.00018358223935123851, + "loss": 0.8371, + "mean_token_accuracy": 0.7562036275863647, + "num_tokens": 27801779.0, + "step": 8180 + }, + { + "epoch": 0.08219920510658799, + "learning_rate": 0.00018356216628527842, + "loss": 0.7753, + "mean_token_accuracy": 0.7712762773036956, + "num_tokens": 27835493.0, + "step": 8190 + }, + { + "epoch": 0.08229957043638846, + "learning_rate": 0.00018354209321931833, + "loss": 0.7857, + "mean_token_accuracy": 0.7714332640171051, + "num_tokens": 27868848.0, + "step": 8200 + }, + { + "epoch": 0.08239993576618893, + "learning_rate": 0.00018352202015335824, + "loss": 0.7889, + "mean_token_accuracy": 0.764836972951889, + "num_tokens": 27902676.0, + "step": 8210 + }, + { + "epoch": 0.0825003010959894, + "learning_rate": 0.00018350194708739815, + "loss": 0.7917, + "mean_token_accuracy": 0.7639157354831696, + "num_tokens": 27936893.0, + "step": 8220 + }, + { + "epoch": 0.08260066642578988, + "learning_rate": 0.00018348187402143803, + "loss": 0.8124, + "mean_token_accuracy": 0.7611936211585999, + "num_tokens": 27971349.0, + "step": 8230 + }, + { + "epoch": 0.08270103175559035, + "learning_rate": 0.00018346180095547796, + "loss": 0.7885, + "mean_token_accuracy": 0.7635602414608001, + "num_tokens": 28005360.0, + "step": 8240 + }, + { + "epoch": 0.08280139708539082, + "learning_rate": 0.00018344172788951785, + "loss": 0.8182, + "mean_token_accuracy": 0.7626757025718689, + "num_tokens": 28039496.0, + "step": 8250 + }, + { + "epoch": 0.0829017624151913, + "learning_rate": 0.00018342165482355775, + "loss": 0.8021, + "mean_token_accuracy": 0.7612757861614228, + "num_tokens": 28073988.0, + "step": 8260 + }, + { + "epoch": 0.08300212774499177, + "learning_rate": 0.00018340158175759766, + "loss": 0.7705, + "mean_token_accuracy": 0.7759433329105377, + "num_tokens": 28108105.0, + "step": 8270 + }, + { + "epoch": 0.08310249307479224, + "learning_rate": 0.00018338150869163757, + "loss": 0.783, + "mean_token_accuracy": 0.7666752696037292, + "num_tokens": 28141570.0, + "step": 8280 + }, + { + "epoch": 0.08320285840459271, + "learning_rate": 0.00018336143562567748, + "loss": 0.7812, + "mean_token_accuracy": 0.7679860413074493, + "num_tokens": 28175667.0, + "step": 8290 + }, + { + "epoch": 0.0833032237343932, + "learning_rate": 0.0001833413625597174, + "loss": 0.7937, + "mean_token_accuracy": 0.771624231338501, + "num_tokens": 28209112.0, + "step": 8300 + }, + { + "epoch": 0.08340358906419366, + "learning_rate": 0.0001833212894937573, + "loss": 0.7765, + "mean_token_accuracy": 0.7699212431907654, + "num_tokens": 28242271.0, + "step": 8310 + }, + { + "epoch": 0.08350395439399413, + "learning_rate": 0.00018330121642779718, + "loss": 0.8077, + "mean_token_accuracy": 0.7627488255500794, + "num_tokens": 28275861.0, + "step": 8320 + }, + { + "epoch": 0.08360431972379462, + "learning_rate": 0.0001832811433618371, + "loss": 0.8258, + "mean_token_accuracy": 0.757368391752243, + "num_tokens": 28308668.0, + "step": 8330 + }, + { + "epoch": 0.08370468505359509, + "learning_rate": 0.000183261070295877, + "loss": 0.7845, + "mean_token_accuracy": 0.766782796382904, + "num_tokens": 28342565.0, + "step": 8340 + }, + { + "epoch": 0.08380505038339556, + "learning_rate": 0.0001832409972299169, + "loss": 0.7845, + "mean_token_accuracy": 0.7720321476459503, + "num_tokens": 28376767.0, + "step": 8350 + }, + { + "epoch": 0.08390541571319603, + "learning_rate": 0.0001832209241639568, + "loss": 0.7766, + "mean_token_accuracy": 0.7695994555950165, + "num_tokens": 28409804.0, + "step": 8360 + }, + { + "epoch": 0.08400578104299651, + "learning_rate": 0.00018320085109799672, + "loss": 0.815, + "mean_token_accuracy": 0.7584184944629669, + "num_tokens": 28444956.0, + "step": 8370 + }, + { + "epoch": 0.08410614637279698, + "learning_rate": 0.00018318077803203663, + "loss": 0.825, + "mean_token_accuracy": 0.7594221532344818, + "num_tokens": 28478777.0, + "step": 8380 + }, + { + "epoch": 0.08420651170259745, + "learning_rate": 0.00018316070496607654, + "loss": 0.8124, + "mean_token_accuracy": 0.761949211359024, + "num_tokens": 28513212.0, + "step": 8390 + }, + { + "epoch": 0.08430687703239793, + "learning_rate": 0.00018314063190011645, + "loss": 0.7748, + "mean_token_accuracy": 0.7677722752094269, + "num_tokens": 28547306.0, + "step": 8400 + }, + { + "epoch": 0.0844072423621984, + "learning_rate": 0.00018312055883415633, + "loss": 0.8043, + "mean_token_accuracy": 0.7592228293418884, + "num_tokens": 28580947.0, + "step": 8410 + }, + { + "epoch": 0.08450760769199887, + "learning_rate": 0.00018310048576819626, + "loss": 0.7855, + "mean_token_accuracy": 0.7644309282302857, + "num_tokens": 28615511.0, + "step": 8420 + }, + { + "epoch": 0.08460797302179934, + "learning_rate": 0.00018308041270223614, + "loss": 0.7721, + "mean_token_accuracy": 0.7723537027835846, + "num_tokens": 28650137.0, + "step": 8430 + }, + { + "epoch": 0.08470833835159983, + "learning_rate": 0.00018306033963627605, + "loss": 0.85, + "mean_token_accuracy": 0.7568152248859406, + "num_tokens": 28684894.0, + "step": 8440 + }, + { + "epoch": 0.0848087036814003, + "learning_rate": 0.00018304026657031596, + "loss": 0.7921, + "mean_token_accuracy": 0.766416597366333, + "num_tokens": 28718933.0, + "step": 8450 + }, + { + "epoch": 0.08490906901120077, + "learning_rate": 0.00018302019350435587, + "loss": 0.8001, + "mean_token_accuracy": 0.7644974291324615, + "num_tokens": 28752719.0, + "step": 8460 + }, + { + "epoch": 0.08500943434100125, + "learning_rate": 0.00018300012043839575, + "loss": 0.8108, + "mean_token_accuracy": 0.7660545587539673, + "num_tokens": 28787113.0, + "step": 8470 + }, + { + "epoch": 0.08510979967080172, + "learning_rate": 0.00018298004737243569, + "loss": 0.7598, + "mean_token_accuracy": 0.7736972510814667, + "num_tokens": 28821222.0, + "step": 8480 + }, + { + "epoch": 0.08521016500060219, + "learning_rate": 0.00018295997430647557, + "loss": 0.7866, + "mean_token_accuracy": 0.7729543089866638, + "num_tokens": 28855377.0, + "step": 8490 + }, + { + "epoch": 0.08531053033040266, + "learning_rate": 0.00018293990124051548, + "loss": 0.7669, + "mean_token_accuracy": 0.7719655096530914, + "num_tokens": 28889960.0, + "step": 8500 + }, + { + "epoch": 0.08541089566020314, + "learning_rate": 0.00018291982817455538, + "loss": 0.8095, + "mean_token_accuracy": 0.7601831316947937, + "num_tokens": 28924470.0, + "step": 8510 + }, + { + "epoch": 0.08551126099000361, + "learning_rate": 0.0001828997551085953, + "loss": 0.8041, + "mean_token_accuracy": 0.7582235693931579, + "num_tokens": 28957673.0, + "step": 8520 + }, + { + "epoch": 0.08561162631980408, + "learning_rate": 0.0001828796820426352, + "loss": 0.788, + "mean_token_accuracy": 0.7658786296844482, + "num_tokens": 28991285.0, + "step": 8530 + }, + { + "epoch": 0.08571199164960457, + "learning_rate": 0.0001828596089766751, + "loss": 0.7883, + "mean_token_accuracy": 0.766554594039917, + "num_tokens": 29025102.0, + "step": 8540 + }, + { + "epoch": 0.08581235697940504, + "learning_rate": 0.00018283953591071502, + "loss": 0.7781, + "mean_token_accuracy": 0.7628990948200226, + "num_tokens": 29059866.0, + "step": 8550 + }, + { + "epoch": 0.0859127223092055, + "learning_rate": 0.0001828194628447549, + "loss": 0.792, + "mean_token_accuracy": 0.7650415420532226, + "num_tokens": 29094399.0, + "step": 8560 + }, + { + "epoch": 0.08601308763900598, + "learning_rate": 0.00018279938977879483, + "loss": 0.8129, + "mean_token_accuracy": 0.7575330376625061, + "num_tokens": 29128148.0, + "step": 8570 + }, + { + "epoch": 0.08611345296880646, + "learning_rate": 0.00018277931671283472, + "loss": 0.8154, + "mean_token_accuracy": 0.7631605803966522, + "num_tokens": 29162146.0, + "step": 8580 + }, + { + "epoch": 0.08621381829860693, + "learning_rate": 0.00018275924364687462, + "loss": 0.7924, + "mean_token_accuracy": 0.7658519327640534, + "num_tokens": 29197231.0, + "step": 8590 + }, + { + "epoch": 0.0863141836284074, + "learning_rate": 0.00018273917058091453, + "loss": 0.7935, + "mean_token_accuracy": 0.7624973893165589, + "num_tokens": 29231195.0, + "step": 8600 + }, + { + "epoch": 0.08641454895820788, + "learning_rate": 0.00018271909751495444, + "loss": 0.8187, + "mean_token_accuracy": 0.7632297515869141, + "num_tokens": 29265717.0, + "step": 8610 + }, + { + "epoch": 0.08651491428800835, + "learning_rate": 0.00018269902444899435, + "loss": 0.7962, + "mean_token_accuracy": 0.7655292451381683, + "num_tokens": 29299063.0, + "step": 8620 + }, + { + "epoch": 0.08661527961780882, + "learning_rate": 0.00018267895138303426, + "loss": 0.779, + "mean_token_accuracy": 0.7777730166912079, + "num_tokens": 29333094.0, + "step": 8630 + }, + { + "epoch": 0.08671564494760929, + "learning_rate": 0.00018265887831707417, + "loss": 0.8155, + "mean_token_accuracy": 0.7669682502746582, + "num_tokens": 29367809.0, + "step": 8640 + }, + { + "epoch": 0.08681601027740977, + "learning_rate": 0.00018263880525111405, + "loss": 0.813, + "mean_token_accuracy": 0.7619749963283539, + "num_tokens": 29401517.0, + "step": 8650 + }, + { + "epoch": 0.08691637560721024, + "learning_rate": 0.00018261873218515398, + "loss": 0.7736, + "mean_token_accuracy": 0.7691554009914399, + "num_tokens": 29435888.0, + "step": 8660 + }, + { + "epoch": 0.08701674093701071, + "learning_rate": 0.00018259865911919386, + "loss": 0.7964, + "mean_token_accuracy": 0.7643998801708222, + "num_tokens": 29469495.0, + "step": 8670 + }, + { + "epoch": 0.0871171062668112, + "learning_rate": 0.00018257858605323377, + "loss": 0.803, + "mean_token_accuracy": 0.7638863921165466, + "num_tokens": 29503322.0, + "step": 8680 + }, + { + "epoch": 0.08721747159661167, + "learning_rate": 0.00018255851298727368, + "loss": 0.7765, + "mean_token_accuracy": 0.7672784090042114, + "num_tokens": 29537549.0, + "step": 8690 + }, + { + "epoch": 0.08731783692641214, + "learning_rate": 0.0001825384399213136, + "loss": 0.8106, + "mean_token_accuracy": 0.7580951035022736, + "num_tokens": 29572158.0, + "step": 8700 + }, + { + "epoch": 0.08741820225621261, + "learning_rate": 0.0001825183668553535, + "loss": 0.8063, + "mean_token_accuracy": 0.7586085200309753, + "num_tokens": 29606342.0, + "step": 8710 + }, + { + "epoch": 0.08751856758601309, + "learning_rate": 0.0001824982937893934, + "loss": 0.8092, + "mean_token_accuracy": 0.76483913064003, + "num_tokens": 29639627.0, + "step": 8720 + }, + { + "epoch": 0.08761893291581356, + "learning_rate": 0.00018247822072343332, + "loss": 0.7798, + "mean_token_accuracy": 0.7659261226654053, + "num_tokens": 29673673.0, + "step": 8730 + }, + { + "epoch": 0.08771929824561403, + "learning_rate": 0.00018245814765747322, + "loss": 0.773, + "mean_token_accuracy": 0.7755686104297638, + "num_tokens": 29707564.0, + "step": 8740 + }, + { + "epoch": 0.08781966357541451, + "learning_rate": 0.00018243807459151313, + "loss": 0.7927, + "mean_token_accuracy": 0.7612753689289093, + "num_tokens": 29741585.0, + "step": 8750 + }, + { + "epoch": 0.08792002890521498, + "learning_rate": 0.00018241800152555301, + "loss": 0.7785, + "mean_token_accuracy": 0.7699299335479737, + "num_tokens": 29775306.0, + "step": 8760 + }, + { + "epoch": 0.08802039423501545, + "learning_rate": 0.00018239792845959295, + "loss": 0.7927, + "mean_token_accuracy": 0.7664937555789948, + "num_tokens": 29808521.0, + "step": 8770 + }, + { + "epoch": 0.08812075956481592, + "learning_rate": 0.00018237785539363283, + "loss": 0.781, + "mean_token_accuracy": 0.7734834969043731, + "num_tokens": 29841888.0, + "step": 8780 + }, + { + "epoch": 0.0882211248946164, + "learning_rate": 0.00018235778232767274, + "loss": 0.7841, + "mean_token_accuracy": 0.7714802920818329, + "num_tokens": 29875937.0, + "step": 8790 + }, + { + "epoch": 0.08832149022441688, + "learning_rate": 0.00018233770926171265, + "loss": 0.7641, + "mean_token_accuracy": 0.7700235188007355, + "num_tokens": 29909628.0, + "step": 8800 + }, + { + "epoch": 0.08842185555421735, + "learning_rate": 0.00018231763619575256, + "loss": 0.7819, + "mean_token_accuracy": 0.7715400278568267, + "num_tokens": 29943880.0, + "step": 8810 + }, + { + "epoch": 0.08852222088401783, + "learning_rate": 0.00018229756312979244, + "loss": 0.7568, + "mean_token_accuracy": 0.7760605990886689, + "num_tokens": 29977827.0, + "step": 8820 + }, + { + "epoch": 0.0886225862138183, + "learning_rate": 0.00018227749006383237, + "loss": 0.7517, + "mean_token_accuracy": 0.780300235748291, + "num_tokens": 30011993.0, + "step": 8830 + }, + { + "epoch": 0.08872295154361877, + "learning_rate": 0.00018225741699787225, + "loss": 0.7856, + "mean_token_accuracy": 0.763048404455185, + "num_tokens": 30046264.0, + "step": 8840 + }, + { + "epoch": 0.08882331687341925, + "learning_rate": 0.00018223734393191216, + "loss": 0.8117, + "mean_token_accuracy": 0.7608951687812805, + "num_tokens": 30080946.0, + "step": 8850 + }, + { + "epoch": 0.08892368220321972, + "learning_rate": 0.00018221727086595207, + "loss": 0.7817, + "mean_token_accuracy": 0.7685857653617859, + "num_tokens": 30114139.0, + "step": 8860 + }, + { + "epoch": 0.08902404753302019, + "learning_rate": 0.00018219719779999198, + "loss": 0.7778, + "mean_token_accuracy": 0.7680936872959137, + "num_tokens": 30148943.0, + "step": 8870 + }, + { + "epoch": 0.08912441286282066, + "learning_rate": 0.0001821771247340319, + "loss": 0.7883, + "mean_token_accuracy": 0.7649091064929963, + "num_tokens": 30182765.0, + "step": 8880 + }, + { + "epoch": 0.08922477819262115, + "learning_rate": 0.0001821570516680718, + "loss": 0.7993, + "mean_token_accuracy": 0.7652966022491455, + "num_tokens": 30216428.0, + "step": 8890 + }, + { + "epoch": 0.08932514352242162, + "learning_rate": 0.0001821369786021117, + "loss": 0.805, + "mean_token_accuracy": 0.7664391279220581, + "num_tokens": 30249886.0, + "step": 8900 + }, + { + "epoch": 0.08942550885222209, + "learning_rate": 0.00018211690553615159, + "loss": 0.7606, + "mean_token_accuracy": 0.7713489532470703, + "num_tokens": 30284478.0, + "step": 8910 + }, + { + "epoch": 0.08952587418202257, + "learning_rate": 0.00018209683247019152, + "loss": 0.8324, + "mean_token_accuracy": 0.7595540165901185, + "num_tokens": 30318152.0, + "step": 8920 + }, + { + "epoch": 0.08962623951182304, + "learning_rate": 0.0001820767594042314, + "loss": 0.8069, + "mean_token_accuracy": 0.7607889533042907, + "num_tokens": 30352097.0, + "step": 8930 + }, + { + "epoch": 0.08972660484162351, + "learning_rate": 0.0001820566863382713, + "loss": 0.7659, + "mean_token_accuracy": 0.7716902375221253, + "num_tokens": 30386993.0, + "step": 8940 + }, + { + "epoch": 0.08982697017142398, + "learning_rate": 0.00018203661327231122, + "loss": 0.8017, + "mean_token_accuracy": 0.7665991187095642, + "num_tokens": 30421404.0, + "step": 8950 + }, + { + "epoch": 0.08992733550122446, + "learning_rate": 0.00018201654020635113, + "loss": 0.8137, + "mean_token_accuracy": 0.7588241100311279, + "num_tokens": 30455514.0, + "step": 8960 + }, + { + "epoch": 0.09002770083102493, + "learning_rate": 0.00018199646714039104, + "loss": 0.7789, + "mean_token_accuracy": 0.7674042224884033, + "num_tokens": 30488335.0, + "step": 8970 + }, + { + "epoch": 0.0901280661608254, + "learning_rate": 0.00018197639407443094, + "loss": 0.7598, + "mean_token_accuracy": 0.7746587514877319, + "num_tokens": 30522594.0, + "step": 8980 + }, + { + "epoch": 0.09022843149062588, + "learning_rate": 0.00018195632100847085, + "loss": 0.7845, + "mean_token_accuracy": 0.7681942880153656, + "num_tokens": 30556175.0, + "step": 8990 + }, + { + "epoch": 0.09032879682042635, + "learning_rate": 0.00018193624794251073, + "loss": 0.8158, + "mean_token_accuracy": 0.7650823891162872, + "num_tokens": 30590301.0, + "step": 9000 + }, + { + "epoch": 0.09042916215022682, + "learning_rate": 0.00018191617487655067, + "loss": 0.7983, + "mean_token_accuracy": 0.7667717099189758, + "num_tokens": 30624330.0, + "step": 9010 + }, + { + "epoch": 0.0905295274800273, + "learning_rate": 0.00018189610181059055, + "loss": 0.7941, + "mean_token_accuracy": 0.7668941855430603, + "num_tokens": 30658103.0, + "step": 9020 + }, + { + "epoch": 0.09062989280982778, + "learning_rate": 0.00018187602874463046, + "loss": 0.7656, + "mean_token_accuracy": 0.7736150443553924, + "num_tokens": 30692457.0, + "step": 9030 + }, + { + "epoch": 0.09073025813962825, + "learning_rate": 0.00018185595567867037, + "loss": 0.8097, + "mean_token_accuracy": 0.7703277707099915, + "num_tokens": 30725813.0, + "step": 9040 + }, + { + "epoch": 0.09083062346942872, + "learning_rate": 0.00018183588261271028, + "loss": 0.7845, + "mean_token_accuracy": 0.7693876445293426, + "num_tokens": 30760046.0, + "step": 9050 + }, + { + "epoch": 0.0909309887992292, + "learning_rate": 0.00018181580954675016, + "loss": 0.7914, + "mean_token_accuracy": 0.7648736119270325, + "num_tokens": 30794043.0, + "step": 9060 + }, + { + "epoch": 0.09103135412902967, + "learning_rate": 0.0001817957364807901, + "loss": 0.7953, + "mean_token_accuracy": 0.7657828867435456, + "num_tokens": 30827493.0, + "step": 9070 + }, + { + "epoch": 0.09113171945883014, + "learning_rate": 0.00018177566341482998, + "loss": 0.7707, + "mean_token_accuracy": 0.7668934762477875, + "num_tokens": 30861987.0, + "step": 9080 + }, + { + "epoch": 0.09123208478863061, + "learning_rate": 0.00018175559034886988, + "loss": 0.847, + "mean_token_accuracy": 0.7515221536159515, + "num_tokens": 30895773.0, + "step": 9090 + }, + { + "epoch": 0.0913324501184311, + "learning_rate": 0.00018173551728290982, + "loss": 0.7897, + "mean_token_accuracy": 0.7714468240737915, + "num_tokens": 30930474.0, + "step": 9100 + }, + { + "epoch": 0.09143281544823156, + "learning_rate": 0.0001817154442169497, + "loss": 0.7664, + "mean_token_accuracy": 0.7724806427955627, + "num_tokens": 30964582.0, + "step": 9110 + }, + { + "epoch": 0.09153318077803203, + "learning_rate": 0.0001816953711509896, + "loss": 0.7767, + "mean_token_accuracy": 0.7632918655872345, + "num_tokens": 30998736.0, + "step": 9120 + }, + { + "epoch": 0.09163354610783252, + "learning_rate": 0.00018167529808502952, + "loss": 0.8133, + "mean_token_accuracy": 0.7608244955539704, + "num_tokens": 31033467.0, + "step": 9130 + }, + { + "epoch": 0.09173391143763299, + "learning_rate": 0.00018165522501906943, + "loss": 0.7775, + "mean_token_accuracy": 0.7722931623458862, + "num_tokens": 31067147.0, + "step": 9140 + }, + { + "epoch": 0.09183427676743346, + "learning_rate": 0.0001816351519531093, + "loss": 0.787, + "mean_token_accuracy": 0.7637144982814789, + "num_tokens": 31101075.0, + "step": 9150 + }, + { + "epoch": 0.09193464209723393, + "learning_rate": 0.00018161507888714924, + "loss": 0.8038, + "mean_token_accuracy": 0.7647253572940826, + "num_tokens": 31134763.0, + "step": 9160 + }, + { + "epoch": 0.09203500742703441, + "learning_rate": 0.00018159500582118912, + "loss": 0.7955, + "mean_token_accuracy": 0.7666331231594086, + "num_tokens": 31169302.0, + "step": 9170 + }, + { + "epoch": 0.09213537275683488, + "learning_rate": 0.00018157493275522903, + "loss": 0.7631, + "mean_token_accuracy": 0.7757180273532868, + "num_tokens": 31203530.0, + "step": 9180 + }, + { + "epoch": 0.09223573808663535, + "learning_rate": 0.00018155485968926894, + "loss": 0.7848, + "mean_token_accuracy": 0.7622224748134613, + "num_tokens": 31237590.0, + "step": 9190 + }, + { + "epoch": 0.09233610341643583, + "learning_rate": 0.00018153478662330885, + "loss": 0.8142, + "mean_token_accuracy": 0.7676658689975738, + "num_tokens": 31272006.0, + "step": 9200 + }, + { + "epoch": 0.0924364687462363, + "learning_rate": 0.00018151471355734876, + "loss": 0.7727, + "mean_token_accuracy": 0.768430107831955, + "num_tokens": 31306088.0, + "step": 9210 + }, + { + "epoch": 0.09253683407603677, + "learning_rate": 0.00018149464049138867, + "loss": 0.7906, + "mean_token_accuracy": 0.7649446725845337, + "num_tokens": 31339380.0, + "step": 9220 + }, + { + "epoch": 0.09263719940583724, + "learning_rate": 0.00018147456742542857, + "loss": 0.8076, + "mean_token_accuracy": 0.768731153011322, + "num_tokens": 31374097.0, + "step": 9230 + }, + { + "epoch": 0.09273756473563773, + "learning_rate": 0.00018145449435946846, + "loss": 0.7783, + "mean_token_accuracy": 0.7694973766803741, + "num_tokens": 31407852.0, + "step": 9240 + }, + { + "epoch": 0.0928379300654382, + "learning_rate": 0.0001814344212935084, + "loss": 0.785, + "mean_token_accuracy": 0.7713075160980225, + "num_tokens": 31441940.0, + "step": 9250 + }, + { + "epoch": 0.09293829539523867, + "learning_rate": 0.00018141434822754827, + "loss": 0.7901, + "mean_token_accuracy": 0.7695594906806946, + "num_tokens": 31476335.0, + "step": 9260 + }, + { + "epoch": 0.09303866072503915, + "learning_rate": 0.00018139427516158818, + "loss": 0.7791, + "mean_token_accuracy": 0.7696987748146057, + "num_tokens": 31510293.0, + "step": 9270 + }, + { + "epoch": 0.09313902605483962, + "learning_rate": 0.0001813742020956281, + "loss": 0.7658, + "mean_token_accuracy": 0.770842558145523, + "num_tokens": 31543727.0, + "step": 9280 + }, + { + "epoch": 0.09323939138464009, + "learning_rate": 0.000181354129029668, + "loss": 0.7833, + "mean_token_accuracy": 0.7661703586578369, + "num_tokens": 31577350.0, + "step": 9290 + }, + { + "epoch": 0.09333975671444056, + "learning_rate": 0.0001813340559637079, + "loss": 0.8069, + "mean_token_accuracy": 0.7651128113269806, + "num_tokens": 31611382.0, + "step": 9300 + }, + { + "epoch": 0.09344012204424104, + "learning_rate": 0.00018131398289774781, + "loss": 0.788, + "mean_token_accuracy": 0.7651427328586579, + "num_tokens": 31645425.0, + "step": 9310 + }, + { + "epoch": 0.09354048737404151, + "learning_rate": 0.00018129390983178772, + "loss": 0.7876, + "mean_token_accuracy": 0.763335132598877, + "num_tokens": 31679613.0, + "step": 9320 + }, + { + "epoch": 0.09364085270384198, + "learning_rate": 0.00018127383676582763, + "loss": 0.7858, + "mean_token_accuracy": 0.7680640757083893, + "num_tokens": 31713418.0, + "step": 9330 + }, + { + "epoch": 0.09374121803364246, + "learning_rate": 0.00018125376369986754, + "loss": 0.7791, + "mean_token_accuracy": 0.7704873025417328, + "num_tokens": 31747103.0, + "step": 9340 + }, + { + "epoch": 0.09384158336344293, + "learning_rate": 0.00018123369063390742, + "loss": 0.7988, + "mean_token_accuracy": 0.7634690701961517, + "num_tokens": 31780966.0, + "step": 9350 + }, + { + "epoch": 0.0939419486932434, + "learning_rate": 0.00018121361756794736, + "loss": 0.8216, + "mean_token_accuracy": 0.7603338420391083, + "num_tokens": 31814446.0, + "step": 9360 + }, + { + "epoch": 0.09404231402304387, + "learning_rate": 0.00018119354450198724, + "loss": 0.7842, + "mean_token_accuracy": 0.7677425026893616, + "num_tokens": 31849355.0, + "step": 9370 + }, + { + "epoch": 0.09414267935284436, + "learning_rate": 0.00018117347143602715, + "loss": 0.7905, + "mean_token_accuracy": 0.768053936958313, + "num_tokens": 31883524.0, + "step": 9380 + }, + { + "epoch": 0.09424304468264483, + "learning_rate": 0.00018115339837006706, + "loss": 0.818, + "mean_token_accuracy": 0.7665216565132141, + "num_tokens": 31916837.0, + "step": 9390 + }, + { + "epoch": 0.0943434100124453, + "learning_rate": 0.00018113332530410696, + "loss": 0.7615, + "mean_token_accuracy": 0.7733565986156463, + "num_tokens": 31950958.0, + "step": 9400 + }, + { + "epoch": 0.09444377534224578, + "learning_rate": 0.00018111325223814685, + "loss": 0.8145, + "mean_token_accuracy": 0.7630878150463104, + "num_tokens": 31985483.0, + "step": 9410 + }, + { + "epoch": 0.09454414067204625, + "learning_rate": 0.00018109317917218678, + "loss": 0.7871, + "mean_token_accuracy": 0.7698763608932495, + "num_tokens": 32019177.0, + "step": 9420 + }, + { + "epoch": 0.09464450600184672, + "learning_rate": 0.00018107310610622666, + "loss": 0.797, + "mean_token_accuracy": 0.7613940715789795, + "num_tokens": 32052859.0, + "step": 9430 + }, + { + "epoch": 0.09474487133164719, + "learning_rate": 0.00018105303304026657, + "loss": 0.7935, + "mean_token_accuracy": 0.7656313002109527, + "num_tokens": 32086478.0, + "step": 9440 + }, + { + "epoch": 0.09484523666144767, + "learning_rate": 0.0001810329599743065, + "loss": 0.8287, + "mean_token_accuracy": 0.7582162857055664, + "num_tokens": 32120084.0, + "step": 9450 + }, + { + "epoch": 0.09494560199124814, + "learning_rate": 0.0001810128869083464, + "loss": 0.7766, + "mean_token_accuracy": 0.7686365067958831, + "num_tokens": 32154693.0, + "step": 9460 + }, + { + "epoch": 0.09504596732104861, + "learning_rate": 0.0001809928138423863, + "loss": 0.8127, + "mean_token_accuracy": 0.7605416655540467, + "num_tokens": 32188248.0, + "step": 9470 + }, + { + "epoch": 0.0951463326508491, + "learning_rate": 0.0001809727407764262, + "loss": 0.7957, + "mean_token_accuracy": 0.7632535398006439, + "num_tokens": 32222370.0, + "step": 9480 + }, + { + "epoch": 0.09524669798064957, + "learning_rate": 0.0001809526677104661, + "loss": 0.7844, + "mean_token_accuracy": 0.7648251771926879, + "num_tokens": 32256138.0, + "step": 9490 + }, + { + "epoch": 0.09534706331045004, + "learning_rate": 0.000180932594644506, + "loss": 0.7997, + "mean_token_accuracy": 0.7668353676795959, + "num_tokens": 32290337.0, + "step": 9500 + }, + { + "epoch": 0.0954474286402505, + "learning_rate": 0.00018091252157854593, + "loss": 0.7716, + "mean_token_accuracy": 0.7700516879558563, + "num_tokens": 32324631.0, + "step": 9510 + }, + { + "epoch": 0.09554779397005099, + "learning_rate": 0.0001808924485125858, + "loss": 0.7645, + "mean_token_accuracy": 0.7741646885871887, + "num_tokens": 32358596.0, + "step": 9520 + }, + { + "epoch": 0.09564815929985146, + "learning_rate": 0.00018087237544662572, + "loss": 0.7946, + "mean_token_accuracy": 0.7669793128967285, + "num_tokens": 32393177.0, + "step": 9530 + }, + { + "epoch": 0.09574852462965193, + "learning_rate": 0.00018085230238066563, + "loss": 0.7961, + "mean_token_accuracy": 0.7640884757041931, + "num_tokens": 32427640.0, + "step": 9540 + }, + { + "epoch": 0.09584888995945241, + "learning_rate": 0.00018083222931470554, + "loss": 0.7889, + "mean_token_accuracy": 0.76604523062706, + "num_tokens": 32462185.0, + "step": 9550 + }, + { + "epoch": 0.09594925528925288, + "learning_rate": 0.00018081215624874544, + "loss": 0.7562, + "mean_token_accuracy": 0.7752231001853943, + "num_tokens": 32496524.0, + "step": 9560 + }, + { + "epoch": 0.09604962061905335, + "learning_rate": 0.00018079208318278535, + "loss": 0.7754, + "mean_token_accuracy": 0.7691753149032593, + "num_tokens": 32530189.0, + "step": 9570 + }, + { + "epoch": 0.09614998594885382, + "learning_rate": 0.00018077201011682526, + "loss": 0.7747, + "mean_token_accuracy": 0.7719720363616943, + "num_tokens": 32564461.0, + "step": 9580 + }, + { + "epoch": 0.0962503512786543, + "learning_rate": 0.00018075193705086514, + "loss": 0.7645, + "mean_token_accuracy": 0.7691185414791107, + "num_tokens": 32598437.0, + "step": 9590 + }, + { + "epoch": 0.09635071660845478, + "learning_rate": 0.00018073186398490508, + "loss": 0.8126, + "mean_token_accuracy": 0.7618482708930969, + "num_tokens": 32632841.0, + "step": 9600 + }, + { + "epoch": 0.09645108193825525, + "learning_rate": 0.00018071179091894496, + "loss": 0.8236, + "mean_token_accuracy": 0.7573092579841614, + "num_tokens": 32667525.0, + "step": 9610 + }, + { + "epoch": 0.09655144726805573, + "learning_rate": 0.00018069171785298487, + "loss": 0.7857, + "mean_token_accuracy": 0.7663219451904297, + "num_tokens": 32701330.0, + "step": 9620 + }, + { + "epoch": 0.0966518125978562, + "learning_rate": 0.00018067164478702478, + "loss": 0.7591, + "mean_token_accuracy": 0.7785889625549316, + "num_tokens": 32736175.0, + "step": 9630 + }, + { + "epoch": 0.09675217792765667, + "learning_rate": 0.00018065157172106468, + "loss": 0.7752, + "mean_token_accuracy": 0.7701292335987091, + "num_tokens": 32769996.0, + "step": 9640 + }, + { + "epoch": 0.09685254325745714, + "learning_rate": 0.0001806314986551046, + "loss": 0.7483, + "mean_token_accuracy": 0.7770219802856445, + "num_tokens": 32803281.0, + "step": 9650 + }, + { + "epoch": 0.09695290858725762, + "learning_rate": 0.0001806114255891445, + "loss": 0.7839, + "mean_token_accuracy": 0.769777649641037, + "num_tokens": 32837087.0, + "step": 9660 + }, + { + "epoch": 0.09705327391705809, + "learning_rate": 0.0001805913525231844, + "loss": 0.7771, + "mean_token_accuracy": 0.7717701971530915, + "num_tokens": 32871869.0, + "step": 9670 + }, + { + "epoch": 0.09715363924685856, + "learning_rate": 0.0001805712794572243, + "loss": 0.7861, + "mean_token_accuracy": 0.7715424120426178, + "num_tokens": 32905679.0, + "step": 9680 + }, + { + "epoch": 0.09725400457665904, + "learning_rate": 0.00018055120639126423, + "loss": 0.7865, + "mean_token_accuracy": 0.7647394895553589, + "num_tokens": 32939742.0, + "step": 9690 + }, + { + "epoch": 0.09735436990645951, + "learning_rate": 0.0001805311333253041, + "loss": 0.787, + "mean_token_accuracy": 0.7655929684638977, + "num_tokens": 32974249.0, + "step": 9700 + }, + { + "epoch": 0.09745473523625998, + "learning_rate": 0.00018051106025934402, + "loss": 0.8307, + "mean_token_accuracy": 0.7551734566688537, + "num_tokens": 33007680.0, + "step": 9710 + }, + { + "epoch": 0.09755510056606045, + "learning_rate": 0.00018049098719338393, + "loss": 0.7873, + "mean_token_accuracy": 0.7685339212417602, + "num_tokens": 33041980.0, + "step": 9720 + }, + { + "epoch": 0.09765546589586094, + "learning_rate": 0.00018047091412742383, + "loss": 0.7787, + "mean_token_accuracy": 0.7710682153701782, + "num_tokens": 33077135.0, + "step": 9730 + }, + { + "epoch": 0.09775583122566141, + "learning_rate": 0.00018045084106146372, + "loss": 0.7827, + "mean_token_accuracy": 0.7675726175308227, + "num_tokens": 33110794.0, + "step": 9740 + }, + { + "epoch": 0.09785619655546188, + "learning_rate": 0.00018043076799550365, + "loss": 0.8017, + "mean_token_accuracy": 0.7666629195213318, + "num_tokens": 33144064.0, + "step": 9750 + }, + { + "epoch": 0.09795656188526236, + "learning_rate": 0.00018041069492954353, + "loss": 0.7768, + "mean_token_accuracy": 0.7662809491157532, + "num_tokens": 33178610.0, + "step": 9760 + }, + { + "epoch": 0.09805692721506283, + "learning_rate": 0.00018039062186358344, + "loss": 0.7484, + "mean_token_accuracy": 0.7748051345348358, + "num_tokens": 33211709.0, + "step": 9770 + }, + { + "epoch": 0.0981572925448633, + "learning_rate": 0.00018037054879762335, + "loss": 0.8243, + "mean_token_accuracy": 0.7520861685276031, + "num_tokens": 33245552.0, + "step": 9780 + }, + { + "epoch": 0.09825765787466377, + "learning_rate": 0.00018035047573166326, + "loss": 0.7679, + "mean_token_accuracy": 0.771792608499527, + "num_tokens": 33280308.0, + "step": 9790 + }, + { + "epoch": 0.09835802320446425, + "learning_rate": 0.00018033040266570317, + "loss": 0.7574, + "mean_token_accuracy": 0.7754374146461487, + "num_tokens": 33313523.0, + "step": 9800 + }, + { + "epoch": 0.09845838853426472, + "learning_rate": 0.00018031032959974307, + "loss": 0.7779, + "mean_token_accuracy": 0.7665438055992126, + "num_tokens": 33348278.0, + "step": 9810 + }, + { + "epoch": 0.0985587538640652, + "learning_rate": 0.00018029025653378298, + "loss": 0.7522, + "mean_token_accuracy": 0.7775404155254364, + "num_tokens": 33383632.0, + "step": 9820 + }, + { + "epoch": 0.09865911919386568, + "learning_rate": 0.00018027018346782286, + "loss": 0.7928, + "mean_token_accuracy": 0.7668094635009766, + "num_tokens": 33418353.0, + "step": 9830 + }, + { + "epoch": 0.09875948452366615, + "learning_rate": 0.0001802501104018628, + "loss": 0.8022, + "mean_token_accuracy": 0.7708871126174927, + "num_tokens": 33452423.0, + "step": 9840 + }, + { + "epoch": 0.09885984985346662, + "learning_rate": 0.00018023003733590268, + "loss": 0.7816, + "mean_token_accuracy": 0.7649633705615997, + "num_tokens": 33486446.0, + "step": 9850 + }, + { + "epoch": 0.09896021518326709, + "learning_rate": 0.00018020996426994262, + "loss": 0.8215, + "mean_token_accuracy": 0.7617051899433136, + "num_tokens": 33519984.0, + "step": 9860 + }, + { + "epoch": 0.09906058051306757, + "learning_rate": 0.0001801898912039825, + "loss": 0.8101, + "mean_token_accuracy": 0.7568509519100189, + "num_tokens": 33554988.0, + "step": 9870 + }, + { + "epoch": 0.09916094584286804, + "learning_rate": 0.0001801698181380224, + "loss": 0.7937, + "mean_token_accuracy": 0.7650300979614257, + "num_tokens": 33589544.0, + "step": 9880 + }, + { + "epoch": 0.09926131117266851, + "learning_rate": 0.00018014974507206231, + "loss": 0.7901, + "mean_token_accuracy": 0.7662486851215362, + "num_tokens": 33623148.0, + "step": 9890 + }, + { + "epoch": 0.09936167650246899, + "learning_rate": 0.00018012967200610222, + "loss": 0.7486, + "mean_token_accuracy": 0.770133638381958, + "num_tokens": 33657576.0, + "step": 9900 + }, + { + "epoch": 0.09946204183226946, + "learning_rate": 0.00018010959894014213, + "loss": 0.8253, + "mean_token_accuracy": 0.7663521468639374, + "num_tokens": 33691433.0, + "step": 9910 + }, + { + "epoch": 0.09956240716206993, + "learning_rate": 0.00018008952587418204, + "loss": 0.8082, + "mean_token_accuracy": 0.7643501996994019, + "num_tokens": 33725430.0, + "step": 9920 + }, + { + "epoch": 0.0996627724918704, + "learning_rate": 0.00018006945280822195, + "loss": 0.7961, + "mean_token_accuracy": 0.7636694729328155, + "num_tokens": 33759779.0, + "step": 9930 + }, + { + "epoch": 0.09976313782167089, + "learning_rate": 0.00018004937974226183, + "loss": 0.7872, + "mean_token_accuracy": 0.7669819295406342, + "num_tokens": 33794158.0, + "step": 9940 + }, + { + "epoch": 0.09986350315147136, + "learning_rate": 0.00018002930667630177, + "loss": 0.757, + "mean_token_accuracy": 0.7733592569828034, + "num_tokens": 33828132.0, + "step": 9950 + }, + { + "epoch": 0.09996386848127183, + "learning_rate": 0.00018000923361034165, + "loss": 0.7771, + "mean_token_accuracy": 0.7673372983932495, + "num_tokens": 33862552.0, + "step": 9960 + }, + { + "epoch": 0.10006423381107231, + "learning_rate": 0.00017998916054438155, + "loss": 0.8106, + "mean_token_accuracy": 0.7603930771350861, + "num_tokens": 33895266.0, + "step": 9970 + }, + { + "epoch": 0.10016459914087278, + "learning_rate": 0.00017996908747842146, + "loss": 0.7752, + "mean_token_accuracy": 0.7717368602752686, + "num_tokens": 33928639.0, + "step": 9980 + }, + { + "epoch": 0.10026496447067325, + "learning_rate": 0.00017994901441246137, + "loss": 0.7536, + "mean_token_accuracy": 0.7732951700687408, + "num_tokens": 33962493.0, + "step": 9990 + }, + { + "epoch": 0.10036532980047372, + "learning_rate": 0.00017992894134650128, + "loss": 0.7912, + "mean_token_accuracy": 0.7701098620891571, + "num_tokens": 33995585.0, + "step": 10000 + }, + { + "epoch": 0.1004656951302742, + "learning_rate": 0.0001799088682805412, + "loss": 0.8131, + "mean_token_accuracy": 0.7622293293476105, + "num_tokens": 34029514.0, + "step": 10010 + }, + { + "epoch": 0.10056606046007467, + "learning_rate": 0.0001798887952145811, + "loss": 0.7735, + "mean_token_accuracy": 0.7684919655323028, + "num_tokens": 34062780.0, + "step": 10020 + }, + { + "epoch": 0.10066642578987514, + "learning_rate": 0.00017986872214862098, + "loss": 0.766, + "mean_token_accuracy": 0.7764488875865936, + "num_tokens": 34096411.0, + "step": 10030 + }, + { + "epoch": 0.10076679111967562, + "learning_rate": 0.00017984864908266091, + "loss": 0.7748, + "mean_token_accuracy": 0.7689181506633759, + "num_tokens": 34130781.0, + "step": 10040 + }, + { + "epoch": 0.1008671564494761, + "learning_rate": 0.0001798285760167008, + "loss": 0.8258, + "mean_token_accuracy": 0.7614941120147705, + "num_tokens": 34164604.0, + "step": 10050 + }, + { + "epoch": 0.10096752177927656, + "learning_rate": 0.0001798085029507407, + "loss": 0.8176, + "mean_token_accuracy": 0.7642528653144837, + "num_tokens": 34198526.0, + "step": 10060 + }, + { + "epoch": 0.10106788710907703, + "learning_rate": 0.0001797884298847806, + "loss": 0.8101, + "mean_token_accuracy": 0.7603436768054962, + "num_tokens": 34232408.0, + "step": 10070 + }, + { + "epoch": 0.10116825243887752, + "learning_rate": 0.00017976835681882052, + "loss": 0.8015, + "mean_token_accuracy": 0.7639372229576111, + "num_tokens": 34266649.0, + "step": 10080 + }, + { + "epoch": 0.10126861776867799, + "learning_rate": 0.0001797482837528604, + "loss": 0.7727, + "mean_token_accuracy": 0.7697113692760468, + "num_tokens": 34300849.0, + "step": 10090 + }, + { + "epoch": 0.10136898309847846, + "learning_rate": 0.00017972821068690034, + "loss": 0.7529, + "mean_token_accuracy": 0.7766829371452332, + "num_tokens": 34335580.0, + "step": 10100 + }, + { + "epoch": 0.10146934842827894, + "learning_rate": 0.00017970813762094022, + "loss": 0.8069, + "mean_token_accuracy": 0.7638198852539062, + "num_tokens": 34370229.0, + "step": 10110 + }, + { + "epoch": 0.10156971375807941, + "learning_rate": 0.00017968806455498013, + "loss": 0.7881, + "mean_token_accuracy": 0.7672926723957062, + "num_tokens": 34404429.0, + "step": 10120 + }, + { + "epoch": 0.10167007908787988, + "learning_rate": 0.00017966799148902004, + "loss": 0.7835, + "mean_token_accuracy": 0.7664349377155304, + "num_tokens": 34437979.0, + "step": 10130 + }, + { + "epoch": 0.10177044441768035, + "learning_rate": 0.00017964791842305994, + "loss": 0.8127, + "mean_token_accuracy": 0.758906751871109, + "num_tokens": 34472067.0, + "step": 10140 + }, + { + "epoch": 0.10187080974748083, + "learning_rate": 0.00017962784535709985, + "loss": 0.7766, + "mean_token_accuracy": 0.7701891541481019, + "num_tokens": 34506834.0, + "step": 10150 + }, + { + "epoch": 0.1019711750772813, + "learning_rate": 0.00017960777229113976, + "loss": 0.7671, + "mean_token_accuracy": 0.7738985598087311, + "num_tokens": 34542076.0, + "step": 10160 + }, + { + "epoch": 0.10207154040708177, + "learning_rate": 0.00017958769922517967, + "loss": 0.7977, + "mean_token_accuracy": 0.7637203812599183, + "num_tokens": 34576739.0, + "step": 10170 + }, + { + "epoch": 0.10217190573688226, + "learning_rate": 0.00017956762615921955, + "loss": 0.7948, + "mean_token_accuracy": 0.7669504582881927, + "num_tokens": 34610972.0, + "step": 10180 + }, + { + "epoch": 0.10227227106668273, + "learning_rate": 0.00017954755309325949, + "loss": 0.74, + "mean_token_accuracy": 0.7822540640830994, + "num_tokens": 34645218.0, + "step": 10190 + }, + { + "epoch": 0.1023726363964832, + "learning_rate": 0.00017952748002729937, + "loss": 0.7851, + "mean_token_accuracy": 0.7663270890712738, + "num_tokens": 34679317.0, + "step": 10200 + }, + { + "epoch": 0.10247300172628367, + "learning_rate": 0.00017950740696133928, + "loss": 0.7438, + "mean_token_accuracy": 0.782097053527832, + "num_tokens": 34713589.0, + "step": 10210 + }, + { + "epoch": 0.10257336705608415, + "learning_rate": 0.00017948733389537918, + "loss": 0.7882, + "mean_token_accuracy": 0.7661328732967376, + "num_tokens": 34747582.0, + "step": 10220 + }, + { + "epoch": 0.10267373238588462, + "learning_rate": 0.0001794672608294191, + "loss": 0.7566, + "mean_token_accuracy": 0.7741984486579895, + "num_tokens": 34781547.0, + "step": 10230 + }, + { + "epoch": 0.10277409771568509, + "learning_rate": 0.000179447187763459, + "loss": 0.8143, + "mean_token_accuracy": 0.7658887326717376, + "num_tokens": 34815953.0, + "step": 10240 + }, + { + "epoch": 0.10287446304548557, + "learning_rate": 0.0001794271146974989, + "loss": 0.7885, + "mean_token_accuracy": 0.7683747112751007, + "num_tokens": 34849623.0, + "step": 10250 + }, + { + "epoch": 0.10297482837528604, + "learning_rate": 0.00017940704163153882, + "loss": 0.7784, + "mean_token_accuracy": 0.7713934361934662, + "num_tokens": 34883376.0, + "step": 10260 + }, + { + "epoch": 0.10307519370508651, + "learning_rate": 0.0001793869685655787, + "loss": 0.7724, + "mean_token_accuracy": 0.7745378196239472, + "num_tokens": 34917673.0, + "step": 10270 + }, + { + "epoch": 0.10317555903488698, + "learning_rate": 0.00017936689549961864, + "loss": 0.7647, + "mean_token_accuracy": 0.7662047564983367, + "num_tokens": 34951154.0, + "step": 10280 + }, + { + "epoch": 0.10327592436468747, + "learning_rate": 0.00017934682243365852, + "loss": 0.8227, + "mean_token_accuracy": 0.7628067374229431, + "num_tokens": 34985037.0, + "step": 10290 + }, + { + "epoch": 0.10337628969448794, + "learning_rate": 0.00017932674936769842, + "loss": 0.7846, + "mean_token_accuracy": 0.7674853265285492, + "num_tokens": 35018599.0, + "step": 10300 + }, + { + "epoch": 0.1034766550242884, + "learning_rate": 0.00017930667630173833, + "loss": 0.785, + "mean_token_accuracy": 0.7672294676303864, + "num_tokens": 35052701.0, + "step": 10310 + }, + { + "epoch": 0.10357702035408889, + "learning_rate": 0.00017928660323577824, + "loss": 0.7519, + "mean_token_accuracy": 0.7754966616630554, + "num_tokens": 35086618.0, + "step": 10320 + }, + { + "epoch": 0.10367738568388936, + "learning_rate": 0.00017926653016981812, + "loss": 0.7699, + "mean_token_accuracy": 0.771609491109848, + "num_tokens": 35120506.0, + "step": 10330 + }, + { + "epoch": 0.10377775101368983, + "learning_rate": 0.00017924645710385806, + "loss": 0.7826, + "mean_token_accuracy": 0.7697823762893676, + "num_tokens": 35154462.0, + "step": 10340 + }, + { + "epoch": 0.1038781163434903, + "learning_rate": 0.00017922638403789797, + "loss": 0.8021, + "mean_token_accuracy": 0.7638498783111572, + "num_tokens": 35188876.0, + "step": 10350 + }, + { + "epoch": 0.10397848167329078, + "learning_rate": 0.00017920631097193785, + "loss": 0.7639, + "mean_token_accuracy": 0.772318959236145, + "num_tokens": 35222612.0, + "step": 10360 + }, + { + "epoch": 0.10407884700309125, + "learning_rate": 0.00017918623790597778, + "loss": 0.7741, + "mean_token_accuracy": 0.7691188335418702, + "num_tokens": 35256951.0, + "step": 10370 + }, + { + "epoch": 0.10417921233289172, + "learning_rate": 0.00017916616484001767, + "loss": 0.7602, + "mean_token_accuracy": 0.7751318573951721, + "num_tokens": 35291125.0, + "step": 10380 + }, + { + "epoch": 0.1042795776626922, + "learning_rate": 0.00017914609177405757, + "loss": 0.8093, + "mean_token_accuracy": 0.7600766003131867, + "num_tokens": 35325526.0, + "step": 10390 + }, + { + "epoch": 0.10437994299249267, + "learning_rate": 0.00017912601870809748, + "loss": 0.7839, + "mean_token_accuracy": 0.770651638507843, + "num_tokens": 35359603.0, + "step": 10400 + }, + { + "epoch": 0.10448030832229314, + "learning_rate": 0.0001791059456421374, + "loss": 0.8134, + "mean_token_accuracy": 0.7629783511161804, + "num_tokens": 35394005.0, + "step": 10410 + }, + { + "epoch": 0.10458067365209361, + "learning_rate": 0.0001790858725761773, + "loss": 0.7882, + "mean_token_accuracy": 0.7687924087047577, + "num_tokens": 35427765.0, + "step": 10420 + }, + { + "epoch": 0.1046810389818941, + "learning_rate": 0.0001790657995102172, + "loss": 0.7628, + "mean_token_accuracy": 0.7761599898338318, + "num_tokens": 35462276.0, + "step": 10430 + }, + { + "epoch": 0.10478140431169457, + "learning_rate": 0.0001790457264442571, + "loss": 0.7984, + "mean_token_accuracy": 0.7601453244686127, + "num_tokens": 35495851.0, + "step": 10440 + }, + { + "epoch": 0.10488176964149504, + "learning_rate": 0.00017902565337829702, + "loss": 0.7783, + "mean_token_accuracy": 0.7701234340667724, + "num_tokens": 35529293.0, + "step": 10450 + }, + { + "epoch": 0.10498213497129552, + "learning_rate": 0.0001790055803123369, + "loss": 0.8224, + "mean_token_accuracy": 0.7610841393470764, + "num_tokens": 35562951.0, + "step": 10460 + }, + { + "epoch": 0.10508250030109599, + "learning_rate": 0.00017898550724637681, + "loss": 0.7961, + "mean_token_accuracy": 0.7697411417961121, + "num_tokens": 35596293.0, + "step": 10470 + }, + { + "epoch": 0.10518286563089646, + "learning_rate": 0.00017896543418041672, + "loss": 0.7798, + "mean_token_accuracy": 0.7662987589836121, + "num_tokens": 35630647.0, + "step": 10480 + }, + { + "epoch": 0.10528323096069693, + "learning_rate": 0.00017894536111445663, + "loss": 0.7993, + "mean_token_accuracy": 0.7630761504173279, + "num_tokens": 35665123.0, + "step": 10490 + }, + { + "epoch": 0.10538359629049741, + "learning_rate": 0.00017892528804849654, + "loss": 0.7891, + "mean_token_accuracy": 0.7697969257831574, + "num_tokens": 35699146.0, + "step": 10500 + }, + { + "epoch": 0.10548396162029788, + "learning_rate": 0.00017890521498253645, + "loss": 0.7781, + "mean_token_accuracy": 0.7654927611351013, + "num_tokens": 35733136.0, + "step": 10510 + }, + { + "epoch": 0.10558432695009835, + "learning_rate": 0.00017888514191657636, + "loss": 0.795, + "mean_token_accuracy": 0.7694994390010834, + "num_tokens": 35767045.0, + "step": 10520 + }, + { + "epoch": 0.10568469227989884, + "learning_rate": 0.00017886506885061624, + "loss": 0.7664, + "mean_token_accuracy": 0.7748150587081909, + "num_tokens": 35799958.0, + "step": 10530 + }, + { + "epoch": 0.1057850576096993, + "learning_rate": 0.00017884499578465617, + "loss": 0.773, + "mean_token_accuracy": 0.7681718349456788, + "num_tokens": 35835426.0, + "step": 10540 + }, + { + "epoch": 0.10588542293949978, + "learning_rate": 0.00017882492271869605, + "loss": 0.7709, + "mean_token_accuracy": 0.7701553642749787, + "num_tokens": 35870072.0, + "step": 10550 + }, + { + "epoch": 0.10598578826930025, + "learning_rate": 0.00017880484965273596, + "loss": 0.7635, + "mean_token_accuracy": 0.7779048621654511, + "num_tokens": 35903911.0, + "step": 10560 + }, + { + "epoch": 0.10608615359910073, + "learning_rate": 0.00017878477658677587, + "loss": 0.7711, + "mean_token_accuracy": 0.7651203393936157, + "num_tokens": 35937883.0, + "step": 10570 + }, + { + "epoch": 0.1061865189289012, + "learning_rate": 0.00017876470352081578, + "loss": 0.7576, + "mean_token_accuracy": 0.7720681846141815, + "num_tokens": 35971773.0, + "step": 10580 + }, + { + "epoch": 0.10628688425870167, + "learning_rate": 0.0001787446304548557, + "loss": 0.7987, + "mean_token_accuracy": 0.7652650296688079, + "num_tokens": 36005676.0, + "step": 10590 + }, + { + "epoch": 0.10638724958850215, + "learning_rate": 0.0001787245573888956, + "loss": 0.7918, + "mean_token_accuracy": 0.7614519000053406, + "num_tokens": 36040256.0, + "step": 10600 + }, + { + "epoch": 0.10648761491830262, + "learning_rate": 0.0001787044843229355, + "loss": 0.7874, + "mean_token_accuracy": 0.7717543840408325, + "num_tokens": 36074289.0, + "step": 10610 + }, + { + "epoch": 0.10658798024810309, + "learning_rate": 0.00017868441125697539, + "loss": 0.7797, + "mean_token_accuracy": 0.7678600788116455, + "num_tokens": 36108241.0, + "step": 10620 + }, + { + "epoch": 0.10668834557790356, + "learning_rate": 0.00017866433819101532, + "loss": 0.7728, + "mean_token_accuracy": 0.7684706568717956, + "num_tokens": 36142590.0, + "step": 10630 + }, + { + "epoch": 0.10678871090770405, + "learning_rate": 0.0001786442651250552, + "loss": 0.7741, + "mean_token_accuracy": 0.7725037276744843, + "num_tokens": 36176355.0, + "step": 10640 + }, + { + "epoch": 0.10688907623750452, + "learning_rate": 0.0001786241920590951, + "loss": 0.7625, + "mean_token_accuracy": 0.7765066862106323, + "num_tokens": 36210760.0, + "step": 10650 + }, + { + "epoch": 0.10698944156730499, + "learning_rate": 0.00017860411899313502, + "loss": 0.8049, + "mean_token_accuracy": 0.7634962856769562, + "num_tokens": 36245787.0, + "step": 10660 + }, + { + "epoch": 0.10708980689710547, + "learning_rate": 0.00017858404592717493, + "loss": 0.7719, + "mean_token_accuracy": 0.7657606959342956, + "num_tokens": 36279324.0, + "step": 10670 + }, + { + "epoch": 0.10719017222690594, + "learning_rate": 0.0001785639728612148, + "loss": 0.7691, + "mean_token_accuracy": 0.7721742331981659, + "num_tokens": 36313393.0, + "step": 10680 + }, + { + "epoch": 0.10729053755670641, + "learning_rate": 0.00017854389979525475, + "loss": 0.7626, + "mean_token_accuracy": 0.7692029237747192, + "num_tokens": 36347216.0, + "step": 10690 + }, + { + "epoch": 0.10739090288650688, + "learning_rate": 0.00017852382672929465, + "loss": 0.8148, + "mean_token_accuracy": 0.7642192721366883, + "num_tokens": 36381240.0, + "step": 10700 + }, + { + "epoch": 0.10749126821630736, + "learning_rate": 0.00017850375366333454, + "loss": 0.7572, + "mean_token_accuracy": 0.7711041688919067, + "num_tokens": 36415161.0, + "step": 10710 + }, + { + "epoch": 0.10759163354610783, + "learning_rate": 0.00017848368059737447, + "loss": 0.7795, + "mean_token_accuracy": 0.7689418256282806, + "num_tokens": 36450114.0, + "step": 10720 + }, + { + "epoch": 0.1076919988759083, + "learning_rate": 0.00017846360753141435, + "loss": 0.7732, + "mean_token_accuracy": 0.764790666103363, + "num_tokens": 36483827.0, + "step": 10730 + }, + { + "epoch": 0.10779236420570878, + "learning_rate": 0.00017844353446545426, + "loss": 0.8257, + "mean_token_accuracy": 0.7528440475463867, + "num_tokens": 36518401.0, + "step": 10740 + }, + { + "epoch": 0.10789272953550925, + "learning_rate": 0.00017842346139949417, + "loss": 0.799, + "mean_token_accuracy": 0.7689604461193085, + "num_tokens": 36552415.0, + "step": 10750 + }, + { + "epoch": 0.10799309486530972, + "learning_rate": 0.00017840338833353408, + "loss": 0.7553, + "mean_token_accuracy": 0.7767434477806091, + "num_tokens": 36585872.0, + "step": 10760 + }, + { + "epoch": 0.1080934601951102, + "learning_rate": 0.00017838331526757396, + "loss": 0.785, + "mean_token_accuracy": 0.7629287362098693, + "num_tokens": 36620050.0, + "step": 10770 + }, + { + "epoch": 0.10819382552491068, + "learning_rate": 0.0001783632422016139, + "loss": 0.7585, + "mean_token_accuracy": 0.7698633432388305, + "num_tokens": 36653788.0, + "step": 10780 + }, + { + "epoch": 0.10829419085471115, + "learning_rate": 0.00017834316913565378, + "loss": 0.8034, + "mean_token_accuracy": 0.7642245471477509, + "num_tokens": 36687477.0, + "step": 10790 + }, + { + "epoch": 0.10839455618451162, + "learning_rate": 0.00017832309606969368, + "loss": 0.7852, + "mean_token_accuracy": 0.7684082210063934, + "num_tokens": 36721177.0, + "step": 10800 + }, + { + "epoch": 0.1084949215143121, + "learning_rate": 0.0001783030230037336, + "loss": 0.7901, + "mean_token_accuracy": 0.7634345769882203, + "num_tokens": 36754202.0, + "step": 10810 + }, + { + "epoch": 0.10859528684411257, + "learning_rate": 0.0001782829499377735, + "loss": 0.784, + "mean_token_accuracy": 0.7708740293979645, + "num_tokens": 36788811.0, + "step": 10820 + }, + { + "epoch": 0.10869565217391304, + "learning_rate": 0.0001782628768718134, + "loss": 0.782, + "mean_token_accuracy": 0.7696825981140136, + "num_tokens": 36822957.0, + "step": 10830 + }, + { + "epoch": 0.10879601750371352, + "learning_rate": 0.00017824280380585332, + "loss": 0.775, + "mean_token_accuracy": 0.7708654582500458, + "num_tokens": 36858058.0, + "step": 10840 + }, + { + "epoch": 0.108896382833514, + "learning_rate": 0.00017822273073989323, + "loss": 0.7599, + "mean_token_accuracy": 0.7714969336986541, + "num_tokens": 36891877.0, + "step": 10850 + }, + { + "epoch": 0.10899674816331446, + "learning_rate": 0.0001782026576739331, + "loss": 0.7899, + "mean_token_accuracy": 0.7672240257263183, + "num_tokens": 36926216.0, + "step": 10860 + }, + { + "epoch": 0.10909711349311493, + "learning_rate": 0.00017818258460797304, + "loss": 0.7896, + "mean_token_accuracy": 0.7663983047008515, + "num_tokens": 36960170.0, + "step": 10870 + }, + { + "epoch": 0.10919747882291542, + "learning_rate": 0.00017816251154201292, + "loss": 0.7492, + "mean_token_accuracy": 0.7793428659439087, + "num_tokens": 36994234.0, + "step": 10880 + }, + { + "epoch": 0.10929784415271589, + "learning_rate": 0.00017814243847605283, + "loss": 0.7637, + "mean_token_accuracy": 0.7706003427505493, + "num_tokens": 37027842.0, + "step": 10890 + }, + { + "epoch": 0.10939820948251636, + "learning_rate": 0.00017812236541009274, + "loss": 0.788, + "mean_token_accuracy": 0.7689258813858032, + "num_tokens": 37062157.0, + "step": 10900 + }, + { + "epoch": 0.10949857481231684, + "learning_rate": 0.00017810229234413265, + "loss": 0.7415, + "mean_token_accuracy": 0.7800822496414185, + "num_tokens": 37096416.0, + "step": 10910 + }, + { + "epoch": 0.10959894014211731, + "learning_rate": 0.00017808221927817256, + "loss": 0.7996, + "mean_token_accuracy": 0.7646092355251313, + "num_tokens": 37129570.0, + "step": 10920 + }, + { + "epoch": 0.10969930547191778, + "learning_rate": 0.00017806214621221247, + "loss": 0.7887, + "mean_token_accuracy": 0.7637861371040344, + "num_tokens": 37163649.0, + "step": 10930 + }, + { + "epoch": 0.10979967080171825, + "learning_rate": 0.00017804207314625237, + "loss": 0.7577, + "mean_token_accuracy": 0.7768438696861267, + "num_tokens": 37197267.0, + "step": 10940 + }, + { + "epoch": 0.10990003613151873, + "learning_rate": 0.00017802200008029226, + "loss": 0.8056, + "mean_token_accuracy": 0.7628251135349273, + "num_tokens": 37231308.0, + "step": 10950 + }, + { + "epoch": 0.1100004014613192, + "learning_rate": 0.0001780019270143322, + "loss": 0.7858, + "mean_token_accuracy": 0.7645903825759888, + "num_tokens": 37264848.0, + "step": 10960 + }, + { + "epoch": 0.11010076679111967, + "learning_rate": 0.00017798185394837207, + "loss": 0.7817, + "mean_token_accuracy": 0.7644063472747803, + "num_tokens": 37298911.0, + "step": 10970 + }, + { + "epoch": 0.11020113212092016, + "learning_rate": 0.000177961780882412, + "loss": 0.785, + "mean_token_accuracy": 0.7657126247882843, + "num_tokens": 37332105.0, + "step": 10980 + }, + { + "epoch": 0.11030149745072063, + "learning_rate": 0.0001779417078164519, + "loss": 0.7851, + "mean_token_accuracy": 0.7642782807350159, + "num_tokens": 37366442.0, + "step": 10990 + }, + { + "epoch": 0.1104018627805211, + "learning_rate": 0.0001779216347504918, + "loss": 0.7621, + "mean_token_accuracy": 0.7642432451248169, + "num_tokens": 37400575.0, + "step": 11000 + }, + { + "epoch": 0.11050222811032157, + "learning_rate": 0.0001779015616845317, + "loss": 0.7885, + "mean_token_accuracy": 0.7645276188850403, + "num_tokens": 37434658.0, + "step": 11010 + }, + { + "epoch": 0.11060259344012205, + "learning_rate": 0.00017788148861857162, + "loss": 0.8082, + "mean_token_accuracy": 0.7625736057758331, + "num_tokens": 37469762.0, + "step": 11020 + }, + { + "epoch": 0.11070295876992252, + "learning_rate": 0.0001778614155526115, + "loss": 0.7881, + "mean_token_accuracy": 0.7737322926521302, + "num_tokens": 37504309.0, + "step": 11030 + }, + { + "epoch": 0.11080332409972299, + "learning_rate": 0.00017784134248665143, + "loss": 0.7881, + "mean_token_accuracy": 0.7622285485267639, + "num_tokens": 37537634.0, + "step": 11040 + }, + { + "epoch": 0.11090368942952347, + "learning_rate": 0.00017782126942069134, + "loss": 0.7971, + "mean_token_accuracy": 0.7630579233169555, + "num_tokens": 37571291.0, + "step": 11050 + }, + { + "epoch": 0.11100405475932394, + "learning_rate": 0.00017780119635473122, + "loss": 0.7835, + "mean_token_accuracy": 0.7660659909248352, + "num_tokens": 37605243.0, + "step": 11060 + }, + { + "epoch": 0.11110442008912441, + "learning_rate": 0.00017778112328877116, + "loss": 0.7883, + "mean_token_accuracy": 0.7664074063301086, + "num_tokens": 37638583.0, + "step": 11070 + }, + { + "epoch": 0.11120478541892488, + "learning_rate": 0.00017776105022281104, + "loss": 0.8163, + "mean_token_accuracy": 0.7627486288547516, + "num_tokens": 37672756.0, + "step": 11080 + }, + { + "epoch": 0.11130515074872536, + "learning_rate": 0.00017774097715685095, + "loss": 0.7845, + "mean_token_accuracy": 0.7649985313415527, + "num_tokens": 37706226.0, + "step": 11090 + }, + { + "epoch": 0.11140551607852583, + "learning_rate": 0.00017772090409089086, + "loss": 0.7781, + "mean_token_accuracy": 0.7736667335033417, + "num_tokens": 37739816.0, + "step": 11100 + }, + { + "epoch": 0.1115058814083263, + "learning_rate": 0.00017770083102493076, + "loss": 0.7798, + "mean_token_accuracy": 0.7703223526477814, + "num_tokens": 37774363.0, + "step": 11110 + }, + { + "epoch": 0.11160624673812679, + "learning_rate": 0.00017768075795897065, + "loss": 0.7972, + "mean_token_accuracy": 0.7607849955558776, + "num_tokens": 37809032.0, + "step": 11120 + }, + { + "epoch": 0.11170661206792726, + "learning_rate": 0.00017766068489301058, + "loss": 0.7755, + "mean_token_accuracy": 0.773020726442337, + "num_tokens": 37843114.0, + "step": 11130 + }, + { + "epoch": 0.11180697739772773, + "learning_rate": 0.00017764061182705046, + "loss": 0.8009, + "mean_token_accuracy": 0.7607036411762238, + "num_tokens": 37876581.0, + "step": 11140 + }, + { + "epoch": 0.1119073427275282, + "learning_rate": 0.00017762053876109037, + "loss": 0.7588, + "mean_token_accuracy": 0.7713505566120148, + "num_tokens": 37911079.0, + "step": 11150 + }, + { + "epoch": 0.11200770805732868, + "learning_rate": 0.00017760046569513028, + "loss": 0.8049, + "mean_token_accuracy": 0.7616325080394745, + "num_tokens": 37945303.0, + "step": 11160 + }, + { + "epoch": 0.11210807338712915, + "learning_rate": 0.0001775803926291702, + "loss": 0.8093, + "mean_token_accuracy": 0.7597049415111542, + "num_tokens": 37978943.0, + "step": 11170 + }, + { + "epoch": 0.11220843871692962, + "learning_rate": 0.0001775603195632101, + "loss": 0.7977, + "mean_token_accuracy": 0.7681370735168457, + "num_tokens": 38013071.0, + "step": 11180 + }, + { + "epoch": 0.1123088040467301, + "learning_rate": 0.00017754024649725, + "loss": 0.8246, + "mean_token_accuracy": 0.7641762137413025, + "num_tokens": 38046353.0, + "step": 11190 + }, + { + "epoch": 0.11240916937653057, + "learning_rate": 0.0001775201734312899, + "loss": 0.8302, + "mean_token_accuracy": 0.7551983535289765, + "num_tokens": 38079892.0, + "step": 11200 + }, + { + "epoch": 0.11250953470633104, + "learning_rate": 0.0001775001003653298, + "loss": 0.7994, + "mean_token_accuracy": 0.7642681956291199, + "num_tokens": 38113690.0, + "step": 11210 + }, + { + "epoch": 0.11260990003613151, + "learning_rate": 0.00017748002729936973, + "loss": 0.7823, + "mean_token_accuracy": 0.7686408400535584, + "num_tokens": 38147364.0, + "step": 11220 + }, + { + "epoch": 0.112710265365932, + "learning_rate": 0.0001774599542334096, + "loss": 0.7785, + "mean_token_accuracy": 0.7673284769058227, + "num_tokens": 38181641.0, + "step": 11230 + }, + { + "epoch": 0.11281063069573247, + "learning_rate": 0.00017743988116744952, + "loss": 0.7671, + "mean_token_accuracy": 0.7764685571193695, + "num_tokens": 38215665.0, + "step": 11240 + }, + { + "epoch": 0.11291099602553294, + "learning_rate": 0.00017741980810148943, + "loss": 0.8261, + "mean_token_accuracy": 0.7562175869941712, + "num_tokens": 38250324.0, + "step": 11250 + }, + { + "epoch": 0.11301136135533342, + "learning_rate": 0.00017739973503552934, + "loss": 0.75, + "mean_token_accuracy": 0.7702659010887146, + "num_tokens": 38284395.0, + "step": 11260 + }, + { + "epoch": 0.11311172668513389, + "learning_rate": 0.00017737966196956924, + "loss": 0.8218, + "mean_token_accuracy": 0.7622061729431152, + "num_tokens": 38318500.0, + "step": 11270 + }, + { + "epoch": 0.11321209201493436, + "learning_rate": 0.00017735958890360915, + "loss": 0.7934, + "mean_token_accuracy": 0.7680340647697449, + "num_tokens": 38352413.0, + "step": 11280 + }, + { + "epoch": 0.11331245734473483, + "learning_rate": 0.00017733951583764906, + "loss": 0.7642, + "mean_token_accuracy": 0.7741311669349671, + "num_tokens": 38385939.0, + "step": 11290 + }, + { + "epoch": 0.11341282267453531, + "learning_rate": 0.00017731944277168894, + "loss": 0.7932, + "mean_token_accuracy": 0.7647429883480072, + "num_tokens": 38420540.0, + "step": 11300 + }, + { + "epoch": 0.11351318800433578, + "learning_rate": 0.00017729936970572888, + "loss": 0.8164, + "mean_token_accuracy": 0.7598032474517822, + "num_tokens": 38454312.0, + "step": 11310 + }, + { + "epoch": 0.11361355333413625, + "learning_rate": 0.00017727929663976876, + "loss": 0.7763, + "mean_token_accuracy": 0.7746975064277649, + "num_tokens": 38488831.0, + "step": 11320 + }, + { + "epoch": 0.11371391866393674, + "learning_rate": 0.00017725922357380867, + "loss": 0.7958, + "mean_token_accuracy": 0.7677113354206085, + "num_tokens": 38521896.0, + "step": 11330 + }, + { + "epoch": 0.1138142839937372, + "learning_rate": 0.00017723915050784858, + "loss": 0.7477, + "mean_token_accuracy": 0.7796377956867218, + "num_tokens": 38556722.0, + "step": 11340 + }, + { + "epoch": 0.11391464932353768, + "learning_rate": 0.00017721907744188849, + "loss": 0.7595, + "mean_token_accuracy": 0.7726167142391205, + "num_tokens": 38591405.0, + "step": 11350 + }, + { + "epoch": 0.11401501465333815, + "learning_rate": 0.00017719900437592837, + "loss": 0.7673, + "mean_token_accuracy": 0.7699409604072571, + "num_tokens": 38625518.0, + "step": 11360 + }, + { + "epoch": 0.11411537998313863, + "learning_rate": 0.0001771789313099683, + "loss": 0.7798, + "mean_token_accuracy": 0.7713293433189392, + "num_tokens": 38659584.0, + "step": 11370 + }, + { + "epoch": 0.1142157453129391, + "learning_rate": 0.00017715885824400818, + "loss": 0.7973, + "mean_token_accuracy": 0.7608528554439544, + "num_tokens": 38693605.0, + "step": 11380 + }, + { + "epoch": 0.11431611064273957, + "learning_rate": 0.0001771387851780481, + "loss": 0.8145, + "mean_token_accuracy": 0.766344141960144, + "num_tokens": 38728476.0, + "step": 11390 + }, + { + "epoch": 0.11441647597254005, + "learning_rate": 0.00017711871211208803, + "loss": 0.7791, + "mean_token_accuracy": 0.7720429956912994, + "num_tokens": 38762922.0, + "step": 11400 + }, + { + "epoch": 0.11451684130234052, + "learning_rate": 0.0001770986390461279, + "loss": 0.7659, + "mean_token_accuracy": 0.7721791803836823, + "num_tokens": 38796838.0, + "step": 11410 + }, + { + "epoch": 0.11461720663214099, + "learning_rate": 0.00017707856598016782, + "loss": 0.7609, + "mean_token_accuracy": 0.7671987414360046, + "num_tokens": 38830903.0, + "step": 11420 + }, + { + "epoch": 0.11471757196194146, + "learning_rate": 0.00017705849291420773, + "loss": 0.795, + "mean_token_accuracy": 0.7672559738159179, + "num_tokens": 38865312.0, + "step": 11430 + }, + { + "epoch": 0.11481793729174194, + "learning_rate": 0.00017703841984824763, + "loss": 0.7741, + "mean_token_accuracy": 0.7725123465061188, + "num_tokens": 38900004.0, + "step": 11440 + }, + { + "epoch": 0.11491830262154241, + "learning_rate": 0.00017701834678228752, + "loss": 0.7713, + "mean_token_accuracy": 0.7691251873970032, + "num_tokens": 38934537.0, + "step": 11450 + }, + { + "epoch": 0.11501866795134288, + "learning_rate": 0.00017699827371632745, + "loss": 0.7772, + "mean_token_accuracy": 0.7705145180225372, + "num_tokens": 38967988.0, + "step": 11460 + }, + { + "epoch": 0.11511903328114337, + "learning_rate": 0.00017697820065036733, + "loss": 0.756, + "mean_token_accuracy": 0.7800585031509399, + "num_tokens": 39001441.0, + "step": 11470 + }, + { + "epoch": 0.11521939861094384, + "learning_rate": 0.00017695812758440724, + "loss": 0.768, + "mean_token_accuracy": 0.7769594490528107, + "num_tokens": 39034929.0, + "step": 11480 + }, + { + "epoch": 0.11531976394074431, + "learning_rate": 0.00017693805451844715, + "loss": 0.7913, + "mean_token_accuracy": 0.7646923243999482, + "num_tokens": 39068092.0, + "step": 11490 + }, + { + "epoch": 0.11542012927054478, + "learning_rate": 0.00017691798145248706, + "loss": 0.7768, + "mean_token_accuracy": 0.7709584832191467, + "num_tokens": 39101540.0, + "step": 11500 + }, + { + "epoch": 0.11552049460034526, + "learning_rate": 0.00017689790838652697, + "loss": 0.8017, + "mean_token_accuracy": 0.7663677096366882, + "num_tokens": 39136047.0, + "step": 11510 + }, + { + "epoch": 0.11562085993014573, + "learning_rate": 0.00017687783532056687, + "loss": 0.7653, + "mean_token_accuracy": 0.7705176889896392, + "num_tokens": 39169501.0, + "step": 11520 + }, + { + "epoch": 0.1157212252599462, + "learning_rate": 0.00017685776225460678, + "loss": 0.8023, + "mean_token_accuracy": 0.7634245574474334, + "num_tokens": 39203477.0, + "step": 11530 + }, + { + "epoch": 0.11582159058974668, + "learning_rate": 0.00017683768918864666, + "loss": 0.7639, + "mean_token_accuracy": 0.7677269458770752, + "num_tokens": 39238060.0, + "step": 11540 + }, + { + "epoch": 0.11592195591954715, + "learning_rate": 0.0001768176161226866, + "loss": 0.7859, + "mean_token_accuracy": 0.7660326838493348, + "num_tokens": 39271841.0, + "step": 11550 + }, + { + "epoch": 0.11602232124934762, + "learning_rate": 0.00017679754305672648, + "loss": 0.7583, + "mean_token_accuracy": 0.7717775106430054, + "num_tokens": 39306606.0, + "step": 11560 + }, + { + "epoch": 0.1161226865791481, + "learning_rate": 0.00017677746999076642, + "loss": 0.7661, + "mean_token_accuracy": 0.7701225757598877, + "num_tokens": 39339475.0, + "step": 11570 + }, + { + "epoch": 0.11622305190894858, + "learning_rate": 0.0001767573969248063, + "loss": 0.7757, + "mean_token_accuracy": 0.7728428721427918, + "num_tokens": 39374240.0, + "step": 11580 + }, + { + "epoch": 0.11632341723874905, + "learning_rate": 0.0001767373238588462, + "loss": 0.7842, + "mean_token_accuracy": 0.7713092923164367, + "num_tokens": 39408018.0, + "step": 11590 + }, + { + "epoch": 0.11642378256854952, + "learning_rate": 0.00017671725079288611, + "loss": 0.7551, + "mean_token_accuracy": 0.7804297387599946, + "num_tokens": 39442330.0, + "step": 11600 + }, + { + "epoch": 0.11652414789835, + "learning_rate": 0.00017669717772692602, + "loss": 0.7865, + "mean_token_accuracy": 0.7714122951030731, + "num_tokens": 39475806.0, + "step": 11610 + }, + { + "epoch": 0.11662451322815047, + "learning_rate": 0.00017667710466096593, + "loss": 0.793, + "mean_token_accuracy": 0.766773521900177, + "num_tokens": 39510580.0, + "step": 11620 + }, + { + "epoch": 0.11672487855795094, + "learning_rate": 0.00017665703159500584, + "loss": 0.747, + "mean_token_accuracy": 0.7717756271362305, + "num_tokens": 39544057.0, + "step": 11630 + }, + { + "epoch": 0.11682524388775141, + "learning_rate": 0.00017663695852904575, + "loss": 0.7983, + "mean_token_accuracy": 0.7713942110538483, + "num_tokens": 39578119.0, + "step": 11640 + }, + { + "epoch": 0.11692560921755189, + "learning_rate": 0.00017661688546308563, + "loss": 0.7699, + "mean_token_accuracy": 0.7693363547325134, + "num_tokens": 39612377.0, + "step": 11650 + }, + { + "epoch": 0.11702597454735236, + "learning_rate": 0.00017659681239712557, + "loss": 0.7723, + "mean_token_accuracy": 0.7707055330276489, + "num_tokens": 39646664.0, + "step": 11660 + }, + { + "epoch": 0.11712633987715283, + "learning_rate": 0.00017657673933116545, + "loss": 0.7642, + "mean_token_accuracy": 0.7722592294216156, + "num_tokens": 39680694.0, + "step": 11670 + }, + { + "epoch": 0.11722670520695332, + "learning_rate": 0.00017655666626520536, + "loss": 0.7999, + "mean_token_accuracy": 0.7656277120113373, + "num_tokens": 39715597.0, + "step": 11680 + }, + { + "epoch": 0.11732707053675379, + "learning_rate": 0.00017653659319924526, + "loss": 0.7726, + "mean_token_accuracy": 0.7747666537761688, + "num_tokens": 39750466.0, + "step": 11690 + }, + { + "epoch": 0.11742743586655426, + "learning_rate": 0.00017651652013328517, + "loss": 0.8171, + "mean_token_accuracy": 0.76343132853508, + "num_tokens": 39784127.0, + "step": 11700 + }, + { + "epoch": 0.11752780119635473, + "learning_rate": 0.00017649644706732505, + "loss": 0.7874, + "mean_token_accuracy": 0.7643001914024353, + "num_tokens": 39818279.0, + "step": 11710 + }, + { + "epoch": 0.11762816652615521, + "learning_rate": 0.000176476374001365, + "loss": 0.8281, + "mean_token_accuracy": 0.764520788192749, + "num_tokens": 39852065.0, + "step": 11720 + }, + { + "epoch": 0.11772853185595568, + "learning_rate": 0.00017645630093540487, + "loss": 0.7999, + "mean_token_accuracy": 0.7661543011665344, + "num_tokens": 39886218.0, + "step": 11730 + }, + { + "epoch": 0.11782889718575615, + "learning_rate": 0.00017643622786944478, + "loss": 0.7623, + "mean_token_accuracy": 0.7742419481277466, + "num_tokens": 39919453.0, + "step": 11740 + }, + { + "epoch": 0.11792926251555663, + "learning_rate": 0.00017641615480348471, + "loss": 0.7836, + "mean_token_accuracy": 0.7672594904899597, + "num_tokens": 39954125.0, + "step": 11750 + }, + { + "epoch": 0.1180296278453571, + "learning_rate": 0.0001763960817375246, + "loss": 0.7726, + "mean_token_accuracy": 0.7788445174694061, + "num_tokens": 39988348.0, + "step": 11760 + }, + { + "epoch": 0.11812999317515757, + "learning_rate": 0.0001763760086715645, + "loss": 0.8272, + "mean_token_accuracy": 0.7619171619415284, + "num_tokens": 40022296.0, + "step": 11770 + }, + { + "epoch": 0.11823035850495804, + "learning_rate": 0.0001763559356056044, + "loss": 0.7774, + "mean_token_accuracy": 0.7701909244060516, + "num_tokens": 40055180.0, + "step": 11780 + }, + { + "epoch": 0.11833072383475852, + "learning_rate": 0.00017633586253964432, + "loss": 0.7398, + "mean_token_accuracy": 0.7765741109848022, + "num_tokens": 40089322.0, + "step": 11790 + }, + { + "epoch": 0.118431089164559, + "learning_rate": 0.0001763157894736842, + "loss": 0.7684, + "mean_token_accuracy": 0.776421868801117, + "num_tokens": 40123226.0, + "step": 11800 + }, + { + "epoch": 0.11853145449435946, + "learning_rate": 0.00017629571640772414, + "loss": 0.8092, + "mean_token_accuracy": 0.7604811728000641, + "num_tokens": 40156888.0, + "step": 11810 + }, + { + "epoch": 0.11863181982415995, + "learning_rate": 0.00017627564334176402, + "loss": 0.7697, + "mean_token_accuracy": 0.7683253526687622, + "num_tokens": 40190380.0, + "step": 11820 + }, + { + "epoch": 0.11873218515396042, + "learning_rate": 0.00017625557027580393, + "loss": 0.7996, + "mean_token_accuracy": 0.7628776550292968, + "num_tokens": 40224206.0, + "step": 11830 + }, + { + "epoch": 0.11883255048376089, + "learning_rate": 0.00017623549720984384, + "loss": 0.7741, + "mean_token_accuracy": 0.7673757433891296, + "num_tokens": 40257463.0, + "step": 11840 + }, + { + "epoch": 0.11893291581356136, + "learning_rate": 0.00017621542414388374, + "loss": 0.8199, + "mean_token_accuracy": 0.7614277958869934, + "num_tokens": 40290925.0, + "step": 11850 + }, + { + "epoch": 0.11903328114336184, + "learning_rate": 0.00017619535107792365, + "loss": 0.8024, + "mean_token_accuracy": 0.7650829792022705, + "num_tokens": 40324936.0, + "step": 11860 + }, + { + "epoch": 0.11913364647316231, + "learning_rate": 0.00017617527801196356, + "loss": 0.8039, + "mean_token_accuracy": 0.7632757902145386, + "num_tokens": 40358512.0, + "step": 11870 + }, + { + "epoch": 0.11923401180296278, + "learning_rate": 0.00017615520494600347, + "loss": 0.7785, + "mean_token_accuracy": 0.7703190386295319, + "num_tokens": 40391900.0, + "step": 11880 + }, + { + "epoch": 0.11933437713276326, + "learning_rate": 0.00017613513188004335, + "loss": 0.7905, + "mean_token_accuracy": 0.762644600868225, + "num_tokens": 40425909.0, + "step": 11890 + }, + { + "epoch": 0.11943474246256373, + "learning_rate": 0.0001761150588140833, + "loss": 0.7733, + "mean_token_accuracy": 0.7715180158615113, + "num_tokens": 40460001.0, + "step": 11900 + }, + { + "epoch": 0.1195351077923642, + "learning_rate": 0.00017609498574812317, + "loss": 0.764, + "mean_token_accuracy": 0.7699169874191284, + "num_tokens": 40493921.0, + "step": 11910 + }, + { + "epoch": 0.11963547312216467, + "learning_rate": 0.00017607491268216308, + "loss": 0.7863, + "mean_token_accuracy": 0.7684384703636169, + "num_tokens": 40527849.0, + "step": 11920 + }, + { + "epoch": 0.11973583845196516, + "learning_rate": 0.00017605483961620298, + "loss": 0.7991, + "mean_token_accuracy": 0.7640502333641053, + "num_tokens": 40562200.0, + "step": 11930 + }, + { + "epoch": 0.11983620378176563, + "learning_rate": 0.0001760347665502429, + "loss": 0.802, + "mean_token_accuracy": 0.7624570906162262, + "num_tokens": 40595828.0, + "step": 11940 + }, + { + "epoch": 0.1199365691115661, + "learning_rate": 0.0001760146934842828, + "loss": 0.7966, + "mean_token_accuracy": 0.7684255540370941, + "num_tokens": 40629479.0, + "step": 11950 + }, + { + "epoch": 0.12003693444136658, + "learning_rate": 0.0001759946204183227, + "loss": 0.748, + "mean_token_accuracy": 0.7810657501220704, + "num_tokens": 40663397.0, + "step": 11960 + }, + { + "epoch": 0.12013729977116705, + "learning_rate": 0.00017597454735236262, + "loss": 0.7789, + "mean_token_accuracy": 0.7606176555156707, + "num_tokens": 40697411.0, + "step": 11970 + }, + { + "epoch": 0.12023766510096752, + "learning_rate": 0.0001759544742864025, + "loss": 0.7962, + "mean_token_accuracy": 0.7685517072677612, + "num_tokens": 40731045.0, + "step": 11980 + }, + { + "epoch": 0.12033803043076799, + "learning_rate": 0.00017593440122044244, + "loss": 0.7857, + "mean_token_accuracy": 0.7689754724502563, + "num_tokens": 40764613.0, + "step": 11990 + }, + { + "epoch": 0.12043839576056847, + "learning_rate": 0.00017591432815448232, + "loss": 0.7416, + "mean_token_accuracy": 0.7737857520580291, + "num_tokens": 40798558.0, + "step": 12000 + }, + { + "epoch": 0.12053876109036894, + "learning_rate": 0.00017589425508852223, + "loss": 0.8079, + "mean_token_accuracy": 0.7625069737434387, + "num_tokens": 40832288.0, + "step": 12010 + }, + { + "epoch": 0.12063912642016941, + "learning_rate": 0.00017587418202256213, + "loss": 0.8001, + "mean_token_accuracy": 0.7698694944381714, + "num_tokens": 40866218.0, + "step": 12020 + }, + { + "epoch": 0.1207394917499699, + "learning_rate": 0.00017585410895660204, + "loss": 0.7995, + "mean_token_accuracy": 0.7681800425052643, + "num_tokens": 40900843.0, + "step": 12030 + }, + { + "epoch": 0.12083985707977037, + "learning_rate": 0.00017583403589064192, + "loss": 0.8066, + "mean_token_accuracy": 0.7637708008289337, + "num_tokens": 40934399.0, + "step": 12040 + }, + { + "epoch": 0.12094022240957084, + "learning_rate": 0.00017581396282468186, + "loss": 0.7766, + "mean_token_accuracy": 0.7660633981227875, + "num_tokens": 40968768.0, + "step": 12050 + }, + { + "epoch": 0.1210405877393713, + "learning_rate": 0.00017579388975872174, + "loss": 0.7732, + "mean_token_accuracy": 0.7718873798847199, + "num_tokens": 41002363.0, + "step": 12060 + }, + { + "epoch": 0.12114095306917179, + "learning_rate": 0.00017577381669276165, + "loss": 0.7614, + "mean_token_accuracy": 0.775162810087204, + "num_tokens": 41037020.0, + "step": 12070 + }, + { + "epoch": 0.12124131839897226, + "learning_rate": 0.00017575374362680156, + "loss": 0.831, + "mean_token_accuracy": 0.7604571998119354, + "num_tokens": 41071366.0, + "step": 12080 + }, + { + "epoch": 0.12134168372877273, + "learning_rate": 0.00017573367056084147, + "loss": 0.8195, + "mean_token_accuracy": 0.7606946229934692, + "num_tokens": 41105049.0, + "step": 12090 + }, + { + "epoch": 0.12144204905857321, + "learning_rate": 0.00017571359749488137, + "loss": 0.7906, + "mean_token_accuracy": 0.7686561584472656, + "num_tokens": 41139040.0, + "step": 12100 + }, + { + "epoch": 0.12154241438837368, + "learning_rate": 0.00017569352442892128, + "loss": 0.794, + "mean_token_accuracy": 0.7679334044456482, + "num_tokens": 41172738.0, + "step": 12110 + }, + { + "epoch": 0.12164277971817415, + "learning_rate": 0.0001756734513629612, + "loss": 0.7825, + "mean_token_accuracy": 0.7688836455345154, + "num_tokens": 41207544.0, + "step": 12120 + }, + { + "epoch": 0.12174314504797462, + "learning_rate": 0.0001756533782970011, + "loss": 0.79, + "mean_token_accuracy": 0.7671124160289764, + "num_tokens": 41241678.0, + "step": 12130 + }, + { + "epoch": 0.1218435103777751, + "learning_rate": 0.000175633305231041, + "loss": 0.786, + "mean_token_accuracy": 0.7698677480220795, + "num_tokens": 41276109.0, + "step": 12140 + }, + { + "epoch": 0.12194387570757557, + "learning_rate": 0.0001756132321650809, + "loss": 0.7705, + "mean_token_accuracy": 0.7711529910564423, + "num_tokens": 41309967.0, + "step": 12150 + }, + { + "epoch": 0.12204424103737604, + "learning_rate": 0.00017559315909912082, + "loss": 0.7946, + "mean_token_accuracy": 0.7652078151702881, + "num_tokens": 41344595.0, + "step": 12160 + }, + { + "epoch": 0.12214460636717653, + "learning_rate": 0.0001755730860331607, + "loss": 0.7935, + "mean_token_accuracy": 0.7659879446029663, + "num_tokens": 41378590.0, + "step": 12170 + }, + { + "epoch": 0.122244971696977, + "learning_rate": 0.00017555301296720061, + "loss": 0.7731, + "mean_token_accuracy": 0.770485919713974, + "num_tokens": 41412020.0, + "step": 12180 + }, + { + "epoch": 0.12234533702677747, + "learning_rate": 0.00017553293990124052, + "loss": 0.7958, + "mean_token_accuracy": 0.7665983974933624, + "num_tokens": 41446265.0, + "step": 12190 + }, + { + "epoch": 0.12244570235657794, + "learning_rate": 0.00017551286683528043, + "loss": 0.7606, + "mean_token_accuracy": 0.7740192413330078, + "num_tokens": 41479493.0, + "step": 12200 + }, + { + "epoch": 0.12254606768637842, + "learning_rate": 0.00017549279376932034, + "loss": 0.7853, + "mean_token_accuracy": 0.7652707397937775, + "num_tokens": 41513536.0, + "step": 12210 + }, + { + "epoch": 0.12264643301617889, + "learning_rate": 0.00017547272070336025, + "loss": 0.7618, + "mean_token_accuracy": 0.7741611421108245, + "num_tokens": 41547227.0, + "step": 12220 + }, + { + "epoch": 0.12274679834597936, + "learning_rate": 0.00017545264763740016, + "loss": 0.768, + "mean_token_accuracy": 0.7714941918849945, + "num_tokens": 41581441.0, + "step": 12230 + }, + { + "epoch": 0.12284716367577984, + "learning_rate": 0.00017543257457144004, + "loss": 0.7809, + "mean_token_accuracy": 0.7698556900024414, + "num_tokens": 41615059.0, + "step": 12240 + }, + { + "epoch": 0.12294752900558031, + "learning_rate": 0.00017541250150547997, + "loss": 0.7832, + "mean_token_accuracy": 0.7657558023929596, + "num_tokens": 41649299.0, + "step": 12250 + }, + { + "epoch": 0.12304789433538078, + "learning_rate": 0.00017539242843951985, + "loss": 0.7607, + "mean_token_accuracy": 0.7744082927703857, + "num_tokens": 41682483.0, + "step": 12260 + }, + { + "epoch": 0.12314825966518125, + "learning_rate": 0.00017537235537355976, + "loss": 0.808, + "mean_token_accuracy": 0.7617681801319123, + "num_tokens": 41716531.0, + "step": 12270 + }, + { + "epoch": 0.12324862499498174, + "learning_rate": 0.00017535228230759967, + "loss": 0.7707, + "mean_token_accuracy": 0.7723277449607849, + "num_tokens": 41750691.0, + "step": 12280 + }, + { + "epoch": 0.1233489903247822, + "learning_rate": 0.00017533220924163958, + "loss": 0.7608, + "mean_token_accuracy": 0.7751142323017121, + "num_tokens": 41785619.0, + "step": 12290 + }, + { + "epoch": 0.12344935565458268, + "learning_rate": 0.0001753121361756795, + "loss": 0.7678, + "mean_token_accuracy": 0.7734646201133728, + "num_tokens": 41818417.0, + "step": 12300 + }, + { + "epoch": 0.12354972098438316, + "learning_rate": 0.0001752920631097194, + "loss": 0.7596, + "mean_token_accuracy": 0.7770093083381653, + "num_tokens": 41852925.0, + "step": 12310 + }, + { + "epoch": 0.12365008631418363, + "learning_rate": 0.0001752719900437593, + "loss": 0.7708, + "mean_token_accuracy": 0.7711196780204773, + "num_tokens": 41887457.0, + "step": 12320 + }, + { + "epoch": 0.1237504516439841, + "learning_rate": 0.0001752519169777992, + "loss": 0.7318, + "mean_token_accuracy": 0.7761717677116394, + "num_tokens": 41921253.0, + "step": 12330 + }, + { + "epoch": 0.12385081697378457, + "learning_rate": 0.00017523184391183912, + "loss": 0.7849, + "mean_token_accuracy": 0.7733409106731415, + "num_tokens": 41955293.0, + "step": 12340 + }, + { + "epoch": 0.12395118230358505, + "learning_rate": 0.000175211770845879, + "loss": 0.8089, + "mean_token_accuracy": 0.761337673664093, + "num_tokens": 41989698.0, + "step": 12350 + }, + { + "epoch": 0.12405154763338552, + "learning_rate": 0.0001751916977799189, + "loss": 0.788, + "mean_token_accuracy": 0.7657052159309388, + "num_tokens": 42023229.0, + "step": 12360 + }, + { + "epoch": 0.12415191296318599, + "learning_rate": 0.00017517162471395882, + "loss": 0.7943, + "mean_token_accuracy": 0.7652049005031586, + "num_tokens": 42056794.0, + "step": 12370 + }, + { + "epoch": 0.12425227829298648, + "learning_rate": 0.00017515155164799873, + "loss": 0.7835, + "mean_token_accuracy": 0.7664673566818238, + "num_tokens": 42090348.0, + "step": 12380 + }, + { + "epoch": 0.12435264362278695, + "learning_rate": 0.0001751314785820386, + "loss": 0.7946, + "mean_token_accuracy": 0.7590865314006805, + "num_tokens": 42123920.0, + "step": 12390 + }, + { + "epoch": 0.12445300895258742, + "learning_rate": 0.00017511140551607855, + "loss": 0.7847, + "mean_token_accuracy": 0.7666195809841156, + "num_tokens": 42157663.0, + "step": 12400 + }, + { + "epoch": 0.12455337428238789, + "learning_rate": 0.00017509133245011843, + "loss": 0.7946, + "mean_token_accuracy": 0.765533983707428, + "num_tokens": 42191417.0, + "step": 12410 + }, + { + "epoch": 0.12465373961218837, + "learning_rate": 0.00017507125938415834, + "loss": 0.7981, + "mean_token_accuracy": 0.7656021595001221, + "num_tokens": 42225247.0, + "step": 12420 + }, + { + "epoch": 0.12475410494198884, + "learning_rate": 0.00017505118631819824, + "loss": 0.7686, + "mean_token_accuracy": 0.769657415151596, + "num_tokens": 42259252.0, + "step": 12430 + }, + { + "epoch": 0.12485447027178931, + "learning_rate": 0.00017503111325223815, + "loss": 0.8012, + "mean_token_accuracy": 0.7693645060062408, + "num_tokens": 42292686.0, + "step": 12440 + }, + { + "epoch": 0.12495483560158979, + "learning_rate": 0.00017501104018627806, + "loss": 0.8029, + "mean_token_accuracy": 0.7659431755542755, + "num_tokens": 42326756.0, + "step": 12450 + }, + { + "epoch": 0.12505520093139025, + "learning_rate": 0.00017499096712031797, + "loss": 0.7851, + "mean_token_accuracy": 0.767655348777771, + "num_tokens": 42360582.0, + "step": 12460 + }, + { + "epoch": 0.12515556626119073, + "learning_rate": 0.00017497089405435788, + "loss": 0.8064, + "mean_token_accuracy": 0.761356520652771, + "num_tokens": 42394863.0, + "step": 12470 + }, + { + "epoch": 0.12525593159099122, + "learning_rate": 0.00017495082098839776, + "loss": 0.7849, + "mean_token_accuracy": 0.7705150127410889, + "num_tokens": 42428642.0, + "step": 12480 + }, + { + "epoch": 0.12535629692079167, + "learning_rate": 0.0001749307479224377, + "loss": 0.7495, + "mean_token_accuracy": 0.7836252212524414, + "num_tokens": 42463108.0, + "step": 12490 + }, + { + "epoch": 0.12545666225059215, + "learning_rate": 0.00017491067485647758, + "loss": 0.7507, + "mean_token_accuracy": 0.7728869378566742, + "num_tokens": 42496448.0, + "step": 12500 + }, + { + "epoch": 0.12555702758039264, + "learning_rate": 0.00017489060179051748, + "loss": 0.76, + "mean_token_accuracy": 0.7759355187416077, + "num_tokens": 42529912.0, + "step": 12510 + }, + { + "epoch": 0.1256573929101931, + "learning_rate": 0.0001748705287245574, + "loss": 0.7994, + "mean_token_accuracy": 0.7663152515888214, + "num_tokens": 42563978.0, + "step": 12520 + }, + { + "epoch": 0.12575775823999358, + "learning_rate": 0.0001748504556585973, + "loss": 0.7565, + "mean_token_accuracy": 0.7709584891796112, + "num_tokens": 42598037.0, + "step": 12530 + }, + { + "epoch": 0.12585812356979406, + "learning_rate": 0.0001748303825926372, + "loss": 0.8008, + "mean_token_accuracy": 0.7673484742641449, + "num_tokens": 42631788.0, + "step": 12540 + }, + { + "epoch": 0.12595848889959452, + "learning_rate": 0.00017481030952667712, + "loss": 0.7768, + "mean_token_accuracy": 0.7681606829166412, + "num_tokens": 42666401.0, + "step": 12550 + }, + { + "epoch": 0.126058854229395, + "learning_rate": 0.00017479023646071703, + "loss": 0.7879, + "mean_token_accuracy": 0.7740061402320861, + "num_tokens": 42699968.0, + "step": 12560 + }, + { + "epoch": 0.12615921955919548, + "learning_rate": 0.0001747701633947569, + "loss": 0.7701, + "mean_token_accuracy": 0.7727460920810699, + "num_tokens": 42733680.0, + "step": 12570 + }, + { + "epoch": 0.12625958488899594, + "learning_rate": 0.00017475009032879684, + "loss": 0.8036, + "mean_token_accuracy": 0.7588761568069458, + "num_tokens": 42767954.0, + "step": 12580 + }, + { + "epoch": 0.12635995021879642, + "learning_rate": 0.00017473001726283672, + "loss": 0.7755, + "mean_token_accuracy": 0.7718429625034332, + "num_tokens": 42802447.0, + "step": 12590 + }, + { + "epoch": 0.12646031554859688, + "learning_rate": 0.00017470994419687663, + "loss": 0.7585, + "mean_token_accuracy": 0.7763899385929107, + "num_tokens": 42836185.0, + "step": 12600 + }, + { + "epoch": 0.12656068087839736, + "learning_rate": 0.00017468987113091654, + "loss": 0.7922, + "mean_token_accuracy": 0.7698125064373016, + "num_tokens": 42870463.0, + "step": 12610 + }, + { + "epoch": 0.12666104620819785, + "learning_rate": 0.00017466979806495645, + "loss": 0.7756, + "mean_token_accuracy": 0.7690317809581757, + "num_tokens": 42904594.0, + "step": 12620 + }, + { + "epoch": 0.1267614115379983, + "learning_rate": 0.00017464972499899633, + "loss": 0.7595, + "mean_token_accuracy": 0.7723953187465668, + "num_tokens": 42938652.0, + "step": 12630 + }, + { + "epoch": 0.1268617768677988, + "learning_rate": 0.00017462965193303627, + "loss": 0.8115, + "mean_token_accuracy": 0.7605502486228943, + "num_tokens": 42972464.0, + "step": 12640 + }, + { + "epoch": 0.12696214219759927, + "learning_rate": 0.00017460957886707618, + "loss": 0.7672, + "mean_token_accuracy": 0.7675876438617706, + "num_tokens": 43007157.0, + "step": 12650 + }, + { + "epoch": 0.12706250752739973, + "learning_rate": 0.00017458950580111606, + "loss": 0.7688, + "mean_token_accuracy": 0.770320039987564, + "num_tokens": 43040658.0, + "step": 12660 + }, + { + "epoch": 0.1271628728572002, + "learning_rate": 0.000174569432735156, + "loss": 0.7849, + "mean_token_accuracy": 0.763702666759491, + "num_tokens": 43075908.0, + "step": 12670 + }, + { + "epoch": 0.1272632381870007, + "learning_rate": 0.00017454935966919587, + "loss": 0.8181, + "mean_token_accuracy": 0.7626882672309876, + "num_tokens": 43109535.0, + "step": 12680 + }, + { + "epoch": 0.12736360351680115, + "learning_rate": 0.0001745292866032358, + "loss": 0.7753, + "mean_token_accuracy": 0.7663200795650482, + "num_tokens": 43143526.0, + "step": 12690 + }, + { + "epoch": 0.12746396884660163, + "learning_rate": 0.0001745092135372757, + "loss": 0.7728, + "mean_token_accuracy": 0.7678152918815613, + "num_tokens": 43176797.0, + "step": 12700 + }, + { + "epoch": 0.12756433417640212, + "learning_rate": 0.0001744891404713156, + "loss": 0.7946, + "mean_token_accuracy": 0.7646638870239257, + "num_tokens": 43210092.0, + "step": 12710 + }, + { + "epoch": 0.12766469950620257, + "learning_rate": 0.0001744690674053555, + "loss": 0.7792, + "mean_token_accuracy": 0.7689422249794007, + "num_tokens": 43244132.0, + "step": 12720 + }, + { + "epoch": 0.12776506483600306, + "learning_rate": 0.00017444899433939542, + "loss": 0.789, + "mean_token_accuracy": 0.7684858202934265, + "num_tokens": 43278611.0, + "step": 12730 + }, + { + "epoch": 0.1278654301658035, + "learning_rate": 0.0001744289212734353, + "loss": 0.7591, + "mean_token_accuracy": 0.7765051007270813, + "num_tokens": 43313373.0, + "step": 12740 + }, + { + "epoch": 0.127965795495604, + "learning_rate": 0.00017440884820747523, + "loss": 0.7795, + "mean_token_accuracy": 0.7724325597286225, + "num_tokens": 43347203.0, + "step": 12750 + }, + { + "epoch": 0.12806616082540448, + "learning_rate": 0.00017438877514151511, + "loss": 0.7674, + "mean_token_accuracy": 0.7737890899181366, + "num_tokens": 43381067.0, + "step": 12760 + }, + { + "epoch": 0.12816652615520494, + "learning_rate": 0.00017436870207555502, + "loss": 0.7716, + "mean_token_accuracy": 0.7662975430488587, + "num_tokens": 43415482.0, + "step": 12770 + }, + { + "epoch": 0.12826689148500542, + "learning_rate": 0.00017434862900959493, + "loss": 0.7805, + "mean_token_accuracy": 0.7716028571128846, + "num_tokens": 43449886.0, + "step": 12780 + }, + { + "epoch": 0.1283672568148059, + "learning_rate": 0.00017432855594363484, + "loss": 0.7626, + "mean_token_accuracy": 0.7711127996444702, + "num_tokens": 43484309.0, + "step": 12790 + }, + { + "epoch": 0.12846762214460636, + "learning_rate": 0.00017430848287767475, + "loss": 0.7954, + "mean_token_accuracy": 0.7629608392715455, + "num_tokens": 43518256.0, + "step": 12800 + }, + { + "epoch": 0.12856798747440684, + "learning_rate": 0.00017428840981171466, + "loss": 0.7683, + "mean_token_accuracy": 0.772105598449707, + "num_tokens": 43551721.0, + "step": 12810 + }, + { + "epoch": 0.12866835280420733, + "learning_rate": 0.00017426833674575456, + "loss": 0.7997, + "mean_token_accuracy": 0.7652229070663452, + "num_tokens": 43585449.0, + "step": 12820 + }, + { + "epoch": 0.12876871813400778, + "learning_rate": 0.00017424826367979445, + "loss": 0.7671, + "mean_token_accuracy": 0.7684259057044983, + "num_tokens": 43618648.0, + "step": 12830 + }, + { + "epoch": 0.12886908346380826, + "learning_rate": 0.00017422819061383438, + "loss": 0.7742, + "mean_token_accuracy": 0.7688802659511567, + "num_tokens": 43653129.0, + "step": 12840 + }, + { + "epoch": 0.12896944879360875, + "learning_rate": 0.00017420811754787426, + "loss": 0.7974, + "mean_token_accuracy": 0.7685005486011505, + "num_tokens": 43687601.0, + "step": 12850 + }, + { + "epoch": 0.1290698141234092, + "learning_rate": 0.00017418804448191417, + "loss": 0.7689, + "mean_token_accuracy": 0.7680033624172211, + "num_tokens": 43721180.0, + "step": 12860 + }, + { + "epoch": 0.1291701794532097, + "learning_rate": 0.00017416797141595408, + "loss": 0.8088, + "mean_token_accuracy": 0.7594873309135437, + "num_tokens": 43754834.0, + "step": 12870 + }, + { + "epoch": 0.12927054478301014, + "learning_rate": 0.000174147898349994, + "loss": 0.7885, + "mean_token_accuracy": 0.7675781488418579, + "num_tokens": 43788573.0, + "step": 12880 + }, + { + "epoch": 0.12937091011281063, + "learning_rate": 0.0001741278252840339, + "loss": 0.7913, + "mean_token_accuracy": 0.7689393699169159, + "num_tokens": 43823352.0, + "step": 12890 + }, + { + "epoch": 0.1294712754426111, + "learning_rate": 0.0001741077522180738, + "loss": 0.7955, + "mean_token_accuracy": 0.7641589105129242, + "num_tokens": 43857292.0, + "step": 12900 + }, + { + "epoch": 0.12957164077241157, + "learning_rate": 0.0001740876791521137, + "loss": 0.7823, + "mean_token_accuracy": 0.7730109691619873, + "num_tokens": 43892081.0, + "step": 12910 + }, + { + "epoch": 0.12967200610221205, + "learning_rate": 0.0001740676060861536, + "loss": 0.7547, + "mean_token_accuracy": 0.7731576800346375, + "num_tokens": 43925939.0, + "step": 12920 + }, + { + "epoch": 0.12977237143201253, + "learning_rate": 0.00017404753302019353, + "loss": 0.7879, + "mean_token_accuracy": 0.7724081039428711, + "num_tokens": 43959747.0, + "step": 12930 + }, + { + "epoch": 0.129872736761813, + "learning_rate": 0.0001740274599542334, + "loss": 0.7784, + "mean_token_accuracy": 0.7701088905334472, + "num_tokens": 43993034.0, + "step": 12940 + }, + { + "epoch": 0.12997310209161347, + "learning_rate": 0.00017400738688827332, + "loss": 0.7616, + "mean_token_accuracy": 0.7703144550323486, + "num_tokens": 44026791.0, + "step": 12950 + }, + { + "epoch": 0.13007346742141396, + "learning_rate": 0.00017398731382231323, + "loss": 0.7712, + "mean_token_accuracy": 0.7708591520786285, + "num_tokens": 44060490.0, + "step": 12960 + }, + { + "epoch": 0.1301738327512144, + "learning_rate": 0.00017396724075635314, + "loss": 0.7745, + "mean_token_accuracy": 0.7685743629932403, + "num_tokens": 44095062.0, + "step": 12970 + }, + { + "epoch": 0.1302741980810149, + "learning_rate": 0.00017394716769039302, + "loss": 0.792, + "mean_token_accuracy": 0.7664016485214233, + "num_tokens": 44129691.0, + "step": 12980 + }, + { + "epoch": 0.13037456341081538, + "learning_rate": 0.00017392709462443295, + "loss": 0.7776, + "mean_token_accuracy": 0.7692232489585876, + "num_tokens": 44164031.0, + "step": 12990 + }, + { + "epoch": 0.13047492874061584, + "learning_rate": 0.00017390702155847286, + "loss": 0.7897, + "mean_token_accuracy": 0.7714962363243103, + "num_tokens": 44197894.0, + "step": 13000 + }, + { + "epoch": 0.13057529407041632, + "learning_rate": 0.00017388694849251274, + "loss": 0.791, + "mean_token_accuracy": 0.7653005301952363, + "num_tokens": 44232236.0, + "step": 13010 + }, + { + "epoch": 0.13067565940021678, + "learning_rate": 0.00017386687542655268, + "loss": 0.8147, + "mean_token_accuracy": 0.7650872945785523, + "num_tokens": 44267014.0, + "step": 13020 + }, + { + "epoch": 0.13077602473001726, + "learning_rate": 0.00017384680236059256, + "loss": 0.7727, + "mean_token_accuracy": 0.7726529896259308, + "num_tokens": 44300640.0, + "step": 13030 + }, + { + "epoch": 0.13087639005981774, + "learning_rate": 0.00017382672929463247, + "loss": 0.7807, + "mean_token_accuracy": 0.7766844749450683, + "num_tokens": 44335628.0, + "step": 13040 + }, + { + "epoch": 0.1309767553896182, + "learning_rate": 0.00017380665622867238, + "loss": 0.7817, + "mean_token_accuracy": 0.7728781461715698, + "num_tokens": 44369668.0, + "step": 13050 + }, + { + "epoch": 0.13107712071941868, + "learning_rate": 0.00017378658316271229, + "loss": 0.7737, + "mean_token_accuracy": 0.7709382057189942, + "num_tokens": 44404473.0, + "step": 13060 + }, + { + "epoch": 0.13117748604921917, + "learning_rate": 0.00017376651009675217, + "loss": 0.8177, + "mean_token_accuracy": 0.7549030959606171, + "num_tokens": 44438206.0, + "step": 13070 + }, + { + "epoch": 0.13127785137901962, + "learning_rate": 0.0001737464370307921, + "loss": 0.7607, + "mean_token_accuracy": 0.7736218094825744, + "num_tokens": 44473666.0, + "step": 13080 + }, + { + "epoch": 0.1313782167088201, + "learning_rate": 0.00017372636396483198, + "loss": 0.8073, + "mean_token_accuracy": 0.766367393732071, + "num_tokens": 44507583.0, + "step": 13090 + }, + { + "epoch": 0.1314785820386206, + "learning_rate": 0.0001737062908988719, + "loss": 0.7592, + "mean_token_accuracy": 0.7713600337505341, + "num_tokens": 44540798.0, + "step": 13100 + }, + { + "epoch": 0.13157894736842105, + "learning_rate": 0.0001736862178329118, + "loss": 0.7622, + "mean_token_accuracy": 0.7700433492660522, + "num_tokens": 44574823.0, + "step": 13110 + }, + { + "epoch": 0.13167931269822153, + "learning_rate": 0.0001736661447669517, + "loss": 0.797, + "mean_token_accuracy": 0.7680361986160278, + "num_tokens": 44608377.0, + "step": 13120 + }, + { + "epoch": 0.131779678028022, + "learning_rate": 0.00017364607170099162, + "loss": 0.7792, + "mean_token_accuracy": 0.7709780335426331, + "num_tokens": 44642990.0, + "step": 13130 + }, + { + "epoch": 0.13188004335782247, + "learning_rate": 0.00017362599863503153, + "loss": 0.7647, + "mean_token_accuracy": 0.7713236749172211, + "num_tokens": 44677186.0, + "step": 13140 + }, + { + "epoch": 0.13198040868762295, + "learning_rate": 0.00017360592556907143, + "loss": 0.8078, + "mean_token_accuracy": 0.7607882797718049, + "num_tokens": 44711522.0, + "step": 13150 + }, + { + "epoch": 0.1320807740174234, + "learning_rate": 0.00017358585250311132, + "loss": 0.7737, + "mean_token_accuracy": 0.7688131511211396, + "num_tokens": 44746232.0, + "step": 13160 + }, + { + "epoch": 0.1321811393472239, + "learning_rate": 0.00017356577943715125, + "loss": 0.7885, + "mean_token_accuracy": 0.7671611368656158, + "num_tokens": 44779911.0, + "step": 13170 + }, + { + "epoch": 0.13228150467702438, + "learning_rate": 0.00017354570637119113, + "loss": 0.7855, + "mean_token_accuracy": 0.7711513102054596, + "num_tokens": 44813918.0, + "step": 13180 + }, + { + "epoch": 0.13238187000682483, + "learning_rate": 0.00017352563330523104, + "loss": 0.7996, + "mean_token_accuracy": 0.7630888521671295, + "num_tokens": 44847945.0, + "step": 13190 + }, + { + "epoch": 0.13248223533662531, + "learning_rate": 0.00017350556023927095, + "loss": 0.7831, + "mean_token_accuracy": 0.7665793359279632, + "num_tokens": 44882085.0, + "step": 13200 + }, + { + "epoch": 0.1325826006664258, + "learning_rate": 0.00017348548717331086, + "loss": 0.8153, + "mean_token_accuracy": 0.7603378415107727, + "num_tokens": 44916298.0, + "step": 13210 + }, + { + "epoch": 0.13268296599622625, + "learning_rate": 0.00017346541410735077, + "loss": 0.7559, + "mean_token_accuracy": 0.7715738892555237, + "num_tokens": 44949774.0, + "step": 13220 + }, + { + "epoch": 0.13278333132602674, + "learning_rate": 0.00017344534104139067, + "loss": 0.7429, + "mean_token_accuracy": 0.77811558842659, + "num_tokens": 44983903.0, + "step": 13230 + }, + { + "epoch": 0.13288369665582722, + "learning_rate": 0.00017342526797543058, + "loss": 0.7714, + "mean_token_accuracy": 0.7692193686962128, + "num_tokens": 45018521.0, + "step": 13240 + }, + { + "epoch": 0.13298406198562768, + "learning_rate": 0.00017340519490947046, + "loss": 0.7701, + "mean_token_accuracy": 0.770143574476242, + "num_tokens": 45052925.0, + "step": 13250 + }, + { + "epoch": 0.13308442731542816, + "learning_rate": 0.0001733851218435104, + "loss": 0.7908, + "mean_token_accuracy": 0.7723272562026977, + "num_tokens": 45086762.0, + "step": 13260 + }, + { + "epoch": 0.13318479264522864, + "learning_rate": 0.00017336504877755028, + "loss": 0.7799, + "mean_token_accuracy": 0.770423299074173, + "num_tokens": 45120480.0, + "step": 13270 + }, + { + "epoch": 0.1332851579750291, + "learning_rate": 0.00017334497571159022, + "loss": 0.792, + "mean_token_accuracy": 0.7626452445983887, + "num_tokens": 45155019.0, + "step": 13280 + }, + { + "epoch": 0.13338552330482958, + "learning_rate": 0.0001733249026456301, + "loss": 0.7716, + "mean_token_accuracy": 0.7737775027751923, + "num_tokens": 45190033.0, + "step": 13290 + }, + { + "epoch": 0.13348588863463004, + "learning_rate": 0.00017330482957967, + "loss": 0.785, + "mean_token_accuracy": 0.7683071434497833, + "num_tokens": 45223426.0, + "step": 13300 + }, + { + "epoch": 0.13358625396443052, + "learning_rate": 0.00017328475651370992, + "loss": 0.7866, + "mean_token_accuracy": 0.7668528437614441, + "num_tokens": 45256840.0, + "step": 13310 + }, + { + "epoch": 0.133686619294231, + "learning_rate": 0.00017326468344774982, + "loss": 0.8124, + "mean_token_accuracy": 0.7612246215343476, + "num_tokens": 45290629.0, + "step": 13320 + }, + { + "epoch": 0.13378698462403146, + "learning_rate": 0.0001732446103817897, + "loss": 0.8165, + "mean_token_accuracy": 0.7597314715385437, + "num_tokens": 45324283.0, + "step": 13330 + }, + { + "epoch": 0.13388734995383195, + "learning_rate": 0.00017322453731582964, + "loss": 0.7603, + "mean_token_accuracy": 0.7741209208965302, + "num_tokens": 45358674.0, + "step": 13340 + }, + { + "epoch": 0.13398771528363243, + "learning_rate": 0.00017320446424986955, + "loss": 0.7705, + "mean_token_accuracy": 0.7722501635551453, + "num_tokens": 45393358.0, + "step": 13350 + }, + { + "epoch": 0.1340880806134329, + "learning_rate": 0.00017318439118390943, + "loss": 0.8138, + "mean_token_accuracy": 0.759548419713974, + "num_tokens": 45428044.0, + "step": 13360 + }, + { + "epoch": 0.13418844594323337, + "learning_rate": 0.00017316431811794937, + "loss": 0.7779, + "mean_token_accuracy": 0.7725479602813721, + "num_tokens": 45463074.0, + "step": 13370 + }, + { + "epoch": 0.13428881127303385, + "learning_rate": 0.00017314424505198925, + "loss": 0.7742, + "mean_token_accuracy": 0.7658045768737793, + "num_tokens": 45497004.0, + "step": 13380 + }, + { + "epoch": 0.1343891766028343, + "learning_rate": 0.00017312417198602916, + "loss": 0.7651, + "mean_token_accuracy": 0.7743133664131164, + "num_tokens": 45531498.0, + "step": 13390 + }, + { + "epoch": 0.1344895419326348, + "learning_rate": 0.00017310409892006906, + "loss": 0.8109, + "mean_token_accuracy": 0.7595912873744964, + "num_tokens": 45565567.0, + "step": 13400 + }, + { + "epoch": 0.13458990726243528, + "learning_rate": 0.00017308402585410897, + "loss": 0.7704, + "mean_token_accuracy": 0.772896945476532, + "num_tokens": 45599978.0, + "step": 13410 + }, + { + "epoch": 0.13469027259223573, + "learning_rate": 0.00017306395278814885, + "loss": 0.771, + "mean_token_accuracy": 0.7661577820777893, + "num_tokens": 45633574.0, + "step": 13420 + }, + { + "epoch": 0.13479063792203622, + "learning_rate": 0.0001730438797221888, + "loss": 0.8021, + "mean_token_accuracy": 0.7706047177314759, + "num_tokens": 45667545.0, + "step": 13430 + }, + { + "epoch": 0.13489100325183667, + "learning_rate": 0.00017302380665622867, + "loss": 0.7708, + "mean_token_accuracy": 0.7734810650348664, + "num_tokens": 45701413.0, + "step": 13440 + }, + { + "epoch": 0.13499136858163716, + "learning_rate": 0.00017300373359026858, + "loss": 0.8189, + "mean_token_accuracy": 0.7598798215389252, + "num_tokens": 45735144.0, + "step": 13450 + }, + { + "epoch": 0.13509173391143764, + "learning_rate": 0.0001729836605243085, + "loss": 0.8261, + "mean_token_accuracy": 0.7524699211120606, + "num_tokens": 45768067.0, + "step": 13460 + }, + { + "epoch": 0.1351920992412381, + "learning_rate": 0.0001729635874583484, + "loss": 0.7728, + "mean_token_accuracy": 0.7695520401000977, + "num_tokens": 45802032.0, + "step": 13470 + }, + { + "epoch": 0.13529246457103858, + "learning_rate": 0.0001729435143923883, + "loss": 0.7707, + "mean_token_accuracy": 0.773700475692749, + "num_tokens": 45835979.0, + "step": 13480 + }, + { + "epoch": 0.13539282990083906, + "learning_rate": 0.0001729234413264282, + "loss": 0.7717, + "mean_token_accuracy": 0.772723913192749, + "num_tokens": 45870257.0, + "step": 13490 + }, + { + "epoch": 0.13549319523063952, + "learning_rate": 0.00017290336826046812, + "loss": 0.7493, + "mean_token_accuracy": 0.771820068359375, + "num_tokens": 45904177.0, + "step": 13500 + }, + { + "epoch": 0.13559356056044, + "learning_rate": 0.000172883295194508, + "loss": 0.7885, + "mean_token_accuracy": 0.7701919913291931, + "num_tokens": 45937497.0, + "step": 13510 + }, + { + "epoch": 0.13569392589024049, + "learning_rate": 0.00017286322212854794, + "loss": 0.7851, + "mean_token_accuracy": 0.7701319694519043, + "num_tokens": 45971675.0, + "step": 13520 + }, + { + "epoch": 0.13579429122004094, + "learning_rate": 0.00017284314906258782, + "loss": 0.7632, + "mean_token_accuracy": 0.7749830961227417, + "num_tokens": 46005934.0, + "step": 13530 + }, + { + "epoch": 0.13589465654984142, + "learning_rate": 0.00017282307599662773, + "loss": 0.7927, + "mean_token_accuracy": 0.7665489256381989, + "num_tokens": 46040017.0, + "step": 13540 + }, + { + "epoch": 0.1359950218796419, + "learning_rate": 0.00017280300293066764, + "loss": 0.7818, + "mean_token_accuracy": 0.7697871625423431, + "num_tokens": 46074303.0, + "step": 13550 + }, + { + "epoch": 0.13609538720944236, + "learning_rate": 0.00017278292986470754, + "loss": 0.7797, + "mean_token_accuracy": 0.7691508531570435, + "num_tokens": 46107970.0, + "step": 13560 + }, + { + "epoch": 0.13619575253924285, + "learning_rate": 0.00017276285679874745, + "loss": 0.7599, + "mean_token_accuracy": 0.7740316569805146, + "num_tokens": 46142060.0, + "step": 13570 + }, + { + "epoch": 0.1362961178690433, + "learning_rate": 0.00017274278373278736, + "loss": 0.7739, + "mean_token_accuracy": 0.7710063636302948, + "num_tokens": 46176680.0, + "step": 13580 + }, + { + "epoch": 0.1363964831988438, + "learning_rate": 0.00017272271066682727, + "loss": 0.7414, + "mean_token_accuracy": 0.7800506114959717, + "num_tokens": 46210560.0, + "step": 13590 + }, + { + "epoch": 0.13649684852864427, + "learning_rate": 0.00017270263760086715, + "loss": 0.7753, + "mean_token_accuracy": 0.7694782733917236, + "num_tokens": 46244876.0, + "step": 13600 + }, + { + "epoch": 0.13659721385844473, + "learning_rate": 0.0001726825645349071, + "loss": 0.8214, + "mean_token_accuracy": 0.7506749331951141, + "num_tokens": 46278744.0, + "step": 13610 + }, + { + "epoch": 0.1366975791882452, + "learning_rate": 0.00017266249146894697, + "loss": 0.7883, + "mean_token_accuracy": 0.772595876455307, + "num_tokens": 46312450.0, + "step": 13620 + }, + { + "epoch": 0.1367979445180457, + "learning_rate": 0.00017264241840298688, + "loss": 0.7715, + "mean_token_accuracy": 0.7711716651916504, + "num_tokens": 46346374.0, + "step": 13630 + }, + { + "epoch": 0.13689830984784615, + "learning_rate": 0.00017262234533702679, + "loss": 0.7385, + "mean_token_accuracy": 0.7801128923892975, + "num_tokens": 46380150.0, + "step": 13640 + }, + { + "epoch": 0.13699867517764663, + "learning_rate": 0.0001726022722710667, + "loss": 0.7758, + "mean_token_accuracy": 0.7712238490581512, + "num_tokens": 46414625.0, + "step": 13650 + }, + { + "epoch": 0.13709904050744712, + "learning_rate": 0.00017258219920510657, + "loss": 0.7841, + "mean_token_accuracy": 0.7679083704948425, + "num_tokens": 46448971.0, + "step": 13660 + }, + { + "epoch": 0.13719940583724757, + "learning_rate": 0.0001725621261391465, + "loss": 0.7807, + "mean_token_accuracy": 0.7680625975131988, + "num_tokens": 46483608.0, + "step": 13670 + }, + { + "epoch": 0.13729977116704806, + "learning_rate": 0.0001725420530731864, + "loss": 0.7679, + "mean_token_accuracy": 0.7741383075714111, + "num_tokens": 46517840.0, + "step": 13680 + }, + { + "epoch": 0.13740013649684854, + "learning_rate": 0.0001725219800072263, + "loss": 0.7813, + "mean_token_accuracy": 0.7687681138515472, + "num_tokens": 46552218.0, + "step": 13690 + }, + { + "epoch": 0.137500501826649, + "learning_rate": 0.00017250190694126624, + "loss": 0.7856, + "mean_token_accuracy": 0.7702401280403137, + "num_tokens": 46586259.0, + "step": 13700 + }, + { + "epoch": 0.13760086715644948, + "learning_rate": 0.00017248183387530612, + "loss": 0.7791, + "mean_token_accuracy": 0.7646296799182892, + "num_tokens": 46620640.0, + "step": 13710 + }, + { + "epoch": 0.13770123248624994, + "learning_rate": 0.00017246176080934603, + "loss": 0.7743, + "mean_token_accuracy": 0.7727301299571991, + "num_tokens": 46654435.0, + "step": 13720 + }, + { + "epoch": 0.13780159781605042, + "learning_rate": 0.00017244168774338593, + "loss": 0.7903, + "mean_token_accuracy": 0.7676368415355682, + "num_tokens": 46688023.0, + "step": 13730 + }, + { + "epoch": 0.1379019631458509, + "learning_rate": 0.00017242161467742584, + "loss": 0.7861, + "mean_token_accuracy": 0.7680228412151336, + "num_tokens": 46722401.0, + "step": 13740 + }, + { + "epoch": 0.13800232847565136, + "learning_rate": 0.00017240154161146572, + "loss": 0.8088, + "mean_token_accuracy": 0.7624124407768249, + "num_tokens": 46756080.0, + "step": 13750 + }, + { + "epoch": 0.13810269380545184, + "learning_rate": 0.00017238146854550566, + "loss": 0.7681, + "mean_token_accuracy": 0.7686403095722198, + "num_tokens": 46790453.0, + "step": 13760 + }, + { + "epoch": 0.13820305913525233, + "learning_rate": 0.00017236139547954554, + "loss": 0.7623, + "mean_token_accuracy": 0.7764238238334655, + "num_tokens": 46824206.0, + "step": 13770 + }, + { + "epoch": 0.13830342446505278, + "learning_rate": 0.00017234132241358545, + "loss": 0.7614, + "mean_token_accuracy": 0.7711726546287536, + "num_tokens": 46857842.0, + "step": 13780 + }, + { + "epoch": 0.13840378979485327, + "learning_rate": 0.00017232124934762536, + "loss": 0.7812, + "mean_token_accuracy": 0.769701623916626, + "num_tokens": 46891852.0, + "step": 13790 + }, + { + "epoch": 0.13850415512465375, + "learning_rate": 0.00017230117628166527, + "loss": 0.812, + "mean_token_accuracy": 0.7646488845348358, + "num_tokens": 46925378.0, + "step": 13800 + }, + { + "epoch": 0.1386045204544542, + "learning_rate": 0.00017228110321570517, + "loss": 0.7333, + "mean_token_accuracy": 0.7735948204994202, + "num_tokens": 46959647.0, + "step": 13810 + }, + { + "epoch": 0.1387048857842547, + "learning_rate": 0.00017226103014974508, + "loss": 0.7702, + "mean_token_accuracy": 0.7705456852912903, + "num_tokens": 46993300.0, + "step": 13820 + }, + { + "epoch": 0.13880525111405517, + "learning_rate": 0.000172240957083785, + "loss": 0.7841, + "mean_token_accuracy": 0.7709096789360046, + "num_tokens": 47027822.0, + "step": 13830 + }, + { + "epoch": 0.13890561644385563, + "learning_rate": 0.0001722208840178249, + "loss": 0.7351, + "mean_token_accuracy": 0.7875620603561402, + "num_tokens": 47062331.0, + "step": 13840 + }, + { + "epoch": 0.1390059817736561, + "learning_rate": 0.0001722008109518648, + "loss": 0.7799, + "mean_token_accuracy": 0.7704236924648284, + "num_tokens": 47095947.0, + "step": 13850 + }, + { + "epoch": 0.1391063471034566, + "learning_rate": 0.0001721807378859047, + "loss": 0.7928, + "mean_token_accuracy": 0.7634164929389954, + "num_tokens": 47129887.0, + "step": 13860 + }, + { + "epoch": 0.13920671243325705, + "learning_rate": 0.00017216066481994462, + "loss": 0.7675, + "mean_token_accuracy": 0.7728378593921661, + "num_tokens": 47164407.0, + "step": 13870 + }, + { + "epoch": 0.13930707776305754, + "learning_rate": 0.0001721405917539845, + "loss": 0.7953, + "mean_token_accuracy": 0.7675823390483856, + "num_tokens": 47197902.0, + "step": 13880 + }, + { + "epoch": 0.139407443092858, + "learning_rate": 0.00017212051868802441, + "loss": 0.7996, + "mean_token_accuracy": 0.7673685848712921, + "num_tokens": 47231665.0, + "step": 13890 + }, + { + "epoch": 0.13950780842265847, + "learning_rate": 0.00017210044562206432, + "loss": 0.7756, + "mean_token_accuracy": 0.765827351808548, + "num_tokens": 47265497.0, + "step": 13900 + }, + { + "epoch": 0.13960817375245896, + "learning_rate": 0.00017208037255610423, + "loss": 0.794, + "mean_token_accuracy": 0.7675317227840424, + "num_tokens": 47299717.0, + "step": 13910 + }, + { + "epoch": 0.13970853908225941, + "learning_rate": 0.00017206029949014414, + "loss": 0.7529, + "mean_token_accuracy": 0.775213748216629, + "num_tokens": 47333205.0, + "step": 13920 + }, + { + "epoch": 0.1398089044120599, + "learning_rate": 0.00017204022642418405, + "loss": 0.7833, + "mean_token_accuracy": 0.7670728325843811, + "num_tokens": 47367000.0, + "step": 13930 + }, + { + "epoch": 0.13990926974186038, + "learning_rate": 0.00017202015335822396, + "loss": 0.7525, + "mean_token_accuracy": 0.7673534214496612, + "num_tokens": 47400247.0, + "step": 13940 + }, + { + "epoch": 0.14000963507166084, + "learning_rate": 0.00017200008029226384, + "loss": 0.7609, + "mean_token_accuracy": 0.7697259187698364, + "num_tokens": 47433823.0, + "step": 13950 + }, + { + "epoch": 0.14011000040146132, + "learning_rate": 0.00017198000722630377, + "loss": 0.7617, + "mean_token_accuracy": 0.7738004982471466, + "num_tokens": 47468682.0, + "step": 13960 + }, + { + "epoch": 0.1402103657312618, + "learning_rate": 0.00017195993416034366, + "loss": 0.7536, + "mean_token_accuracy": 0.7769059181213379, + "num_tokens": 47502876.0, + "step": 13970 + }, + { + "epoch": 0.14031073106106226, + "learning_rate": 0.00017193986109438356, + "loss": 0.7609, + "mean_token_accuracy": 0.7735214591026306, + "num_tokens": 47537313.0, + "step": 13980 + }, + { + "epoch": 0.14041109639086274, + "learning_rate": 0.00017191978802842347, + "loss": 0.773, + "mean_token_accuracy": 0.7725825011730194, + "num_tokens": 47571993.0, + "step": 13990 + }, + { + "epoch": 0.14051146172066323, + "learning_rate": 0.00017189971496246338, + "loss": 0.8027, + "mean_token_accuracy": 0.7586640000343323, + "num_tokens": 47605283.0, + "step": 14000 + }, + { + "epoch": 0.14061182705046368, + "learning_rate": 0.00017187964189650326, + "loss": 0.7599, + "mean_token_accuracy": 0.7648543298244477, + "num_tokens": 47639356.0, + "step": 14010 + }, + { + "epoch": 0.14071219238026417, + "learning_rate": 0.0001718595688305432, + "loss": 0.7727, + "mean_token_accuracy": 0.7667241334915161, + "num_tokens": 47673439.0, + "step": 14020 + }, + { + "epoch": 0.14081255771006462, + "learning_rate": 0.00017183949576458308, + "loss": 0.7986, + "mean_token_accuracy": 0.7616683006286621, + "num_tokens": 47708473.0, + "step": 14030 + }, + { + "epoch": 0.1409129230398651, + "learning_rate": 0.000171819422698623, + "loss": 0.7705, + "mean_token_accuracy": 0.7730585336685181, + "num_tokens": 47742040.0, + "step": 14040 + }, + { + "epoch": 0.1410132883696656, + "learning_rate": 0.00017179934963266292, + "loss": 0.7786, + "mean_token_accuracy": 0.7654690504074096, + "num_tokens": 47776275.0, + "step": 14050 + }, + { + "epoch": 0.14111365369946605, + "learning_rate": 0.0001717792765667028, + "loss": 0.7641, + "mean_token_accuracy": 0.7734162449836731, + "num_tokens": 47810210.0, + "step": 14060 + }, + { + "epoch": 0.14121401902926653, + "learning_rate": 0.0001717592035007427, + "loss": 0.8132, + "mean_token_accuracy": 0.7598636031150818, + "num_tokens": 47844089.0, + "step": 14070 + }, + { + "epoch": 0.141314384359067, + "learning_rate": 0.00017173913043478262, + "loss": 0.8046, + "mean_token_accuracy": 0.7569852828979492, + "num_tokens": 47878100.0, + "step": 14080 + }, + { + "epoch": 0.14141474968886747, + "learning_rate": 0.00017171905736882253, + "loss": 0.7758, + "mean_token_accuracy": 0.7700919866561889, + "num_tokens": 47911663.0, + "step": 14090 + }, + { + "epoch": 0.14151511501866795, + "learning_rate": 0.0001716989843028624, + "loss": 0.7978, + "mean_token_accuracy": 0.7650790452957154, + "num_tokens": 47945287.0, + "step": 14100 + }, + { + "epoch": 0.14161548034846844, + "learning_rate": 0.00017167891123690235, + "loss": 0.7581, + "mean_token_accuracy": 0.769956111907959, + "num_tokens": 47979839.0, + "step": 14110 + }, + { + "epoch": 0.1417158456782689, + "learning_rate": 0.00017165883817094223, + "loss": 0.8178, + "mean_token_accuracy": 0.7598431885242463, + "num_tokens": 48013703.0, + "step": 14120 + }, + { + "epoch": 0.14181621100806938, + "learning_rate": 0.00017163876510498214, + "loss": 0.7827, + "mean_token_accuracy": 0.7717898309230804, + "num_tokens": 48048922.0, + "step": 14130 + }, + { + "epoch": 0.14191657633786986, + "learning_rate": 0.00017161869203902204, + "loss": 0.7783, + "mean_token_accuracy": 0.7692624986171722, + "num_tokens": 48083289.0, + "step": 14140 + }, + { + "epoch": 0.14201694166767032, + "learning_rate": 0.00017159861897306195, + "loss": 0.768, + "mean_token_accuracy": 0.7684755384922027, + "num_tokens": 48117632.0, + "step": 14150 + }, + { + "epoch": 0.1421173069974708, + "learning_rate": 0.00017157854590710186, + "loss": 0.775, + "mean_token_accuracy": 0.7717197239398956, + "num_tokens": 48151932.0, + "step": 14160 + }, + { + "epoch": 0.14221767232727126, + "learning_rate": 0.00017155847284114177, + "loss": 0.7717, + "mean_token_accuracy": 0.770142924785614, + "num_tokens": 48186237.0, + "step": 14170 + }, + { + "epoch": 0.14231803765707174, + "learning_rate": 0.00017153839977518168, + "loss": 0.7625, + "mean_token_accuracy": 0.774982887506485, + "num_tokens": 48220618.0, + "step": 14180 + }, + { + "epoch": 0.14241840298687222, + "learning_rate": 0.00017151832670922156, + "loss": 0.7561, + "mean_token_accuracy": 0.7678909063339233, + "num_tokens": 48254715.0, + "step": 14190 + }, + { + "epoch": 0.14251876831667268, + "learning_rate": 0.0001714982536432615, + "loss": 0.8216, + "mean_token_accuracy": 0.7582562386989593, + "num_tokens": 48289057.0, + "step": 14200 + }, + { + "epoch": 0.14261913364647316, + "learning_rate": 0.00017147818057730138, + "loss": 0.7678, + "mean_token_accuracy": 0.7684305965900421, + "num_tokens": 48322743.0, + "step": 14210 + }, + { + "epoch": 0.14271949897627365, + "learning_rate": 0.00017145810751134128, + "loss": 0.775, + "mean_token_accuracy": 0.7674304842948914, + "num_tokens": 48356844.0, + "step": 14220 + }, + { + "epoch": 0.1428198643060741, + "learning_rate": 0.0001714380344453812, + "loss": 0.7682, + "mean_token_accuracy": 0.7700712382793427, + "num_tokens": 48391103.0, + "step": 14230 + }, + { + "epoch": 0.14292022963587458, + "learning_rate": 0.0001714179613794211, + "loss": 0.7638, + "mean_token_accuracy": 0.7687857925891877, + "num_tokens": 48426188.0, + "step": 14240 + }, + { + "epoch": 0.14302059496567507, + "learning_rate": 0.000171397888313461, + "loss": 0.8046, + "mean_token_accuracy": 0.765725177526474, + "num_tokens": 48459984.0, + "step": 14250 + }, + { + "epoch": 0.14312096029547552, + "learning_rate": 0.00017137781524750092, + "loss": 0.7996, + "mean_token_accuracy": 0.7675525188446045, + "num_tokens": 48493797.0, + "step": 14260 + }, + { + "epoch": 0.143221325625276, + "learning_rate": 0.00017135774218154083, + "loss": 0.7695, + "mean_token_accuracy": 0.7674437403678894, + "num_tokens": 48527438.0, + "step": 14270 + }, + { + "epoch": 0.1433216909550765, + "learning_rate": 0.0001713376691155807, + "loss": 0.7818, + "mean_token_accuracy": 0.7690040349960328, + "num_tokens": 48561319.0, + "step": 14280 + }, + { + "epoch": 0.14342205628487695, + "learning_rate": 0.00017131759604962064, + "loss": 0.7419, + "mean_token_accuracy": 0.7776353180408477, + "num_tokens": 48596375.0, + "step": 14290 + }, + { + "epoch": 0.14352242161467743, + "learning_rate": 0.00017129752298366053, + "loss": 0.8173, + "mean_token_accuracy": 0.7611851871013642, + "num_tokens": 48629504.0, + "step": 14300 + }, + { + "epoch": 0.1436227869444779, + "learning_rate": 0.00017127744991770043, + "loss": 0.7744, + "mean_token_accuracy": 0.77262002825737, + "num_tokens": 48663457.0, + "step": 14310 + }, + { + "epoch": 0.14372315227427837, + "learning_rate": 0.00017125737685174034, + "loss": 0.7743, + "mean_token_accuracy": 0.7743302881717682, + "num_tokens": 48696690.0, + "step": 14320 + }, + { + "epoch": 0.14382351760407885, + "learning_rate": 0.00017123730378578025, + "loss": 0.75, + "mean_token_accuracy": 0.7791252076625824, + "num_tokens": 48730493.0, + "step": 14330 + }, + { + "epoch": 0.1439238829338793, + "learning_rate": 0.00017121723071982013, + "loss": 0.7756, + "mean_token_accuracy": 0.7683629155158996, + "num_tokens": 48764417.0, + "step": 14340 + }, + { + "epoch": 0.1440242482636798, + "learning_rate": 0.00017119715765386007, + "loss": 0.7569, + "mean_token_accuracy": 0.7765732944011688, + "num_tokens": 48798453.0, + "step": 14350 + }, + { + "epoch": 0.14412461359348028, + "learning_rate": 0.00017117708458789995, + "loss": 0.7683, + "mean_token_accuracy": 0.7712306499481201, + "num_tokens": 48832693.0, + "step": 14360 + }, + { + "epoch": 0.14422497892328073, + "learning_rate": 0.00017115701152193986, + "loss": 0.7457, + "mean_token_accuracy": 0.7717716634273529, + "num_tokens": 48866575.0, + "step": 14370 + }, + { + "epoch": 0.14432534425308122, + "learning_rate": 0.00017113693845597977, + "loss": 0.7663, + "mean_token_accuracy": 0.7678154647350312, + "num_tokens": 48901108.0, + "step": 14380 + }, + { + "epoch": 0.1444257095828817, + "learning_rate": 0.00017111686539001967, + "loss": 0.7707, + "mean_token_accuracy": 0.7703318357467651, + "num_tokens": 48934997.0, + "step": 14390 + }, + { + "epoch": 0.14452607491268216, + "learning_rate": 0.0001710967923240596, + "loss": 0.8135, + "mean_token_accuracy": 0.7601113379001617, + "num_tokens": 48968946.0, + "step": 14400 + }, + { + "epoch": 0.14462644024248264, + "learning_rate": 0.0001710767192580995, + "loss": 0.7806, + "mean_token_accuracy": 0.7674680829048157, + "num_tokens": 49002596.0, + "step": 14410 + }, + { + "epoch": 0.14472680557228312, + "learning_rate": 0.0001710566461921394, + "loss": 0.7753, + "mean_token_accuracy": 0.7743801653385163, + "num_tokens": 49037227.0, + "step": 14420 + }, + { + "epoch": 0.14482717090208358, + "learning_rate": 0.0001710365731261793, + "loss": 0.7743, + "mean_token_accuracy": 0.7689658284187317, + "num_tokens": 49071575.0, + "step": 14430 + }, + { + "epoch": 0.14492753623188406, + "learning_rate": 0.00017101650006021922, + "loss": 0.7885, + "mean_token_accuracy": 0.7673587083816529, + "num_tokens": 49105269.0, + "step": 14440 + }, + { + "epoch": 0.14502790156168452, + "learning_rate": 0.0001709964269942591, + "loss": 0.7291, + "mean_token_accuracy": 0.7780017077922821, + "num_tokens": 49139078.0, + "step": 14450 + }, + { + "epoch": 0.145128266891485, + "learning_rate": 0.00017097635392829903, + "loss": 0.7903, + "mean_token_accuracy": 0.763459712266922, + "num_tokens": 49172279.0, + "step": 14460 + }, + { + "epoch": 0.1452286322212855, + "learning_rate": 0.00017095628086233891, + "loss": 0.7744, + "mean_token_accuracy": 0.7665413856506348, + "num_tokens": 49206375.0, + "step": 14470 + }, + { + "epoch": 0.14532899755108594, + "learning_rate": 0.00017093620779637882, + "loss": 0.7583, + "mean_token_accuracy": 0.7723636865615845, + "num_tokens": 49239652.0, + "step": 14480 + }, + { + "epoch": 0.14542936288088643, + "learning_rate": 0.00017091613473041873, + "loss": 0.7851, + "mean_token_accuracy": 0.7731632351875305, + "num_tokens": 49274454.0, + "step": 14490 + }, + { + "epoch": 0.1455297282106869, + "learning_rate": 0.00017089606166445864, + "loss": 0.7677, + "mean_token_accuracy": 0.7742032051086426, + "num_tokens": 49308392.0, + "step": 14500 + }, + { + "epoch": 0.14563009354048737, + "learning_rate": 0.00017087598859849855, + "loss": 0.7791, + "mean_token_accuracy": 0.7644475340843201, + "num_tokens": 49342432.0, + "step": 14510 + }, + { + "epoch": 0.14573045887028785, + "learning_rate": 0.00017085591553253846, + "loss": 0.762, + "mean_token_accuracy": 0.7713985919952393, + "num_tokens": 49376858.0, + "step": 14520 + }, + { + "epoch": 0.14583082420008833, + "learning_rate": 0.00017083584246657836, + "loss": 0.7637, + "mean_token_accuracy": 0.7681733310222626, + "num_tokens": 49410766.0, + "step": 14530 + }, + { + "epoch": 0.1459311895298888, + "learning_rate": 0.00017081576940061825, + "loss": 0.7734, + "mean_token_accuracy": 0.7684456408023834, + "num_tokens": 49444756.0, + "step": 14540 + }, + { + "epoch": 0.14603155485968927, + "learning_rate": 0.00017079569633465818, + "loss": 0.7742, + "mean_token_accuracy": 0.7629444479942322, + "num_tokens": 49478718.0, + "step": 14550 + }, + { + "epoch": 0.14613192018948976, + "learning_rate": 0.00017077562326869806, + "loss": 0.7801, + "mean_token_accuracy": 0.7721074879169464, + "num_tokens": 49512966.0, + "step": 14560 + }, + { + "epoch": 0.1462322855192902, + "learning_rate": 0.00017075555020273797, + "loss": 0.8258, + "mean_token_accuracy": 0.7574770987033844, + "num_tokens": 49546625.0, + "step": 14570 + }, + { + "epoch": 0.1463326508490907, + "learning_rate": 0.00017073547713677788, + "loss": 0.7797, + "mean_token_accuracy": 0.7676370680332184, + "num_tokens": 49580349.0, + "step": 14580 + }, + { + "epoch": 0.14643301617889115, + "learning_rate": 0.0001707154040708178, + "loss": 0.7727, + "mean_token_accuracy": 0.7711577177047729, + "num_tokens": 49615199.0, + "step": 14590 + }, + { + "epoch": 0.14653338150869163, + "learning_rate": 0.0001706953310048577, + "loss": 0.7873, + "mean_token_accuracy": 0.7690609931945801, + "num_tokens": 49649446.0, + "step": 14600 + }, + { + "epoch": 0.14663374683849212, + "learning_rate": 0.0001706752579388976, + "loss": 0.8099, + "mean_token_accuracy": 0.7618093013763427, + "num_tokens": 49684222.0, + "step": 14610 + }, + { + "epoch": 0.14673411216829257, + "learning_rate": 0.00017065518487293751, + "loss": 0.811, + "mean_token_accuracy": 0.7617361068725585, + "num_tokens": 49718135.0, + "step": 14620 + }, + { + "epoch": 0.14683447749809306, + "learning_rate": 0.0001706351118069774, + "loss": 0.7626, + "mean_token_accuracy": 0.7758596897125244, + "num_tokens": 49751759.0, + "step": 14630 + }, + { + "epoch": 0.14693484282789354, + "learning_rate": 0.00017061503874101733, + "loss": 0.7403, + "mean_token_accuracy": 0.779796940088272, + "num_tokens": 49785188.0, + "step": 14640 + }, + { + "epoch": 0.147035208157694, + "learning_rate": 0.0001705949656750572, + "loss": 0.7291, + "mean_token_accuracy": 0.7814127624034881, + "num_tokens": 49819304.0, + "step": 14650 + }, + { + "epoch": 0.14713557348749448, + "learning_rate": 0.00017057489260909712, + "loss": 0.738, + "mean_token_accuracy": 0.781837260723114, + "num_tokens": 49853347.0, + "step": 14660 + }, + { + "epoch": 0.14723593881729496, + "learning_rate": 0.00017055481954313703, + "loss": 0.8126, + "mean_token_accuracy": 0.7659143388271332, + "num_tokens": 49887091.0, + "step": 14670 + }, + { + "epoch": 0.14733630414709542, + "learning_rate": 0.00017053474647717694, + "loss": 0.7821, + "mean_token_accuracy": 0.762554156780243, + "num_tokens": 49920807.0, + "step": 14680 + }, + { + "epoch": 0.1474366694768959, + "learning_rate": 0.00017051467341121682, + "loss": 0.7683, + "mean_token_accuracy": 0.7699177026748657, + "num_tokens": 49954757.0, + "step": 14690 + }, + { + "epoch": 0.1475370348066964, + "learning_rate": 0.00017049460034525675, + "loss": 0.8059, + "mean_token_accuracy": 0.7631576359272003, + "num_tokens": 49988778.0, + "step": 14700 + }, + { + "epoch": 0.14763740013649684, + "learning_rate": 0.00017047452727929664, + "loss": 0.7575, + "mean_token_accuracy": 0.7731440722942352, + "num_tokens": 50022660.0, + "step": 14710 + }, + { + "epoch": 0.14773776546629733, + "learning_rate": 0.00017045445421333654, + "loss": 0.7977, + "mean_token_accuracy": 0.7649730324745179, + "num_tokens": 50057313.0, + "step": 14720 + }, + { + "epoch": 0.14783813079609778, + "learning_rate": 0.00017043438114737645, + "loss": 0.7949, + "mean_token_accuracy": 0.7624725639820099, + "num_tokens": 50091866.0, + "step": 14730 + }, + { + "epoch": 0.14793849612589827, + "learning_rate": 0.00017041430808141636, + "loss": 0.7782, + "mean_token_accuracy": 0.7648936033248901, + "num_tokens": 50125834.0, + "step": 14740 + }, + { + "epoch": 0.14803886145569875, + "learning_rate": 0.00017039423501545627, + "loss": 0.7624, + "mean_token_accuracy": 0.7722070574760437, + "num_tokens": 50159601.0, + "step": 14750 + }, + { + "epoch": 0.1481392267854992, + "learning_rate": 0.00017037416194949618, + "loss": 0.7902, + "mean_token_accuracy": 0.7632073402404785, + "num_tokens": 50193854.0, + "step": 14760 + }, + { + "epoch": 0.1482395921152997, + "learning_rate": 0.00017035408888353609, + "loss": 0.7849, + "mean_token_accuracy": 0.7690035998821259, + "num_tokens": 50226519.0, + "step": 14770 + }, + { + "epoch": 0.14833995744510017, + "learning_rate": 0.00017033401581757597, + "loss": 0.786, + "mean_token_accuracy": 0.76683349609375, + "num_tokens": 50260778.0, + "step": 14780 + }, + { + "epoch": 0.14844032277490063, + "learning_rate": 0.0001703139427516159, + "loss": 0.7987, + "mean_token_accuracy": 0.7645675659179687, + "num_tokens": 50295055.0, + "step": 14790 + }, + { + "epoch": 0.1485406881047011, + "learning_rate": 0.00017029386968565578, + "loss": 0.7995, + "mean_token_accuracy": 0.7587841510772705, + "num_tokens": 50329292.0, + "step": 14800 + }, + { + "epoch": 0.1486410534345016, + "learning_rate": 0.0001702737966196957, + "loss": 0.7646, + "mean_token_accuracy": 0.7711651980876922, + "num_tokens": 50363063.0, + "step": 14810 + }, + { + "epoch": 0.14874141876430205, + "learning_rate": 0.0001702537235537356, + "loss": 0.7713, + "mean_token_accuracy": 0.7693265795707702, + "num_tokens": 50396926.0, + "step": 14820 + }, + { + "epoch": 0.14884178409410254, + "learning_rate": 0.0001702336504877755, + "loss": 0.783, + "mean_token_accuracy": 0.7658595263957977, + "num_tokens": 50431613.0, + "step": 14830 + }, + { + "epoch": 0.14894214942390302, + "learning_rate": 0.00017021357742181542, + "loss": 0.7675, + "mean_token_accuracy": 0.7688614845275878, + "num_tokens": 50465709.0, + "step": 14840 + }, + { + "epoch": 0.14904251475370348, + "learning_rate": 0.00017019350435585533, + "loss": 0.7679, + "mean_token_accuracy": 0.7678883016109467, + "num_tokens": 50499759.0, + "step": 14850 + }, + { + "epoch": 0.14914288008350396, + "learning_rate": 0.00017017343128989523, + "loss": 0.7617, + "mean_token_accuracy": 0.770219212770462, + "num_tokens": 50532901.0, + "step": 14860 + }, + { + "epoch": 0.14924324541330442, + "learning_rate": 0.00017015335822393512, + "loss": 0.7395, + "mean_token_accuracy": 0.77974174618721, + "num_tokens": 50567043.0, + "step": 14870 + }, + { + "epoch": 0.1493436107431049, + "learning_rate": 0.00017013328515797505, + "loss": 0.7909, + "mean_token_accuracy": 0.7677434682846069, + "num_tokens": 50602267.0, + "step": 14880 + }, + { + "epoch": 0.14944397607290538, + "learning_rate": 0.00017011321209201493, + "loss": 0.7597, + "mean_token_accuracy": 0.7755030393600464, + "num_tokens": 50636462.0, + "step": 14890 + }, + { + "epoch": 0.14954434140270584, + "learning_rate": 0.00017009313902605484, + "loss": 0.7802, + "mean_token_accuracy": 0.7705316066741943, + "num_tokens": 50670148.0, + "step": 14900 + }, + { + "epoch": 0.14964470673250632, + "learning_rate": 0.00017007306596009475, + "loss": 0.7737, + "mean_token_accuracy": 0.7712871432304382, + "num_tokens": 50703722.0, + "step": 14910 + }, + { + "epoch": 0.1497450720623068, + "learning_rate": 0.00017005299289413466, + "loss": 0.7586, + "mean_token_accuracy": 0.7706503093242645, + "num_tokens": 50737562.0, + "step": 14920 + }, + { + "epoch": 0.14984543739210726, + "learning_rate": 0.00017003291982817454, + "loss": 0.7456, + "mean_token_accuracy": 0.777435052394867, + "num_tokens": 50772332.0, + "step": 14930 + }, + { + "epoch": 0.14994580272190774, + "learning_rate": 0.00017001284676221448, + "loss": 0.7653, + "mean_token_accuracy": 0.7687119841575623, + "num_tokens": 50806611.0, + "step": 14940 + }, + { + "epoch": 0.15004616805170823, + "learning_rate": 0.00016999277369625438, + "loss": 0.7887, + "mean_token_accuracy": 0.7700403153896331, + "num_tokens": 50840571.0, + "step": 14950 + }, + { + "epoch": 0.15014653338150868, + "learning_rate": 0.0001699727006302943, + "loss": 0.7526, + "mean_token_accuracy": 0.7817915320396424, + "num_tokens": 50874811.0, + "step": 14960 + }, + { + "epoch": 0.15024689871130917, + "learning_rate": 0.0001699526275643342, + "loss": 0.7738, + "mean_token_accuracy": 0.768299001455307, + "num_tokens": 50908397.0, + "step": 14970 + }, + { + "epoch": 0.15034726404110965, + "learning_rate": 0.00016993255449837408, + "loss": 0.7795, + "mean_token_accuracy": 0.7687034428119659, + "num_tokens": 50942598.0, + "step": 14980 + }, + { + "epoch": 0.1504476293709101, + "learning_rate": 0.00016991248143241402, + "loss": 0.7641, + "mean_token_accuracy": 0.777588176727295, + "num_tokens": 50976321.0, + "step": 14990 + }, + { + "epoch": 0.1505479947007106, + "learning_rate": 0.0001698924083664539, + "loss": 0.7864, + "mean_token_accuracy": 0.7661957383155823, + "num_tokens": 51010290.0, + "step": 15000 + }, + { + "epoch": 0.15064836003051105, + "learning_rate": 0.0001698723353004938, + "loss": 0.8026, + "mean_token_accuracy": 0.7674146234989166, + "num_tokens": 51044490.0, + "step": 15010 + }, + { + "epoch": 0.15074872536031153, + "learning_rate": 0.00016985226223453372, + "loss": 0.7927, + "mean_token_accuracy": 0.7660162925720215, + "num_tokens": 51078398.0, + "step": 15020 + }, + { + "epoch": 0.15084909069011201, + "learning_rate": 0.00016983218916857362, + "loss": 0.7849, + "mean_token_accuracy": 0.7597988963127136, + "num_tokens": 51112212.0, + "step": 15030 + }, + { + "epoch": 0.15094945601991247, + "learning_rate": 0.0001698121161026135, + "loss": 0.7827, + "mean_token_accuracy": 0.769049596786499, + "num_tokens": 51146235.0, + "step": 15040 + }, + { + "epoch": 0.15104982134971295, + "learning_rate": 0.00016979204303665344, + "loss": 0.7729, + "mean_token_accuracy": 0.7703625738620759, + "num_tokens": 51181217.0, + "step": 15050 + }, + { + "epoch": 0.15115018667951344, + "learning_rate": 0.00016977196997069332, + "loss": 0.7501, + "mean_token_accuracy": 0.7812409579753876, + "num_tokens": 51215132.0, + "step": 15060 + }, + { + "epoch": 0.1512505520093139, + "learning_rate": 0.00016975189690473323, + "loss": 0.7898, + "mean_token_accuracy": 0.7634902775287629, + "num_tokens": 51248088.0, + "step": 15070 + }, + { + "epoch": 0.15135091733911438, + "learning_rate": 0.00016973182383877314, + "loss": 0.7961, + "mean_token_accuracy": 0.765084159374237, + "num_tokens": 51282063.0, + "step": 15080 + }, + { + "epoch": 0.15145128266891486, + "learning_rate": 0.00016971175077281305, + "loss": 0.7772, + "mean_token_accuracy": 0.7728128671646118, + "num_tokens": 51315751.0, + "step": 15090 + }, + { + "epoch": 0.15155164799871532, + "learning_rate": 0.00016969167770685296, + "loss": 0.7762, + "mean_token_accuracy": 0.7731463789939881, + "num_tokens": 51350886.0, + "step": 15100 + }, + { + "epoch": 0.1516520133285158, + "learning_rate": 0.00016967160464089286, + "loss": 0.8285, + "mean_token_accuracy": 0.7553871512413025, + "num_tokens": 51385104.0, + "step": 15110 + }, + { + "epoch": 0.15175237865831628, + "learning_rate": 0.00016965153157493277, + "loss": 0.7773, + "mean_token_accuracy": 0.7678468465805054, + "num_tokens": 51418921.0, + "step": 15120 + }, + { + "epoch": 0.15185274398811674, + "learning_rate": 0.00016963145850897265, + "loss": 0.7839, + "mean_token_accuracy": 0.766031664609909, + "num_tokens": 51453508.0, + "step": 15130 + }, + { + "epoch": 0.15195310931791722, + "learning_rate": 0.0001696113854430126, + "loss": 0.7815, + "mean_token_accuracy": 0.7636368274688721, + "num_tokens": 51487504.0, + "step": 15140 + }, + { + "epoch": 0.15205347464771768, + "learning_rate": 0.00016959131237705247, + "loss": 0.7573, + "mean_token_accuracy": 0.7721414029598236, + "num_tokens": 51521862.0, + "step": 15150 + }, + { + "epoch": 0.15215383997751816, + "learning_rate": 0.00016957123931109238, + "loss": 0.7863, + "mean_token_accuracy": 0.7631633579730988, + "num_tokens": 51555799.0, + "step": 15160 + }, + { + "epoch": 0.15225420530731865, + "learning_rate": 0.0001695511662451323, + "loss": 0.7799, + "mean_token_accuracy": 0.7730798959732056, + "num_tokens": 51589540.0, + "step": 15170 + }, + { + "epoch": 0.1523545706371191, + "learning_rate": 0.0001695310931791722, + "loss": 0.7733, + "mean_token_accuracy": 0.770631343126297, + "num_tokens": 51622986.0, + "step": 15180 + }, + { + "epoch": 0.15245493596691959, + "learning_rate": 0.0001695110201132121, + "loss": 0.7931, + "mean_token_accuracy": 0.7658929049968719, + "num_tokens": 51657488.0, + "step": 15190 + }, + { + "epoch": 0.15255530129672007, + "learning_rate": 0.000169490947047252, + "loss": 0.7684, + "mean_token_accuracy": 0.7691733777523041, + "num_tokens": 51691318.0, + "step": 15200 + }, + { + "epoch": 0.15265566662652053, + "learning_rate": 0.00016947087398129192, + "loss": 0.7829, + "mean_token_accuracy": 0.7676796436309814, + "num_tokens": 51725571.0, + "step": 15210 + }, + { + "epoch": 0.152756031956321, + "learning_rate": 0.0001694508009153318, + "loss": 0.7736, + "mean_token_accuracy": 0.7698560178279876, + "num_tokens": 51760144.0, + "step": 15220 + }, + { + "epoch": 0.1528563972861215, + "learning_rate": 0.00016943072784937174, + "loss": 0.776, + "mean_token_accuracy": 0.7702752113342285, + "num_tokens": 51794828.0, + "step": 15230 + }, + { + "epoch": 0.15295676261592195, + "learning_rate": 0.00016941065478341162, + "loss": 0.7994, + "mean_token_accuracy": 0.7647412180900574, + "num_tokens": 51829991.0, + "step": 15240 + }, + { + "epoch": 0.15305712794572243, + "learning_rate": 0.00016939058171745153, + "loss": 0.8329, + "mean_token_accuracy": 0.7600164353847504, + "num_tokens": 51863756.0, + "step": 15250 + }, + { + "epoch": 0.15315749327552292, + "learning_rate": 0.00016937050865149144, + "loss": 0.7648, + "mean_token_accuracy": 0.7694015741348267, + "num_tokens": 51897795.0, + "step": 15260 + }, + { + "epoch": 0.15325785860532337, + "learning_rate": 0.00016935043558553135, + "loss": 0.7942, + "mean_token_accuracy": 0.7628164887428284, + "num_tokens": 51932470.0, + "step": 15270 + }, + { + "epoch": 0.15335822393512386, + "learning_rate": 0.00016933036251957123, + "loss": 0.7672, + "mean_token_accuracy": 0.7684712946414948, + "num_tokens": 51966083.0, + "step": 15280 + }, + { + "epoch": 0.1534585892649243, + "learning_rate": 0.00016931028945361116, + "loss": 0.7717, + "mean_token_accuracy": 0.7693732619285584, + "num_tokens": 52000227.0, + "step": 15290 + }, + { + "epoch": 0.1535589545947248, + "learning_rate": 0.00016929021638765107, + "loss": 0.7447, + "mean_token_accuracy": 0.7782359421253204, + "num_tokens": 52034381.0, + "step": 15300 + }, + { + "epoch": 0.15365931992452528, + "learning_rate": 0.00016927014332169095, + "loss": 0.7443, + "mean_token_accuracy": 0.7774894177913666, + "num_tokens": 52068730.0, + "step": 15310 + }, + { + "epoch": 0.15375968525432573, + "learning_rate": 0.0001692500702557309, + "loss": 0.7818, + "mean_token_accuracy": 0.7613789796829223, + "num_tokens": 52102583.0, + "step": 15320 + }, + { + "epoch": 0.15386005058412622, + "learning_rate": 0.00016922999718977077, + "loss": 0.7464, + "mean_token_accuracy": 0.7733263611793518, + "num_tokens": 52136611.0, + "step": 15330 + }, + { + "epoch": 0.1539604159139267, + "learning_rate": 0.00016920992412381068, + "loss": 0.8141, + "mean_token_accuracy": 0.7589938104152679, + "num_tokens": 52170087.0, + "step": 15340 + }, + { + "epoch": 0.15406078124372716, + "learning_rate": 0.00016918985105785059, + "loss": 0.7711, + "mean_token_accuracy": 0.7660266518592834, + "num_tokens": 52203630.0, + "step": 15350 + }, + { + "epoch": 0.15416114657352764, + "learning_rate": 0.0001691697779918905, + "loss": 0.7854, + "mean_token_accuracy": 0.767578762769699, + "num_tokens": 52237519.0, + "step": 15360 + }, + { + "epoch": 0.15426151190332812, + "learning_rate": 0.00016914970492593038, + "loss": 0.8112, + "mean_token_accuracy": 0.763132518529892, + "num_tokens": 52272011.0, + "step": 15370 + }, + { + "epoch": 0.15436187723312858, + "learning_rate": 0.0001691296318599703, + "loss": 0.7733, + "mean_token_accuracy": 0.7657889425754547, + "num_tokens": 52305881.0, + "step": 15380 + }, + { + "epoch": 0.15446224256292906, + "learning_rate": 0.0001691095587940102, + "loss": 0.7674, + "mean_token_accuracy": 0.7740002870559692, + "num_tokens": 52340078.0, + "step": 15390 + }, + { + "epoch": 0.15456260789272955, + "learning_rate": 0.0001690894857280501, + "loss": 0.7815, + "mean_token_accuracy": 0.7709534764289856, + "num_tokens": 52373189.0, + "step": 15400 + }, + { + "epoch": 0.15466297322253, + "learning_rate": 0.00016906941266209, + "loss": 0.7778, + "mean_token_accuracy": 0.770790982246399, + "num_tokens": 52407317.0, + "step": 15410 + }, + { + "epoch": 0.1547633385523305, + "learning_rate": 0.00016904933959612992, + "loss": 0.7848, + "mean_token_accuracy": 0.7632052719593048, + "num_tokens": 52441594.0, + "step": 15420 + }, + { + "epoch": 0.15486370388213094, + "learning_rate": 0.00016902926653016983, + "loss": 0.7897, + "mean_token_accuracy": 0.7655413448810577, + "num_tokens": 52476312.0, + "step": 15430 + }, + { + "epoch": 0.15496406921193143, + "learning_rate": 0.00016900919346420973, + "loss": 0.799, + "mean_token_accuracy": 0.7574868977069855, + "num_tokens": 52509946.0, + "step": 15440 + }, + { + "epoch": 0.1550644345417319, + "learning_rate": 0.00016898912039824964, + "loss": 0.7716, + "mean_token_accuracy": 0.7688789784908294, + "num_tokens": 52543677.0, + "step": 15450 + }, + { + "epoch": 0.15516479987153237, + "learning_rate": 0.00016896904733228952, + "loss": 0.783, + "mean_token_accuracy": 0.7685745835304261, + "num_tokens": 52578088.0, + "step": 15460 + }, + { + "epoch": 0.15526516520133285, + "learning_rate": 0.00016894897426632946, + "loss": 0.7759, + "mean_token_accuracy": 0.7655752122402191, + "num_tokens": 52611959.0, + "step": 15470 + }, + { + "epoch": 0.15536553053113333, + "learning_rate": 0.00016892890120036934, + "loss": 0.7806, + "mean_token_accuracy": 0.770868468284607, + "num_tokens": 52647202.0, + "step": 15480 + }, + { + "epoch": 0.1554658958609338, + "learning_rate": 0.00016890882813440925, + "loss": 0.7804, + "mean_token_accuracy": 0.7744951903820038, + "num_tokens": 52680968.0, + "step": 15490 + }, + { + "epoch": 0.15556626119073427, + "learning_rate": 0.00016888875506844916, + "loss": 0.754, + "mean_token_accuracy": 0.7730810880661011, + "num_tokens": 52715308.0, + "step": 15500 + }, + { + "epoch": 0.15566662652053476, + "learning_rate": 0.00016886868200248907, + "loss": 0.7843, + "mean_token_accuracy": 0.7653223693370819, + "num_tokens": 52749798.0, + "step": 15510 + }, + { + "epoch": 0.1557669918503352, + "learning_rate": 0.00016884860893652897, + "loss": 0.7951, + "mean_token_accuracy": 0.7614391505718231, + "num_tokens": 52782918.0, + "step": 15520 + }, + { + "epoch": 0.1558673571801357, + "learning_rate": 0.00016882853587056888, + "loss": 0.7665, + "mean_token_accuracy": 0.7676415383815766, + "num_tokens": 52816974.0, + "step": 15530 + }, + { + "epoch": 0.15596772250993618, + "learning_rate": 0.0001688084628046088, + "loss": 0.7866, + "mean_token_accuracy": 0.7668696820735932, + "num_tokens": 52851162.0, + "step": 15540 + }, + { + "epoch": 0.15606808783973664, + "learning_rate": 0.0001687883897386487, + "loss": 0.7694, + "mean_token_accuracy": 0.7691082119941711, + "num_tokens": 52884720.0, + "step": 15550 + }, + { + "epoch": 0.15616845316953712, + "learning_rate": 0.0001687683166726886, + "loss": 0.7733, + "mean_token_accuracy": 0.7732429683208466, + "num_tokens": 52917938.0, + "step": 15560 + }, + { + "epoch": 0.15626881849933758, + "learning_rate": 0.0001687482436067285, + "loss": 0.792, + "mean_token_accuracy": 0.7621237814426423, + "num_tokens": 52951666.0, + "step": 15570 + }, + { + "epoch": 0.15636918382913806, + "learning_rate": 0.00016872817054076843, + "loss": 0.7439, + "mean_token_accuracy": 0.7802545189857483, + "num_tokens": 52987559.0, + "step": 15580 + }, + { + "epoch": 0.15646954915893854, + "learning_rate": 0.0001687080974748083, + "loss": 0.7681, + "mean_token_accuracy": 0.7657202303409576, + "num_tokens": 53021331.0, + "step": 15590 + }, + { + "epoch": 0.156569914488739, + "learning_rate": 0.00016868802440884822, + "loss": 0.7732, + "mean_token_accuracy": 0.7699995994567871, + "num_tokens": 53055735.0, + "step": 15600 + }, + { + "epoch": 0.15667027981853948, + "learning_rate": 0.00016866795134288812, + "loss": 0.7566, + "mean_token_accuracy": 0.7705514073371887, + "num_tokens": 53089781.0, + "step": 15610 + }, + { + "epoch": 0.15677064514833997, + "learning_rate": 0.00016864787827692803, + "loss": 0.7681, + "mean_token_accuracy": 0.7708892226219177, + "num_tokens": 53123529.0, + "step": 15620 + }, + { + "epoch": 0.15687101047814042, + "learning_rate": 0.0001686278052109679, + "loss": 0.7513, + "mean_token_accuracy": 0.7754028618335724, + "num_tokens": 53157103.0, + "step": 15630 + }, + { + "epoch": 0.1569713758079409, + "learning_rate": 0.00016860773214500785, + "loss": 0.7515, + "mean_token_accuracy": 0.7748264670372009, + "num_tokens": 53191522.0, + "step": 15640 + }, + { + "epoch": 0.1570717411377414, + "learning_rate": 0.00016858765907904776, + "loss": 0.7506, + "mean_token_accuracy": 0.7732868671417237, + "num_tokens": 53224757.0, + "step": 15650 + }, + { + "epoch": 0.15717210646754184, + "learning_rate": 0.00016856758601308764, + "loss": 0.7498, + "mean_token_accuracy": 0.7753817021846772, + "num_tokens": 53258888.0, + "step": 15660 + }, + { + "epoch": 0.15727247179734233, + "learning_rate": 0.00016854751294712757, + "loss": 0.772, + "mean_token_accuracy": 0.7627705037593842, + "num_tokens": 53292080.0, + "step": 15670 + }, + { + "epoch": 0.1573728371271428, + "learning_rate": 0.00016852743988116746, + "loss": 0.7709, + "mean_token_accuracy": 0.7693831861019135, + "num_tokens": 53326293.0, + "step": 15680 + }, + { + "epoch": 0.15747320245694327, + "learning_rate": 0.00016850736681520736, + "loss": 0.7779, + "mean_token_accuracy": 0.7701425313949585, + "num_tokens": 53360079.0, + "step": 15690 + }, + { + "epoch": 0.15757356778674375, + "learning_rate": 0.00016848729374924727, + "loss": 0.766, + "mean_token_accuracy": 0.7696471452713013, + "num_tokens": 53394078.0, + "step": 15700 + }, + { + "epoch": 0.15767393311654423, + "learning_rate": 0.00016846722068328718, + "loss": 0.7701, + "mean_token_accuracy": 0.7699676394462586, + "num_tokens": 53428344.0, + "step": 15710 + }, + { + "epoch": 0.1577742984463447, + "learning_rate": 0.00016844714761732706, + "loss": 0.7798, + "mean_token_accuracy": 0.7695291221141816, + "num_tokens": 53461912.0, + "step": 15720 + }, + { + "epoch": 0.15787466377614517, + "learning_rate": 0.000168427074551367, + "loss": 0.8069, + "mean_token_accuracy": 0.7636789500713348, + "num_tokens": 53496403.0, + "step": 15730 + }, + { + "epoch": 0.15797502910594563, + "learning_rate": 0.00016840700148540688, + "loss": 0.7939, + "mean_token_accuracy": 0.7635593891143799, + "num_tokens": 53529907.0, + "step": 15740 + }, + { + "epoch": 0.1580753944357461, + "learning_rate": 0.0001683869284194468, + "loss": 0.7699, + "mean_token_accuracy": 0.7722089886665344, + "num_tokens": 53563525.0, + "step": 15750 + }, + { + "epoch": 0.1581757597655466, + "learning_rate": 0.0001683668553534867, + "loss": 0.7598, + "mean_token_accuracy": 0.7795711100101471, + "num_tokens": 53597740.0, + "step": 15760 + }, + { + "epoch": 0.15827612509534705, + "learning_rate": 0.0001683467822875266, + "loss": 0.7893, + "mean_token_accuracy": 0.7689566075801849, + "num_tokens": 53632244.0, + "step": 15770 + }, + { + "epoch": 0.15837649042514754, + "learning_rate": 0.0001683267092215665, + "loss": 0.7622, + "mean_token_accuracy": 0.7705060064792633, + "num_tokens": 53666099.0, + "step": 15780 + }, + { + "epoch": 0.15847685575494802, + "learning_rate": 0.00016830663615560642, + "loss": 0.7891, + "mean_token_accuracy": 0.7639210462570191, + "num_tokens": 53700311.0, + "step": 15790 + }, + { + "epoch": 0.15857722108474848, + "learning_rate": 0.00016828656308964633, + "loss": 0.7711, + "mean_token_accuracy": 0.7662554621696472, + "num_tokens": 53734915.0, + "step": 15800 + }, + { + "epoch": 0.15867758641454896, + "learning_rate": 0.0001682664900236862, + "loss": 0.7607, + "mean_token_accuracy": 0.7745907962322235, + "num_tokens": 53769792.0, + "step": 15810 + }, + { + "epoch": 0.15877795174434944, + "learning_rate": 0.00016824641695772615, + "loss": 0.7489, + "mean_token_accuracy": 0.7763136684894562, + "num_tokens": 53803658.0, + "step": 15820 + }, + { + "epoch": 0.1588783170741499, + "learning_rate": 0.00016822634389176603, + "loss": 0.7964, + "mean_token_accuracy": 0.7618490397930145, + "num_tokens": 53837440.0, + "step": 15830 + }, + { + "epoch": 0.15897868240395038, + "learning_rate": 0.00016820627082580594, + "loss": 0.7768, + "mean_token_accuracy": 0.7668090462684631, + "num_tokens": 53871063.0, + "step": 15840 + }, + { + "epoch": 0.15907904773375087, + "learning_rate": 0.00016818619775984584, + "loss": 0.7634, + "mean_token_accuracy": 0.7736083090305328, + "num_tokens": 53905460.0, + "step": 15850 + }, + { + "epoch": 0.15917941306355132, + "learning_rate": 0.00016816612469388575, + "loss": 0.7549, + "mean_token_accuracy": 0.7736191630363465, + "num_tokens": 53939217.0, + "step": 15860 + }, + { + "epoch": 0.1592797783933518, + "learning_rate": 0.00016814605162792566, + "loss": 0.7334, + "mean_token_accuracy": 0.7773832976818085, + "num_tokens": 53972404.0, + "step": 15870 + }, + { + "epoch": 0.15938014372315226, + "learning_rate": 0.00016812597856196557, + "loss": 0.8131, + "mean_token_accuracy": 0.7607673048973084, + "num_tokens": 54007085.0, + "step": 15880 + }, + { + "epoch": 0.15948050905295275, + "learning_rate": 0.00016810590549600548, + "loss": 0.7581, + "mean_token_accuracy": 0.7750826418399811, + "num_tokens": 54040901.0, + "step": 15890 + }, + { + "epoch": 0.15958087438275323, + "learning_rate": 0.00016808583243004536, + "loss": 0.7775, + "mean_token_accuracy": 0.7645307302474975, + "num_tokens": 54075068.0, + "step": 15900 + }, + { + "epoch": 0.15968123971255369, + "learning_rate": 0.0001680657593640853, + "loss": 0.7823, + "mean_token_accuracy": 0.7664214968681335, + "num_tokens": 54108768.0, + "step": 15910 + }, + { + "epoch": 0.15978160504235417, + "learning_rate": 0.00016804568629812518, + "loss": 0.7731, + "mean_token_accuracy": 0.7718466520309448, + "num_tokens": 54142779.0, + "step": 15920 + }, + { + "epoch": 0.15988197037215465, + "learning_rate": 0.00016802561323216508, + "loss": 0.7995, + "mean_token_accuracy": 0.7627302944660187, + "num_tokens": 54176709.0, + "step": 15930 + }, + { + "epoch": 0.1599823357019551, + "learning_rate": 0.000168005540166205, + "loss": 0.7952, + "mean_token_accuracy": 0.7675760447978973, + "num_tokens": 54211077.0, + "step": 15940 + }, + { + "epoch": 0.1600827010317556, + "learning_rate": 0.0001679854671002449, + "loss": 0.7905, + "mean_token_accuracy": 0.7670733034610748, + "num_tokens": 54245642.0, + "step": 15950 + }, + { + "epoch": 0.16018306636155608, + "learning_rate": 0.00016796539403428478, + "loss": 0.7676, + "mean_token_accuracy": 0.773389321565628, + "num_tokens": 54280193.0, + "step": 15960 + }, + { + "epoch": 0.16028343169135653, + "learning_rate": 0.00016794532096832472, + "loss": 0.7797, + "mean_token_accuracy": 0.7719764292240143, + "num_tokens": 54314135.0, + "step": 15970 + }, + { + "epoch": 0.16038379702115702, + "learning_rate": 0.0001679252479023646, + "loss": 0.7562, + "mean_token_accuracy": 0.780254477262497, + "num_tokens": 54347415.0, + "step": 15980 + }, + { + "epoch": 0.1604841623509575, + "learning_rate": 0.0001679051748364045, + "loss": 0.7524, + "mean_token_accuracy": 0.7712141573429108, + "num_tokens": 54382058.0, + "step": 15990 + }, + { + "epoch": 0.16058452768075795, + "learning_rate": 0.00016788510177044444, + "loss": 0.7944, + "mean_token_accuracy": 0.7686404109001159, + "num_tokens": 54416790.0, + "step": 16000 + }, + { + "epoch": 0.16068489301055844, + "learning_rate": 0.00016786502870448433, + "loss": 0.7819, + "mean_token_accuracy": 0.7646767497062683, + "num_tokens": 54451156.0, + "step": 16010 + }, + { + "epoch": 0.1607852583403589, + "learning_rate": 0.00016784495563852423, + "loss": 0.7854, + "mean_token_accuracy": 0.7703452050685883, + "num_tokens": 54485109.0, + "step": 16020 + }, + { + "epoch": 0.16088562367015938, + "learning_rate": 0.00016782488257256414, + "loss": 0.7607, + "mean_token_accuracy": 0.7728536605834961, + "num_tokens": 54519121.0, + "step": 16030 + }, + { + "epoch": 0.16098598899995986, + "learning_rate": 0.00016780480950660405, + "loss": 0.7745, + "mean_token_accuracy": 0.7680536806583405, + "num_tokens": 54552312.0, + "step": 16040 + }, + { + "epoch": 0.16108635432976032, + "learning_rate": 0.00016778473644064393, + "loss": 0.7939, + "mean_token_accuracy": 0.763797128200531, + "num_tokens": 54585602.0, + "step": 16050 + }, + { + "epoch": 0.1611867196595608, + "learning_rate": 0.00016776466337468387, + "loss": 0.7831, + "mean_token_accuracy": 0.7706405282020569, + "num_tokens": 54620257.0, + "step": 16060 + }, + { + "epoch": 0.16128708498936128, + "learning_rate": 0.00016774459030872375, + "loss": 0.8012, + "mean_token_accuracy": 0.7677317500114441, + "num_tokens": 54654400.0, + "step": 16070 + }, + { + "epoch": 0.16138745031916174, + "learning_rate": 0.00016772451724276366, + "loss": 0.7663, + "mean_token_accuracy": 0.7740169882774353, + "num_tokens": 54689429.0, + "step": 16080 + }, + { + "epoch": 0.16148781564896222, + "learning_rate": 0.00016770444417680357, + "loss": 0.762, + "mean_token_accuracy": 0.7705418944358826, + "num_tokens": 54723355.0, + "step": 16090 + }, + { + "epoch": 0.1615881809787627, + "learning_rate": 0.00016768437111084347, + "loss": 0.7956, + "mean_token_accuracy": 0.7653626322746276, + "num_tokens": 54757516.0, + "step": 16100 + }, + { + "epoch": 0.16168854630856316, + "learning_rate": 0.00016766429804488338, + "loss": 0.7442, + "mean_token_accuracy": 0.7787913143634796, + "num_tokens": 54791568.0, + "step": 16110 + }, + { + "epoch": 0.16178891163836365, + "learning_rate": 0.0001676442249789233, + "loss": 0.7666, + "mean_token_accuracy": 0.7725750982761384, + "num_tokens": 54825658.0, + "step": 16120 + }, + { + "epoch": 0.16188927696816413, + "learning_rate": 0.0001676241519129632, + "loss": 0.7641, + "mean_token_accuracy": 0.7700630605220795, + "num_tokens": 54859192.0, + "step": 16130 + }, + { + "epoch": 0.1619896422979646, + "learning_rate": 0.0001676040788470031, + "loss": 0.7685, + "mean_token_accuracy": 0.7750592708587647, + "num_tokens": 54893175.0, + "step": 16140 + }, + { + "epoch": 0.16209000762776507, + "learning_rate": 0.00016758400578104302, + "loss": 0.7562, + "mean_token_accuracy": 0.7745824337005616, + "num_tokens": 54927452.0, + "step": 16150 + }, + { + "epoch": 0.16219037295756553, + "learning_rate": 0.0001675639327150829, + "loss": 0.7662, + "mean_token_accuracy": 0.7729141354560852, + "num_tokens": 54961756.0, + "step": 16160 + }, + { + "epoch": 0.162290738287366, + "learning_rate": 0.00016754385964912283, + "loss": 0.7332, + "mean_token_accuracy": 0.7856162011623382, + "num_tokens": 54995486.0, + "step": 16170 + }, + { + "epoch": 0.1623911036171665, + "learning_rate": 0.00016752378658316271, + "loss": 0.7781, + "mean_token_accuracy": 0.7697393536567688, + "num_tokens": 55029693.0, + "step": 16180 + }, + { + "epoch": 0.16249146894696695, + "learning_rate": 0.00016750371351720262, + "loss": 0.7915, + "mean_token_accuracy": 0.7663042962551116, + "num_tokens": 55063475.0, + "step": 16190 + }, + { + "epoch": 0.16259183427676743, + "learning_rate": 0.00016748364045124253, + "loss": 0.7502, + "mean_token_accuracy": 0.7753411650657653, + "num_tokens": 55097478.0, + "step": 16200 + }, + { + "epoch": 0.16269219960656792, + "learning_rate": 0.00016746356738528244, + "loss": 0.7645, + "mean_token_accuracy": 0.7713445484638214, + "num_tokens": 55131686.0, + "step": 16210 + }, + { + "epoch": 0.16279256493636837, + "learning_rate": 0.00016744349431932235, + "loss": 0.8009, + "mean_token_accuracy": 0.7626453280448914, + "num_tokens": 55165462.0, + "step": 16220 + }, + { + "epoch": 0.16289293026616886, + "learning_rate": 0.00016742342125336226, + "loss": 0.7992, + "mean_token_accuracy": 0.7661191344261169, + "num_tokens": 55199348.0, + "step": 16230 + }, + { + "epoch": 0.16299329559596934, + "learning_rate": 0.00016740334818740217, + "loss": 0.8257, + "mean_token_accuracy": 0.7612239360809326, + "num_tokens": 55233696.0, + "step": 16240 + }, + { + "epoch": 0.1630936609257698, + "learning_rate": 0.00016738327512144205, + "loss": 0.7791, + "mean_token_accuracy": 0.7717586278915405, + "num_tokens": 55267361.0, + "step": 16250 + }, + { + "epoch": 0.16319402625557028, + "learning_rate": 0.00016736320205548198, + "loss": 0.7901, + "mean_token_accuracy": 0.7668171525001526, + "num_tokens": 55301500.0, + "step": 16260 + }, + { + "epoch": 0.16329439158537076, + "learning_rate": 0.00016734312898952186, + "loss": 0.7327, + "mean_token_accuracy": 0.7806723415851593, + "num_tokens": 55336458.0, + "step": 16270 + }, + { + "epoch": 0.16339475691517122, + "learning_rate": 0.00016732305592356177, + "loss": 0.7553, + "mean_token_accuracy": 0.773836076259613, + "num_tokens": 55371171.0, + "step": 16280 + }, + { + "epoch": 0.1634951222449717, + "learning_rate": 0.00016730298285760168, + "loss": 0.7977, + "mean_token_accuracy": 0.763254064321518, + "num_tokens": 55405118.0, + "step": 16290 + }, + { + "epoch": 0.16359548757477216, + "learning_rate": 0.0001672829097916416, + "loss": 0.7896, + "mean_token_accuracy": 0.7666790723800659, + "num_tokens": 55439087.0, + "step": 16300 + }, + { + "epoch": 0.16369585290457264, + "learning_rate": 0.00016726283672568147, + "loss": 0.8011, + "mean_token_accuracy": 0.765297120809555, + "num_tokens": 55472738.0, + "step": 16310 + }, + { + "epoch": 0.16379621823437313, + "learning_rate": 0.0001672427636597214, + "loss": 0.768, + "mean_token_accuracy": 0.7692670464515686, + "num_tokens": 55507007.0, + "step": 16320 + }, + { + "epoch": 0.16389658356417358, + "learning_rate": 0.0001672226905937613, + "loss": 0.7608, + "mean_token_accuracy": 0.772177517414093, + "num_tokens": 55541368.0, + "step": 16330 + }, + { + "epoch": 0.16399694889397406, + "learning_rate": 0.0001672026175278012, + "loss": 0.7814, + "mean_token_accuracy": 0.7707577764987945, + "num_tokens": 55576173.0, + "step": 16340 + }, + { + "epoch": 0.16409731422377455, + "learning_rate": 0.00016718254446184113, + "loss": 0.7934, + "mean_token_accuracy": 0.762543672323227, + "num_tokens": 55609079.0, + "step": 16350 + }, + { + "epoch": 0.164197679553575, + "learning_rate": 0.000167162471395881, + "loss": 0.7954, + "mean_token_accuracy": 0.7651306629180908, + "num_tokens": 55642519.0, + "step": 16360 + }, + { + "epoch": 0.1642980448833755, + "learning_rate": 0.00016714239832992092, + "loss": 0.7601, + "mean_token_accuracy": 0.7750393986701966, + "num_tokens": 55676882.0, + "step": 16370 + }, + { + "epoch": 0.16439841021317597, + "learning_rate": 0.00016712232526396083, + "loss": 0.7841, + "mean_token_accuracy": 0.7707339823246002, + "num_tokens": 55711314.0, + "step": 16380 + }, + { + "epoch": 0.16449877554297643, + "learning_rate": 0.00016710225219800074, + "loss": 0.7589, + "mean_token_accuracy": 0.7756678760051727, + "num_tokens": 55745279.0, + "step": 16390 + }, + { + "epoch": 0.1645991408727769, + "learning_rate": 0.00016708217913204062, + "loss": 0.7816, + "mean_token_accuracy": 0.766136747598648, + "num_tokens": 55779482.0, + "step": 16400 + }, + { + "epoch": 0.1646995062025774, + "learning_rate": 0.00016706210606608055, + "loss": 0.7499, + "mean_token_accuracy": 0.7740479826927185, + "num_tokens": 55814137.0, + "step": 16410 + }, + { + "epoch": 0.16479987153237785, + "learning_rate": 0.00016704203300012044, + "loss": 0.8126, + "mean_token_accuracy": 0.7630363523960113, + "num_tokens": 55848446.0, + "step": 16420 + }, + { + "epoch": 0.16490023686217833, + "learning_rate": 0.00016702195993416034, + "loss": 0.7561, + "mean_token_accuracy": 0.7752853691577911, + "num_tokens": 55882891.0, + "step": 16430 + }, + { + "epoch": 0.1650006021919788, + "learning_rate": 0.00016700188686820025, + "loss": 0.7532, + "mean_token_accuracy": 0.770255833864212, + "num_tokens": 55916716.0, + "step": 16440 + }, + { + "epoch": 0.16510096752177927, + "learning_rate": 0.00016698181380224016, + "loss": 0.7616, + "mean_token_accuracy": 0.7719760477542877, + "num_tokens": 55950412.0, + "step": 16450 + }, + { + "epoch": 0.16520133285157976, + "learning_rate": 0.00016696174073628007, + "loss": 0.7513, + "mean_token_accuracy": 0.7779366493225097, + "num_tokens": 55983776.0, + "step": 16460 + }, + { + "epoch": 0.1653016981813802, + "learning_rate": 0.00016694166767031998, + "loss": 0.7733, + "mean_token_accuracy": 0.7739466309547425, + "num_tokens": 56018200.0, + "step": 16470 + }, + { + "epoch": 0.1654020635111807, + "learning_rate": 0.00016692159460435989, + "loss": 0.7446, + "mean_token_accuracy": 0.7743953824043274, + "num_tokens": 56051751.0, + "step": 16480 + }, + { + "epoch": 0.16550242884098118, + "learning_rate": 0.00016690152153839977, + "loss": 0.7719, + "mean_token_accuracy": 0.7692020237445831, + "num_tokens": 56086204.0, + "step": 16490 + }, + { + "epoch": 0.16560279417078164, + "learning_rate": 0.0001668814484724397, + "loss": 0.7817, + "mean_token_accuracy": 0.76861452460289, + "num_tokens": 56120293.0, + "step": 16500 + }, + { + "epoch": 0.16570315950058212, + "learning_rate": 0.00016686137540647958, + "loss": 0.7493, + "mean_token_accuracy": 0.771511435508728, + "num_tokens": 56153683.0, + "step": 16510 + }, + { + "epoch": 0.1658035248303826, + "learning_rate": 0.0001668413023405195, + "loss": 0.7579, + "mean_token_accuracy": 0.7763586521148682, + "num_tokens": 56187960.0, + "step": 16520 + }, + { + "epoch": 0.16590389016018306, + "learning_rate": 0.0001668212292745594, + "loss": 0.788, + "mean_token_accuracy": 0.762101536989212, + "num_tokens": 56222385.0, + "step": 16530 + }, + { + "epoch": 0.16600425548998354, + "learning_rate": 0.0001668011562085993, + "loss": 0.7642, + "mean_token_accuracy": 0.7768764853477478, + "num_tokens": 56256575.0, + "step": 16540 + }, + { + "epoch": 0.16610462081978403, + "learning_rate": 0.00016678108314263922, + "loss": 0.8119, + "mean_token_accuracy": 0.7595563709735871, + "num_tokens": 56291016.0, + "step": 16550 + }, + { + "epoch": 0.16620498614958448, + "learning_rate": 0.00016676101007667913, + "loss": 0.7523, + "mean_token_accuracy": 0.775392371416092, + "num_tokens": 56324925.0, + "step": 16560 + }, + { + "epoch": 0.16630535147938497, + "learning_rate": 0.00016674093701071904, + "loss": 0.7889, + "mean_token_accuracy": 0.7664380073547363, + "num_tokens": 56358698.0, + "step": 16570 + }, + { + "epoch": 0.16640571680918542, + "learning_rate": 0.00016672086394475892, + "loss": 0.7372, + "mean_token_accuracy": 0.7752080440521241, + "num_tokens": 56392057.0, + "step": 16580 + }, + { + "epoch": 0.1665060821389859, + "learning_rate": 0.00016670079087879885, + "loss": 0.7743, + "mean_token_accuracy": 0.7740992903709412, + "num_tokens": 56425622.0, + "step": 16590 + }, + { + "epoch": 0.1666064474687864, + "learning_rate": 0.00016668071781283873, + "loss": 0.7723, + "mean_token_accuracy": 0.7681378543376922, + "num_tokens": 56459099.0, + "step": 16600 + }, + { + "epoch": 0.16670681279858685, + "learning_rate": 0.00016666064474687864, + "loss": 0.7815, + "mean_token_accuracy": 0.7682817459106446, + "num_tokens": 56493058.0, + "step": 16610 + }, + { + "epoch": 0.16680717812838733, + "learning_rate": 0.00016664057168091855, + "loss": 0.7631, + "mean_token_accuracy": 0.7736068487167358, + "num_tokens": 56527665.0, + "step": 16620 + }, + { + "epoch": 0.1669075434581878, + "learning_rate": 0.00016662049861495846, + "loss": 0.7964, + "mean_token_accuracy": 0.7661099135875702, + "num_tokens": 56561558.0, + "step": 16630 + }, + { + "epoch": 0.16700790878798827, + "learning_rate": 0.00016660042554899834, + "loss": 0.7776, + "mean_token_accuracy": 0.7665910840034484, + "num_tokens": 56595946.0, + "step": 16640 + }, + { + "epoch": 0.16710827411778875, + "learning_rate": 0.00016658035248303828, + "loss": 0.7871, + "mean_token_accuracy": 0.7688241362571716, + "num_tokens": 56630198.0, + "step": 16650 + }, + { + "epoch": 0.16720863944758924, + "learning_rate": 0.00016656027941707816, + "loss": 0.7748, + "mean_token_accuracy": 0.773946350812912, + "num_tokens": 56664493.0, + "step": 16660 + }, + { + "epoch": 0.1673090047773897, + "learning_rate": 0.0001665402063511181, + "loss": 0.7656, + "mean_token_accuracy": 0.7693340480327606, + "num_tokens": 56698753.0, + "step": 16670 + }, + { + "epoch": 0.16740937010719018, + "learning_rate": 0.00016652013328515797, + "loss": 0.7957, + "mean_token_accuracy": 0.7672327339649201, + "num_tokens": 56732436.0, + "step": 16680 + }, + { + "epoch": 0.16750973543699066, + "learning_rate": 0.00016650006021919788, + "loss": 0.7609, + "mean_token_accuracy": 0.7741209328174591, + "num_tokens": 56767592.0, + "step": 16690 + }, + { + "epoch": 0.16761010076679111, + "learning_rate": 0.00016647998715323782, + "loss": 0.7749, + "mean_token_accuracy": 0.7696184456348419, + "num_tokens": 56801909.0, + "step": 16700 + }, + { + "epoch": 0.1677104660965916, + "learning_rate": 0.0001664599140872777, + "loss": 0.8106, + "mean_token_accuracy": 0.763665896654129, + "num_tokens": 56836591.0, + "step": 16710 + }, + { + "epoch": 0.16781083142639205, + "learning_rate": 0.0001664398410213176, + "loss": 0.7606, + "mean_token_accuracy": 0.7729604065418243, + "num_tokens": 56870841.0, + "step": 16720 + }, + { + "epoch": 0.16791119675619254, + "learning_rate": 0.00016641976795535752, + "loss": 0.7559, + "mean_token_accuracy": 0.7698002696037293, + "num_tokens": 56904225.0, + "step": 16730 + }, + { + "epoch": 0.16801156208599302, + "learning_rate": 0.00016639969488939742, + "loss": 0.7772, + "mean_token_accuracy": 0.7710990846157074, + "num_tokens": 56938018.0, + "step": 16740 + }, + { + "epoch": 0.16811192741579348, + "learning_rate": 0.0001663796218234373, + "loss": 0.7582, + "mean_token_accuracy": 0.775606769323349, + "num_tokens": 56972455.0, + "step": 16750 + }, + { + "epoch": 0.16821229274559396, + "learning_rate": 0.00016635954875747724, + "loss": 0.7755, + "mean_token_accuracy": 0.7679441034793854, + "num_tokens": 57006665.0, + "step": 16760 + }, + { + "epoch": 0.16831265807539444, + "learning_rate": 0.00016633947569151712, + "loss": 0.7999, + "mean_token_accuracy": 0.7675316214561463, + "num_tokens": 57041029.0, + "step": 16770 + }, + { + "epoch": 0.1684130234051949, + "learning_rate": 0.00016631940262555703, + "loss": 0.7629, + "mean_token_accuracy": 0.7740450620651245, + "num_tokens": 57074771.0, + "step": 16780 + }, + { + "epoch": 0.16851338873499538, + "learning_rate": 0.00016629932955959694, + "loss": 0.7546, + "mean_token_accuracy": 0.7727279365062714, + "num_tokens": 57108544.0, + "step": 16790 + }, + { + "epoch": 0.16861375406479587, + "learning_rate": 0.00016627925649363685, + "loss": 0.7631, + "mean_token_accuracy": 0.7695836067199707, + "num_tokens": 57143451.0, + "step": 16800 + }, + { + "epoch": 0.16871411939459632, + "learning_rate": 0.00016625918342767676, + "loss": 0.7622, + "mean_token_accuracy": 0.7722588241100311, + "num_tokens": 57177527.0, + "step": 16810 + }, + { + "epoch": 0.1688144847243968, + "learning_rate": 0.00016623911036171666, + "loss": 0.755, + "mean_token_accuracy": 0.7699831604957581, + "num_tokens": 57211529.0, + "step": 16820 + }, + { + "epoch": 0.1689148500541973, + "learning_rate": 0.00016621903729575657, + "loss": 0.7404, + "mean_token_accuracy": 0.7806845128536224, + "num_tokens": 57245974.0, + "step": 16830 + }, + { + "epoch": 0.16901521538399775, + "learning_rate": 0.00016619896422979645, + "loss": 0.7864, + "mean_token_accuracy": 0.7693890869617462, + "num_tokens": 57280503.0, + "step": 16840 + }, + { + "epoch": 0.16911558071379823, + "learning_rate": 0.0001661788911638364, + "loss": 0.7749, + "mean_token_accuracy": 0.7683271586894989, + "num_tokens": 57314050.0, + "step": 16850 + }, + { + "epoch": 0.1692159460435987, + "learning_rate": 0.00016615881809787627, + "loss": 0.7742, + "mean_token_accuracy": 0.7672585129737854, + "num_tokens": 57348241.0, + "step": 16860 + }, + { + "epoch": 0.16931631137339917, + "learning_rate": 0.00016613874503191618, + "loss": 0.7563, + "mean_token_accuracy": 0.7712204933166504, + "num_tokens": 57382864.0, + "step": 16870 + }, + { + "epoch": 0.16941667670319965, + "learning_rate": 0.0001661186719659561, + "loss": 0.7912, + "mean_token_accuracy": 0.7650717854499817, + "num_tokens": 57416511.0, + "step": 16880 + }, + { + "epoch": 0.1695170420330001, + "learning_rate": 0.000166098598899996, + "loss": 0.7828, + "mean_token_accuracy": 0.7699388206005097, + "num_tokens": 57451135.0, + "step": 16890 + }, + { + "epoch": 0.1696174073628006, + "learning_rate": 0.0001660785258340359, + "loss": 0.7793, + "mean_token_accuracy": 0.7671032309532165, + "num_tokens": 57485805.0, + "step": 16900 + }, + { + "epoch": 0.16971777269260108, + "learning_rate": 0.0001660584527680758, + "loss": 0.7937, + "mean_token_accuracy": 0.7623134732246399, + "num_tokens": 57519798.0, + "step": 16910 + }, + { + "epoch": 0.16981813802240153, + "learning_rate": 0.00016603837970211572, + "loss": 0.7888, + "mean_token_accuracy": 0.7673300087451935, + "num_tokens": 57553778.0, + "step": 16920 + }, + { + "epoch": 0.16991850335220202, + "learning_rate": 0.0001660183066361556, + "loss": 0.7725, + "mean_token_accuracy": 0.7663509368896484, + "num_tokens": 57588052.0, + "step": 16930 + }, + { + "epoch": 0.1700188686820025, + "learning_rate": 0.00016599823357019554, + "loss": 0.7636, + "mean_token_accuracy": 0.7714050889015198, + "num_tokens": 57621687.0, + "step": 16940 + }, + { + "epoch": 0.17011923401180296, + "learning_rate": 0.00016597816050423542, + "loss": 0.7873, + "mean_token_accuracy": 0.7676332652568817, + "num_tokens": 57656223.0, + "step": 16950 + }, + { + "epoch": 0.17021959934160344, + "learning_rate": 0.00016595808743827533, + "loss": 0.7648, + "mean_token_accuracy": 0.7720965504646301, + "num_tokens": 57690924.0, + "step": 16960 + }, + { + "epoch": 0.17031996467140392, + "learning_rate": 0.00016593801437231524, + "loss": 0.7295, + "mean_token_accuracy": 0.7817053020000457, + "num_tokens": 57724855.0, + "step": 16970 + }, + { + "epoch": 0.17042033000120438, + "learning_rate": 0.00016591794130635515, + "loss": 0.8057, + "mean_token_accuracy": 0.7620230674743652, + "num_tokens": 57759081.0, + "step": 16980 + }, + { + "epoch": 0.17052069533100486, + "learning_rate": 0.00016589786824039503, + "loss": 0.7748, + "mean_token_accuracy": 0.7702114403247833, + "num_tokens": 57794046.0, + "step": 16990 + }, + { + "epoch": 0.17062106066080532, + "learning_rate": 0.00016587779517443496, + "loss": 0.7984, + "mean_token_accuracy": 0.7697321712970734, + "num_tokens": 57827455.0, + "step": 17000 + }, + { + "epoch": 0.1707214259906058, + "learning_rate": 0.00016585772210847484, + "loss": 0.7747, + "mean_token_accuracy": 0.7693339705467224, + "num_tokens": 57862864.0, + "step": 17010 + }, + { + "epoch": 0.17082179132040629, + "learning_rate": 0.00016583764904251475, + "loss": 0.7644, + "mean_token_accuracy": 0.772398829460144, + "num_tokens": 57896640.0, + "step": 17020 + }, + { + "epoch": 0.17092215665020674, + "learning_rate": 0.00016581757597655466, + "loss": 0.7361, + "mean_token_accuracy": 0.7789756894111634, + "num_tokens": 57930726.0, + "step": 17030 + }, + { + "epoch": 0.17102252198000722, + "learning_rate": 0.00016579750291059457, + "loss": 0.7665, + "mean_token_accuracy": 0.7718335926532746, + "num_tokens": 57963979.0, + "step": 17040 + }, + { + "epoch": 0.1711228873098077, + "learning_rate": 0.00016577742984463448, + "loss": 0.7406, + "mean_token_accuracy": 0.7737122237682342, + "num_tokens": 57997739.0, + "step": 17050 + }, + { + "epoch": 0.17122325263960816, + "learning_rate": 0.00016575735677867439, + "loss": 0.8044, + "mean_token_accuracy": 0.7606332123279571, + "num_tokens": 58030893.0, + "step": 17060 + }, + { + "epoch": 0.17132361796940865, + "learning_rate": 0.0001657372837127143, + "loss": 0.7719, + "mean_token_accuracy": 0.7710410356521606, + "num_tokens": 58065200.0, + "step": 17070 + }, + { + "epoch": 0.17142398329920913, + "learning_rate": 0.00016571721064675418, + "loss": 0.8052, + "mean_token_accuracy": 0.7625146746635437, + "num_tokens": 58098788.0, + "step": 17080 + }, + { + "epoch": 0.1715243486290096, + "learning_rate": 0.0001656971375807941, + "loss": 0.811, + "mean_token_accuracy": 0.7621822893619538, + "num_tokens": 58132803.0, + "step": 17090 + }, + { + "epoch": 0.17162471395881007, + "learning_rate": 0.000165677064514834, + "loss": 0.7644, + "mean_token_accuracy": 0.7708954095840455, + "num_tokens": 58166826.0, + "step": 17100 + }, + { + "epoch": 0.17172507928861055, + "learning_rate": 0.0001656569914488739, + "loss": 0.7519, + "mean_token_accuracy": 0.7677281260490417, + "num_tokens": 58201048.0, + "step": 17110 + }, + { + "epoch": 0.171825444618411, + "learning_rate": 0.0001656369183829138, + "loss": 0.7655, + "mean_token_accuracy": 0.7702815532684326, + "num_tokens": 58234789.0, + "step": 17120 + }, + { + "epoch": 0.1719258099482115, + "learning_rate": 0.00016561684531695372, + "loss": 0.7789, + "mean_token_accuracy": 0.7679742932319641, + "num_tokens": 58268627.0, + "step": 17130 + }, + { + "epoch": 0.17202617527801195, + "learning_rate": 0.00016559677225099363, + "loss": 0.7841, + "mean_token_accuracy": 0.7711734771728516, + "num_tokens": 58301797.0, + "step": 17140 + }, + { + "epoch": 0.17212654060781243, + "learning_rate": 0.00016557669918503353, + "loss": 0.808, + "mean_token_accuracy": 0.7599303185939789, + "num_tokens": 58336030.0, + "step": 17150 + }, + { + "epoch": 0.17222690593761292, + "learning_rate": 0.00016555662611907344, + "loss": 0.793, + "mean_token_accuracy": 0.759373950958252, + "num_tokens": 58369393.0, + "step": 17160 + }, + { + "epoch": 0.17232727126741337, + "learning_rate": 0.00016553655305311332, + "loss": 0.7565, + "mean_token_accuracy": 0.7763037025928498, + "num_tokens": 58403831.0, + "step": 17170 + }, + { + "epoch": 0.17242763659721386, + "learning_rate": 0.00016551647998715326, + "loss": 0.7921, + "mean_token_accuracy": 0.7688264667987823, + "num_tokens": 58437571.0, + "step": 17180 + }, + { + "epoch": 0.17252800192701434, + "learning_rate": 0.00016549640692119314, + "loss": 0.7961, + "mean_token_accuracy": 0.7655426859855652, + "num_tokens": 58470734.0, + "step": 17190 + }, + { + "epoch": 0.1726283672568148, + "learning_rate": 0.00016547633385523305, + "loss": 0.7725, + "mean_token_accuracy": 0.7713332056999207, + "num_tokens": 58504723.0, + "step": 17200 + }, + { + "epoch": 0.17272873258661528, + "learning_rate": 0.00016545626078927296, + "loss": 0.7972, + "mean_token_accuracy": 0.7661644756793976, + "num_tokens": 58539048.0, + "step": 17210 + }, + { + "epoch": 0.17282909791641576, + "learning_rate": 0.00016543618772331287, + "loss": 0.7798, + "mean_token_accuracy": 0.7684025287628173, + "num_tokens": 58574095.0, + "step": 17220 + }, + { + "epoch": 0.17292946324621622, + "learning_rate": 0.00016541611465735275, + "loss": 0.7969, + "mean_token_accuracy": 0.7652607381343841, + "num_tokens": 58607984.0, + "step": 17230 + }, + { + "epoch": 0.1730298285760167, + "learning_rate": 0.00016539604159139268, + "loss": 0.7865, + "mean_token_accuracy": 0.7680651903152466, + "num_tokens": 58641860.0, + "step": 17240 + }, + { + "epoch": 0.1731301939058172, + "learning_rate": 0.0001653759685254326, + "loss": 0.799, + "mean_token_accuracy": 0.761265105009079, + "num_tokens": 58675411.0, + "step": 17250 + }, + { + "epoch": 0.17323055923561764, + "learning_rate": 0.0001653558954594725, + "loss": 0.7661, + "mean_token_accuracy": 0.7691290080547333, + "num_tokens": 58709040.0, + "step": 17260 + }, + { + "epoch": 0.17333092456541813, + "learning_rate": 0.0001653358223935124, + "loss": 0.7858, + "mean_token_accuracy": 0.7651784241199493, + "num_tokens": 58743377.0, + "step": 17270 + }, + { + "epoch": 0.17343128989521858, + "learning_rate": 0.0001653157493275523, + "loss": 0.7788, + "mean_token_accuracy": 0.7682713389396667, + "num_tokens": 58776804.0, + "step": 17280 + }, + { + "epoch": 0.17353165522501907, + "learning_rate": 0.00016529567626159223, + "loss": 0.7371, + "mean_token_accuracy": 0.7746301293373108, + "num_tokens": 58810322.0, + "step": 17290 + }, + { + "epoch": 0.17363202055481955, + "learning_rate": 0.0001652756031956321, + "loss": 0.7754, + "mean_token_accuracy": 0.769923746585846, + "num_tokens": 58844019.0, + "step": 17300 + }, + { + "epoch": 0.17373238588462, + "learning_rate": 0.00016525553012967202, + "loss": 0.7643, + "mean_token_accuracy": 0.7680152416229248, + "num_tokens": 58878254.0, + "step": 17310 + }, + { + "epoch": 0.1738327512144205, + "learning_rate": 0.00016523545706371192, + "loss": 0.7867, + "mean_token_accuracy": 0.7672698497772217, + "num_tokens": 58913152.0, + "step": 17320 + }, + { + "epoch": 0.17393311654422097, + "learning_rate": 0.00016521538399775183, + "loss": 0.7675, + "mean_token_accuracy": 0.769359028339386, + "num_tokens": 58947238.0, + "step": 17330 + }, + { + "epoch": 0.17403348187402143, + "learning_rate": 0.00016519531093179171, + "loss": 0.7503, + "mean_token_accuracy": 0.7771645188331604, + "num_tokens": 58980919.0, + "step": 17340 + }, + { + "epoch": 0.1741338472038219, + "learning_rate": 0.00016517523786583165, + "loss": 0.7815, + "mean_token_accuracy": 0.7696813583374024, + "num_tokens": 59014821.0, + "step": 17350 + }, + { + "epoch": 0.1742342125336224, + "learning_rate": 0.00016515516479987153, + "loss": 0.7638, + "mean_token_accuracy": 0.7662936210632324, + "num_tokens": 59048470.0, + "step": 17360 + }, + { + "epoch": 0.17433457786342285, + "learning_rate": 0.00016513509173391144, + "loss": 0.7817, + "mean_token_accuracy": 0.7683330059051514, + "num_tokens": 59081997.0, + "step": 17370 + }, + { + "epoch": 0.17443494319322334, + "learning_rate": 0.00016511501866795135, + "loss": 0.784, + "mean_token_accuracy": 0.7709557950496674, + "num_tokens": 59116091.0, + "step": 17380 + }, + { + "epoch": 0.17453530852302382, + "learning_rate": 0.00016509494560199126, + "loss": 0.78, + "mean_token_accuracy": 0.7627904713153839, + "num_tokens": 59150435.0, + "step": 17390 + }, + { + "epoch": 0.17463567385282427, + "learning_rate": 0.00016507487253603116, + "loss": 0.7695, + "mean_token_accuracy": 0.7699004292488099, + "num_tokens": 59184392.0, + "step": 17400 + }, + { + "epoch": 0.17473603918262476, + "learning_rate": 0.00016505479947007107, + "loss": 0.7657, + "mean_token_accuracy": 0.7727609097957611, + "num_tokens": 59218019.0, + "step": 17410 + }, + { + "epoch": 0.17483640451242521, + "learning_rate": 0.00016503472640411098, + "loss": 0.779, + "mean_token_accuracy": 0.7669853568077087, + "num_tokens": 59252988.0, + "step": 17420 + }, + { + "epoch": 0.1749367698422257, + "learning_rate": 0.00016501465333815086, + "loss": 0.7597, + "mean_token_accuracy": 0.7775791406631469, + "num_tokens": 59287957.0, + "step": 17430 + }, + { + "epoch": 0.17503713517202618, + "learning_rate": 0.0001649945802721908, + "loss": 0.773, + "mean_token_accuracy": 0.7717095196247101, + "num_tokens": 59321479.0, + "step": 17440 + }, + { + "epoch": 0.17513750050182664, + "learning_rate": 0.00016497450720623068, + "loss": 0.7786, + "mean_token_accuracy": 0.7710772454738617, + "num_tokens": 59355315.0, + "step": 17450 + }, + { + "epoch": 0.17523786583162712, + "learning_rate": 0.0001649544341402706, + "loss": 0.7544, + "mean_token_accuracy": 0.779824960231781, + "num_tokens": 59388451.0, + "step": 17460 + }, + { + "epoch": 0.1753382311614276, + "learning_rate": 0.0001649343610743105, + "loss": 0.7758, + "mean_token_accuracy": 0.7695206284523011, + "num_tokens": 59421993.0, + "step": 17470 + }, + { + "epoch": 0.17543859649122806, + "learning_rate": 0.0001649142880083504, + "loss": 0.7765, + "mean_token_accuracy": 0.7642025172710418, + "num_tokens": 59455941.0, + "step": 17480 + }, + { + "epoch": 0.17553896182102854, + "learning_rate": 0.0001648942149423903, + "loss": 0.7675, + "mean_token_accuracy": 0.7715909838676452, + "num_tokens": 59489901.0, + "step": 17490 + }, + { + "epoch": 0.17563932715082903, + "learning_rate": 0.00016487414187643022, + "loss": 0.7584, + "mean_token_accuracy": 0.7685763359069824, + "num_tokens": 59523829.0, + "step": 17500 + }, + { + "epoch": 0.17573969248062948, + "learning_rate": 0.00016485406881047013, + "loss": 0.796, + "mean_token_accuracy": 0.7640321314334869, + "num_tokens": 59557675.0, + "step": 17510 + }, + { + "epoch": 0.17584005781042997, + "learning_rate": 0.00016483399574451, + "loss": 0.79, + "mean_token_accuracy": 0.768464207649231, + "num_tokens": 59591396.0, + "step": 17520 + }, + { + "epoch": 0.17594042314023045, + "learning_rate": 0.00016481392267854995, + "loss": 0.7907, + "mean_token_accuracy": 0.7635212242603302, + "num_tokens": 59624772.0, + "step": 17530 + }, + { + "epoch": 0.1760407884700309, + "learning_rate": 0.00016479384961258983, + "loss": 0.7781, + "mean_token_accuracy": 0.7647325575351716, + "num_tokens": 59658505.0, + "step": 17540 + }, + { + "epoch": 0.1761411537998314, + "learning_rate": 0.00016477377654662974, + "loss": 0.8023, + "mean_token_accuracy": 0.7604661285877228, + "num_tokens": 59693441.0, + "step": 17550 + }, + { + "epoch": 0.17624151912963185, + "learning_rate": 0.00016475370348066964, + "loss": 0.7838, + "mean_token_accuracy": 0.7707070887088776, + "num_tokens": 59726652.0, + "step": 17560 + }, + { + "epoch": 0.17634188445943233, + "learning_rate": 0.00016473363041470955, + "loss": 0.7861, + "mean_token_accuracy": 0.7668064892292022, + "num_tokens": 59760757.0, + "step": 17570 + }, + { + "epoch": 0.1764422497892328, + "learning_rate": 0.00016471355734874943, + "loss": 0.7494, + "mean_token_accuracy": 0.7720450818538666, + "num_tokens": 59795084.0, + "step": 17580 + }, + { + "epoch": 0.17654261511903327, + "learning_rate": 0.00016469348428278937, + "loss": 0.7783, + "mean_token_accuracy": 0.7722791850566864, + "num_tokens": 59828670.0, + "step": 17590 + }, + { + "epoch": 0.17664298044883375, + "learning_rate": 0.00016467341121682928, + "loss": 0.786, + "mean_token_accuracy": 0.7623280882835388, + "num_tokens": 59862929.0, + "step": 17600 + }, + { + "epoch": 0.17674334577863424, + "learning_rate": 0.00016465333815086916, + "loss": 0.7719, + "mean_token_accuracy": 0.7731631696224213, + "num_tokens": 59896994.0, + "step": 17610 + }, + { + "epoch": 0.1768437111084347, + "learning_rate": 0.0001646332650849091, + "loss": 0.7781, + "mean_token_accuracy": 0.7665385782718659, + "num_tokens": 59931868.0, + "step": 17620 + }, + { + "epoch": 0.17694407643823518, + "learning_rate": 0.00016461319201894898, + "loss": 0.7798, + "mean_token_accuracy": 0.7663361430168152, + "num_tokens": 59965609.0, + "step": 17630 + }, + { + "epoch": 0.17704444176803566, + "learning_rate": 0.00016459311895298889, + "loss": 0.7684, + "mean_token_accuracy": 0.772375512123108, + "num_tokens": 60000021.0, + "step": 17640 + }, + { + "epoch": 0.17714480709783612, + "learning_rate": 0.0001645730458870288, + "loss": 0.7677, + "mean_token_accuracy": 0.775952297449112, + "num_tokens": 60033294.0, + "step": 17650 + }, + { + "epoch": 0.1772451724276366, + "learning_rate": 0.0001645529728210687, + "loss": 0.734, + "mean_token_accuracy": 0.7766773700714111, + "num_tokens": 60066604.0, + "step": 17660 + }, + { + "epoch": 0.17734553775743708, + "learning_rate": 0.00016453289975510858, + "loss": 0.7978, + "mean_token_accuracy": 0.7641145765781403, + "num_tokens": 60101585.0, + "step": 17670 + }, + { + "epoch": 0.17744590308723754, + "learning_rate": 0.00016451282668914852, + "loss": 0.7697, + "mean_token_accuracy": 0.7713691294193268, + "num_tokens": 60135502.0, + "step": 17680 + }, + { + "epoch": 0.17754626841703802, + "learning_rate": 0.0001644927536231884, + "loss": 0.7834, + "mean_token_accuracy": 0.7656452357769012, + "num_tokens": 60168785.0, + "step": 17690 + }, + { + "epoch": 0.1776466337468385, + "learning_rate": 0.0001644726805572283, + "loss": 0.7761, + "mean_token_accuracy": 0.7686882853507996, + "num_tokens": 60203573.0, + "step": 17700 + }, + { + "epoch": 0.17774699907663896, + "learning_rate": 0.00016445260749126822, + "loss": 0.7113, + "mean_token_accuracy": 0.7895864546298981, + "num_tokens": 60236447.0, + "step": 17710 + }, + { + "epoch": 0.17784736440643945, + "learning_rate": 0.00016443253442530813, + "loss": 0.8131, + "mean_token_accuracy": 0.7609871804714203, + "num_tokens": 60270141.0, + "step": 17720 + }, + { + "epoch": 0.1779477297362399, + "learning_rate": 0.00016441246135934803, + "loss": 0.7605, + "mean_token_accuracy": 0.7759998798370361, + "num_tokens": 60304104.0, + "step": 17730 + }, + { + "epoch": 0.17804809506604038, + "learning_rate": 0.00016439238829338794, + "loss": 0.7951, + "mean_token_accuracy": 0.7703262507915497, + "num_tokens": 60339135.0, + "step": 17740 + }, + { + "epoch": 0.17814846039584087, + "learning_rate": 0.00016437231522742785, + "loss": 0.7537, + "mean_token_accuracy": 0.7827511548995971, + "num_tokens": 60372199.0, + "step": 17750 + }, + { + "epoch": 0.17824882572564132, + "learning_rate": 0.00016435224216146773, + "loss": 0.7809, + "mean_token_accuracy": 0.7661384582519531, + "num_tokens": 60406203.0, + "step": 17760 + }, + { + "epoch": 0.1783491910554418, + "learning_rate": 0.00016433216909550767, + "loss": 0.7537, + "mean_token_accuracy": 0.7733368217945099, + "num_tokens": 60440957.0, + "step": 17770 + }, + { + "epoch": 0.1784495563852423, + "learning_rate": 0.00016431209602954755, + "loss": 0.7609, + "mean_token_accuracy": 0.7707456469535827, + "num_tokens": 60474679.0, + "step": 17780 + }, + { + "epoch": 0.17854992171504275, + "learning_rate": 0.00016429202296358746, + "loss": 0.7746, + "mean_token_accuracy": 0.7717380285263061, + "num_tokens": 60508245.0, + "step": 17790 + }, + { + "epoch": 0.17865028704484323, + "learning_rate": 0.00016427194989762737, + "loss": 0.7562, + "mean_token_accuracy": 0.7732972860336303, + "num_tokens": 60542678.0, + "step": 17800 + }, + { + "epoch": 0.17875065237464371, + "learning_rate": 0.00016425187683166727, + "loss": 0.7824, + "mean_token_accuracy": 0.7712754130363464, + "num_tokens": 60576155.0, + "step": 17810 + }, + { + "epoch": 0.17885101770444417, + "learning_rate": 0.00016423180376570718, + "loss": 0.7676, + "mean_token_accuracy": 0.7724056899547577, + "num_tokens": 60610482.0, + "step": 17820 + }, + { + "epoch": 0.17895138303424465, + "learning_rate": 0.0001642117306997471, + "loss": 0.7597, + "mean_token_accuracy": 0.7675942838191986, + "num_tokens": 60644434.0, + "step": 17830 + }, + { + "epoch": 0.17905174836404514, + "learning_rate": 0.000164191657633787, + "loss": 0.7697, + "mean_token_accuracy": 0.7697039902210235, + "num_tokens": 60678529.0, + "step": 17840 + }, + { + "epoch": 0.1791521136938456, + "learning_rate": 0.0001641715845678269, + "loss": 0.7635, + "mean_token_accuracy": 0.7731961727142334, + "num_tokens": 60712066.0, + "step": 17850 + }, + { + "epoch": 0.17925247902364608, + "learning_rate": 0.00016415151150186682, + "loss": 0.7939, + "mean_token_accuracy": 0.7673891663551331, + "num_tokens": 60746415.0, + "step": 17860 + }, + { + "epoch": 0.17935284435344653, + "learning_rate": 0.0001641314384359067, + "loss": 0.7814, + "mean_token_accuracy": 0.7660547375679017, + "num_tokens": 60780453.0, + "step": 17870 + }, + { + "epoch": 0.17945320968324702, + "learning_rate": 0.00016411136536994663, + "loss": 0.7414, + "mean_token_accuracy": 0.7775905013084412, + "num_tokens": 60815219.0, + "step": 17880 + }, + { + "epoch": 0.1795535750130475, + "learning_rate": 0.00016409129230398651, + "loss": 0.7779, + "mean_token_accuracy": 0.7698129117488861, + "num_tokens": 60849708.0, + "step": 17890 + }, + { + "epoch": 0.17965394034284796, + "learning_rate": 0.00016407121923802642, + "loss": 0.8327, + "mean_token_accuracy": 0.7578640341758728, + "num_tokens": 60882991.0, + "step": 17900 + }, + { + "epoch": 0.17975430567264844, + "learning_rate": 0.00016405114617206633, + "loss": 0.7803, + "mean_token_accuracy": 0.7644511163234711, + "num_tokens": 60916793.0, + "step": 17910 + }, + { + "epoch": 0.17985467100244892, + "learning_rate": 0.00016403107310610624, + "loss": 0.7698, + "mean_token_accuracy": 0.7728886902332306, + "num_tokens": 60951248.0, + "step": 17920 + }, + { + "epoch": 0.17995503633224938, + "learning_rate": 0.00016401100004014612, + "loss": 0.78, + "mean_token_accuracy": 0.7688422322273254, + "num_tokens": 60984506.0, + "step": 17930 + }, + { + "epoch": 0.18005540166204986, + "learning_rate": 0.00016399092697418606, + "loss": 0.7535, + "mean_token_accuracy": 0.7761100590229034, + "num_tokens": 61017911.0, + "step": 17940 + }, + { + "epoch": 0.18015576699185035, + "learning_rate": 0.00016397085390822597, + "loss": 0.8006, + "mean_token_accuracy": 0.7644067168235779, + "num_tokens": 61053525.0, + "step": 17950 + }, + { + "epoch": 0.1802561323216508, + "learning_rate": 0.00016395078084226585, + "loss": 0.7547, + "mean_token_accuracy": 0.7717255651950836, + "num_tokens": 61087497.0, + "step": 17960 + }, + { + "epoch": 0.1803564976514513, + "learning_rate": 0.00016393070777630578, + "loss": 0.795, + "mean_token_accuracy": 0.7677553355693817, + "num_tokens": 61122792.0, + "step": 17970 + }, + { + "epoch": 0.18045686298125177, + "learning_rate": 0.00016391063471034566, + "loss": 0.7721, + "mean_token_accuracy": 0.7706233382225036, + "num_tokens": 61157415.0, + "step": 17980 + }, + { + "epoch": 0.18055722831105223, + "learning_rate": 0.00016389056164438557, + "loss": 0.7637, + "mean_token_accuracy": 0.7725520610809327, + "num_tokens": 61190629.0, + "step": 17990 + }, + { + "epoch": 0.1806575936408527, + "learning_rate": 0.00016387048857842548, + "loss": 0.7434, + "mean_token_accuracy": 0.7789816677570343, + "num_tokens": 61224902.0, + "step": 18000 + }, + { + "epoch": 0.18075795897065317, + "learning_rate": 0.0001638504155124654, + "loss": 0.7332, + "mean_token_accuracy": 0.7772551894187927, + "num_tokens": 61259118.0, + "step": 18010 + }, + { + "epoch": 0.18085832430045365, + "learning_rate": 0.00016383034244650527, + "loss": 0.8069, + "mean_token_accuracy": 0.7600550413131714, + "num_tokens": 61293836.0, + "step": 18020 + }, + { + "epoch": 0.18095868963025413, + "learning_rate": 0.0001638102693805452, + "loss": 0.7707, + "mean_token_accuracy": 0.7729291975498199, + "num_tokens": 61327575.0, + "step": 18030 + }, + { + "epoch": 0.1810590549600546, + "learning_rate": 0.0001637901963145851, + "loss": 0.7643, + "mean_token_accuracy": 0.7731200933456421, + "num_tokens": 61361526.0, + "step": 18040 + }, + { + "epoch": 0.18115942028985507, + "learning_rate": 0.000163770123248625, + "loss": 0.7899, + "mean_token_accuracy": 0.7629842936992646, + "num_tokens": 61396000.0, + "step": 18050 + }, + { + "epoch": 0.18125978561965556, + "learning_rate": 0.0001637500501826649, + "loss": 0.7853, + "mean_token_accuracy": 0.7604344427585602, + "num_tokens": 61430117.0, + "step": 18060 + }, + { + "epoch": 0.181360150949456, + "learning_rate": 0.0001637299771167048, + "loss": 0.7893, + "mean_token_accuracy": 0.766669875383377, + "num_tokens": 61463966.0, + "step": 18070 + }, + { + "epoch": 0.1814605162792565, + "learning_rate": 0.00016370990405074472, + "loss": 0.7824, + "mean_token_accuracy": 0.7696913361549378, + "num_tokens": 61497639.0, + "step": 18080 + }, + { + "epoch": 0.18156088160905698, + "learning_rate": 0.00016368983098478463, + "loss": 0.7629, + "mean_token_accuracy": 0.77036554813385, + "num_tokens": 61532293.0, + "step": 18090 + }, + { + "epoch": 0.18166124693885743, + "learning_rate": 0.00016366975791882454, + "loss": 0.7699, + "mean_token_accuracy": 0.7703576445579529, + "num_tokens": 61567287.0, + "step": 18100 + }, + { + "epoch": 0.18176161226865792, + "learning_rate": 0.00016364968485286442, + "loss": 0.7715, + "mean_token_accuracy": 0.7734453499317169, + "num_tokens": 61601581.0, + "step": 18110 + }, + { + "epoch": 0.1818619775984584, + "learning_rate": 0.00016362961178690435, + "loss": 0.7609, + "mean_token_accuracy": 0.7735493004322052, + "num_tokens": 61636230.0, + "step": 18120 + }, + { + "epoch": 0.18196234292825886, + "learning_rate": 0.00016360953872094424, + "loss": 0.7957, + "mean_token_accuracy": 0.7671381592750549, + "num_tokens": 61670977.0, + "step": 18130 + }, + { + "epoch": 0.18206270825805934, + "learning_rate": 0.00016358946565498414, + "loss": 0.7564, + "mean_token_accuracy": 0.7743266701698304, + "num_tokens": 61704761.0, + "step": 18140 + }, + { + "epoch": 0.1821630735878598, + "learning_rate": 0.00016356939258902405, + "loss": 0.793, + "mean_token_accuracy": 0.7678810358047485, + "num_tokens": 61738979.0, + "step": 18150 + }, + { + "epoch": 0.18226343891766028, + "learning_rate": 0.00016354931952306396, + "loss": 0.7911, + "mean_token_accuracy": 0.7643441200256348, + "num_tokens": 61772803.0, + "step": 18160 + }, + { + "epoch": 0.18236380424746076, + "learning_rate": 0.00016352924645710387, + "loss": 0.7843, + "mean_token_accuracy": 0.7699290454387665, + "num_tokens": 61806363.0, + "step": 18170 + }, + { + "epoch": 0.18246416957726122, + "learning_rate": 0.00016350917339114378, + "loss": 0.7534, + "mean_token_accuracy": 0.774201774597168, + "num_tokens": 61839436.0, + "step": 18180 + }, + { + "epoch": 0.1825645349070617, + "learning_rate": 0.0001634891003251837, + "loss": 0.738, + "mean_token_accuracy": 0.7790593385696412, + "num_tokens": 61873826.0, + "step": 18190 + }, + { + "epoch": 0.1826649002368622, + "learning_rate": 0.00016346902725922357, + "loss": 0.7757, + "mean_token_accuracy": 0.769185584783554, + "num_tokens": 61907947.0, + "step": 18200 + }, + { + "epoch": 0.18276526556666264, + "learning_rate": 0.0001634489541932635, + "loss": 0.7885, + "mean_token_accuracy": 0.7664050936698914, + "num_tokens": 61942529.0, + "step": 18210 + }, + { + "epoch": 0.18286563089646313, + "learning_rate": 0.00016342888112730338, + "loss": 0.7384, + "mean_token_accuracy": 0.7730357885360718, + "num_tokens": 61976876.0, + "step": 18220 + }, + { + "epoch": 0.1829659962262636, + "learning_rate": 0.0001634088080613433, + "loss": 0.8061, + "mean_token_accuracy": 0.7635744273662567, + "num_tokens": 62011317.0, + "step": 18230 + }, + { + "epoch": 0.18306636155606407, + "learning_rate": 0.0001633887349953832, + "loss": 0.7827, + "mean_token_accuracy": 0.7664428949356079, + "num_tokens": 62045627.0, + "step": 18240 + }, + { + "epoch": 0.18316672688586455, + "learning_rate": 0.0001633686619294231, + "loss": 0.7815, + "mean_token_accuracy": 0.7628428339958191, + "num_tokens": 62079421.0, + "step": 18250 + }, + { + "epoch": 0.18326709221566503, + "learning_rate": 0.000163348588863463, + "loss": 0.7451, + "mean_token_accuracy": 0.7762756168842315, + "num_tokens": 62114007.0, + "step": 18260 + }, + { + "epoch": 0.1833674575454655, + "learning_rate": 0.00016332851579750293, + "loss": 0.7622, + "mean_token_accuracy": 0.7699788212776184, + "num_tokens": 62148214.0, + "step": 18270 + }, + { + "epoch": 0.18346782287526597, + "learning_rate": 0.0001633084427315428, + "loss": 0.7885, + "mean_token_accuracy": 0.7681151330471039, + "num_tokens": 62182380.0, + "step": 18280 + }, + { + "epoch": 0.18356818820506643, + "learning_rate": 0.00016328836966558272, + "loss": 0.7658, + "mean_token_accuracy": 0.7687394440174102, + "num_tokens": 62216320.0, + "step": 18290 + }, + { + "epoch": 0.1836685535348669, + "learning_rate": 0.00016326829659962263, + "loss": 0.786, + "mean_token_accuracy": 0.7645105063915253, + "num_tokens": 62249609.0, + "step": 18300 + }, + { + "epoch": 0.1837689188646674, + "learning_rate": 0.00016324822353366253, + "loss": 0.7733, + "mean_token_accuracy": 0.7732066512107849, + "num_tokens": 62283605.0, + "step": 18310 + }, + { + "epoch": 0.18386928419446785, + "learning_rate": 0.00016322815046770244, + "loss": 0.8099, + "mean_token_accuracy": 0.7657205998897553, + "num_tokens": 62318429.0, + "step": 18320 + }, + { + "epoch": 0.18396964952426834, + "learning_rate": 0.00016320807740174235, + "loss": 0.7684, + "mean_token_accuracy": 0.7653166830539704, + "num_tokens": 62352475.0, + "step": 18330 + }, + { + "epoch": 0.18407001485406882, + "learning_rate": 0.00016318800433578226, + "loss": 0.7986, + "mean_token_accuracy": 0.7597263157367706, + "num_tokens": 62386501.0, + "step": 18340 + }, + { + "epoch": 0.18417038018386928, + "learning_rate": 0.00016316793126982214, + "loss": 0.7243, + "mean_token_accuracy": 0.7759540557861329, + "num_tokens": 62420011.0, + "step": 18350 + }, + { + "epoch": 0.18427074551366976, + "learning_rate": 0.00016314785820386208, + "loss": 0.7555, + "mean_token_accuracy": 0.7748587667942047, + "num_tokens": 62454044.0, + "step": 18360 + }, + { + "epoch": 0.18437111084347024, + "learning_rate": 0.00016312778513790196, + "loss": 0.7768, + "mean_token_accuracy": 0.7700540661811829, + "num_tokens": 62488487.0, + "step": 18370 + }, + { + "epoch": 0.1844714761732707, + "learning_rate": 0.0001631077120719419, + "loss": 0.7639, + "mean_token_accuracy": 0.7720458507537842, + "num_tokens": 62522346.0, + "step": 18380 + }, + { + "epoch": 0.18457184150307118, + "learning_rate": 0.00016308763900598177, + "loss": 0.7841, + "mean_token_accuracy": 0.768638151884079, + "num_tokens": 62556694.0, + "step": 18390 + }, + { + "epoch": 0.18467220683287167, + "learning_rate": 0.00016306756594002168, + "loss": 0.7451, + "mean_token_accuracy": 0.7727836549282074, + "num_tokens": 62590509.0, + "step": 18400 + }, + { + "epoch": 0.18477257216267212, + "learning_rate": 0.0001630474928740616, + "loss": 0.7609, + "mean_token_accuracy": 0.7713655471801758, + "num_tokens": 62624925.0, + "step": 18410 + }, + { + "epoch": 0.1848729374924726, + "learning_rate": 0.0001630274198081015, + "loss": 0.8011, + "mean_token_accuracy": 0.7590881168842316, + "num_tokens": 62659270.0, + "step": 18420 + }, + { + "epoch": 0.18497330282227306, + "learning_rate": 0.0001630073467421414, + "loss": 0.7709, + "mean_token_accuracy": 0.7708830296993255, + "num_tokens": 62693910.0, + "step": 18430 + }, + { + "epoch": 0.18507366815207354, + "learning_rate": 0.00016298727367618132, + "loss": 0.7835, + "mean_token_accuracy": 0.7661713480949401, + "num_tokens": 62727733.0, + "step": 18440 + }, + { + "epoch": 0.18517403348187403, + "learning_rate": 0.00016296720061022122, + "loss": 0.7698, + "mean_token_accuracy": 0.7711425065994263, + "num_tokens": 62762110.0, + "step": 18450 + }, + { + "epoch": 0.18527439881167448, + "learning_rate": 0.0001629471275442611, + "loss": 0.7355, + "mean_token_accuracy": 0.7776850581169128, + "num_tokens": 62796340.0, + "step": 18460 + }, + { + "epoch": 0.18537476414147497, + "learning_rate": 0.00016292705447830104, + "loss": 0.8002, + "mean_token_accuracy": 0.76320121884346, + "num_tokens": 62830746.0, + "step": 18470 + }, + { + "epoch": 0.18547512947127545, + "learning_rate": 0.00016290698141234092, + "loss": 0.8161, + "mean_token_accuracy": 0.7639877259731293, + "num_tokens": 62864457.0, + "step": 18480 + }, + { + "epoch": 0.1855754948010759, + "learning_rate": 0.00016288690834638083, + "loss": 0.7759, + "mean_token_accuracy": 0.7661233425140381, + "num_tokens": 62897935.0, + "step": 18490 + }, + { + "epoch": 0.1856758601308764, + "learning_rate": 0.00016286683528042074, + "loss": 0.7715, + "mean_token_accuracy": 0.7745231449604034, + "num_tokens": 62931317.0, + "step": 18500 + }, + { + "epoch": 0.18577622546067687, + "learning_rate": 0.00016284676221446065, + "loss": 0.764, + "mean_token_accuracy": 0.7681089520454407, + "num_tokens": 62966225.0, + "step": 18510 + }, + { + "epoch": 0.18587659079047733, + "learning_rate": 0.00016282668914850056, + "loss": 0.7418, + "mean_token_accuracy": 0.7758630812168121, + "num_tokens": 62999601.0, + "step": 18520 + }, + { + "epoch": 0.18597695612027781, + "learning_rate": 0.00016280661608254047, + "loss": 0.7502, + "mean_token_accuracy": 0.7772676169872283, + "num_tokens": 63034028.0, + "step": 18530 + }, + { + "epoch": 0.1860773214500783, + "learning_rate": 0.00016278654301658037, + "loss": 0.7602, + "mean_token_accuracy": 0.77999187707901, + "num_tokens": 63068275.0, + "step": 18540 + }, + { + "epoch": 0.18617768677987875, + "learning_rate": 0.00016276646995062025, + "loss": 0.7471, + "mean_token_accuracy": 0.7712823390960694, + "num_tokens": 63102226.0, + "step": 18550 + }, + { + "epoch": 0.18627805210967924, + "learning_rate": 0.0001627463968846602, + "loss": 0.7632, + "mean_token_accuracy": 0.7757633328437805, + "num_tokens": 63136322.0, + "step": 18560 + }, + { + "epoch": 0.1863784174394797, + "learning_rate": 0.00016272632381870007, + "loss": 0.8076, + "mean_token_accuracy": 0.7684038341045379, + "num_tokens": 63169950.0, + "step": 18570 + }, + { + "epoch": 0.18647878276928018, + "learning_rate": 0.00016270625075273998, + "loss": 0.7681, + "mean_token_accuracy": 0.7748810112476349, + "num_tokens": 63204442.0, + "step": 18580 + }, + { + "epoch": 0.18657914809908066, + "learning_rate": 0.0001626861776867799, + "loss": 0.7866, + "mean_token_accuracy": 0.7683030843734742, + "num_tokens": 63237776.0, + "step": 18590 + }, + { + "epoch": 0.18667951342888112, + "learning_rate": 0.0001626661046208198, + "loss": 0.7459, + "mean_token_accuracy": 0.7781949758529663, + "num_tokens": 63271701.0, + "step": 18600 + }, + { + "epoch": 0.1867798787586816, + "learning_rate": 0.00016264603155485968, + "loss": 0.772, + "mean_token_accuracy": 0.7715380012989044, + "num_tokens": 63305993.0, + "step": 18610 + }, + { + "epoch": 0.18688024408848208, + "learning_rate": 0.00016262595848889961, + "loss": 0.7893, + "mean_token_accuracy": 0.7674874544143677, + "num_tokens": 63340482.0, + "step": 18620 + }, + { + "epoch": 0.18698060941828254, + "learning_rate": 0.0001626058854229395, + "loss": 0.7756, + "mean_token_accuracy": 0.7720118045806885, + "num_tokens": 63374747.0, + "step": 18630 + }, + { + "epoch": 0.18708097474808302, + "learning_rate": 0.0001625858123569794, + "loss": 0.7554, + "mean_token_accuracy": 0.7776407539844513, + "num_tokens": 63409758.0, + "step": 18640 + }, + { + "epoch": 0.1871813400778835, + "learning_rate": 0.0001625657392910193, + "loss": 0.7874, + "mean_token_accuracy": 0.7663829922676086, + "num_tokens": 63443948.0, + "step": 18650 + }, + { + "epoch": 0.18728170540768396, + "learning_rate": 0.00016254566622505922, + "loss": 0.7333, + "mean_token_accuracy": 0.7760569155216217, + "num_tokens": 63477292.0, + "step": 18660 + }, + { + "epoch": 0.18738207073748445, + "learning_rate": 0.00016252559315909913, + "loss": 0.7723, + "mean_token_accuracy": 0.7722366213798523, + "num_tokens": 63512263.0, + "step": 18670 + }, + { + "epoch": 0.18748243606728493, + "learning_rate": 0.00016250552009313904, + "loss": 0.7733, + "mean_token_accuracy": 0.7722975015640259, + "num_tokens": 63546456.0, + "step": 18680 + }, + { + "epoch": 0.18758280139708539, + "learning_rate": 0.00016248544702717895, + "loss": 0.7483, + "mean_token_accuracy": 0.7726555287837982, + "num_tokens": 63580150.0, + "step": 18690 + }, + { + "epoch": 0.18768316672688587, + "learning_rate": 0.00016246537396121883, + "loss": 0.7964, + "mean_token_accuracy": 0.7653996467590332, + "num_tokens": 63613575.0, + "step": 18700 + }, + { + "epoch": 0.18778353205668633, + "learning_rate": 0.00016244530089525876, + "loss": 0.7967, + "mean_token_accuracy": 0.7680726945400238, + "num_tokens": 63647897.0, + "step": 18710 + }, + { + "epoch": 0.1878838973864868, + "learning_rate": 0.00016242522782929864, + "loss": 0.761, + "mean_token_accuracy": 0.7686357796192169, + "num_tokens": 63682485.0, + "step": 18720 + }, + { + "epoch": 0.1879842627162873, + "learning_rate": 0.00016240515476333855, + "loss": 0.7723, + "mean_token_accuracy": 0.7725031673908234, + "num_tokens": 63716708.0, + "step": 18730 + }, + { + "epoch": 0.18808462804608775, + "learning_rate": 0.00016238508169737846, + "loss": 0.7876, + "mean_token_accuracy": 0.7653063297271728, + "num_tokens": 63750589.0, + "step": 18740 + }, + { + "epoch": 0.18818499337588823, + "learning_rate": 0.00016236500863141837, + "loss": 0.75, + "mean_token_accuracy": 0.7706561863422394, + "num_tokens": 63784726.0, + "step": 18750 + }, + { + "epoch": 0.18828535870568872, + "learning_rate": 0.00016234493556545828, + "loss": 0.7524, + "mean_token_accuracy": 0.7732706964015961, + "num_tokens": 63818732.0, + "step": 18760 + }, + { + "epoch": 0.18838572403548917, + "learning_rate": 0.00016232486249949819, + "loss": 0.7756, + "mean_token_accuracy": 0.771875262260437, + "num_tokens": 63852581.0, + "step": 18770 + }, + { + "epoch": 0.18848608936528966, + "learning_rate": 0.0001623047894335381, + "loss": 0.7364, + "mean_token_accuracy": 0.7823958218097686, + "num_tokens": 63887370.0, + "step": 18780 + }, + { + "epoch": 0.18858645469509014, + "learning_rate": 0.00016228471636757798, + "loss": 0.7522, + "mean_token_accuracy": 0.7735142648220062, + "num_tokens": 63921195.0, + "step": 18790 + }, + { + "epoch": 0.1886868200248906, + "learning_rate": 0.0001622646433016179, + "loss": 0.7942, + "mean_token_accuracy": 0.7688505411148071, + "num_tokens": 63955282.0, + "step": 18800 + }, + { + "epoch": 0.18878718535469108, + "learning_rate": 0.0001622445702356578, + "loss": 0.7245, + "mean_token_accuracy": 0.7823804557323456, + "num_tokens": 63989952.0, + "step": 18810 + }, + { + "epoch": 0.18888755068449156, + "learning_rate": 0.0001622244971696977, + "loss": 0.7704, + "mean_token_accuracy": 0.7732816517353058, + "num_tokens": 64024831.0, + "step": 18820 + }, + { + "epoch": 0.18898791601429202, + "learning_rate": 0.0001622044241037376, + "loss": 0.7837, + "mean_token_accuracy": 0.7630086898803711, + "num_tokens": 64057698.0, + "step": 18830 + }, + { + "epoch": 0.1890882813440925, + "learning_rate": 0.00016218435103777752, + "loss": 0.788, + "mean_token_accuracy": 0.7682810366153717, + "num_tokens": 64091622.0, + "step": 18840 + }, + { + "epoch": 0.18918864667389296, + "learning_rate": 0.00016216427797181743, + "loss": 0.774, + "mean_token_accuracy": 0.763655811548233, + "num_tokens": 64125909.0, + "step": 18850 + }, + { + "epoch": 0.18928901200369344, + "learning_rate": 0.00016214420490585733, + "loss": 0.7757, + "mean_token_accuracy": 0.7707290172576904, + "num_tokens": 64159547.0, + "step": 18860 + }, + { + "epoch": 0.18938937733349392, + "learning_rate": 0.00016212413183989724, + "loss": 0.7333, + "mean_token_accuracy": 0.7797725558280945, + "num_tokens": 64194312.0, + "step": 18870 + }, + { + "epoch": 0.18948974266329438, + "learning_rate": 0.00016210405877393712, + "loss": 0.7632, + "mean_token_accuracy": 0.7734246671199798, + "num_tokens": 64228034.0, + "step": 18880 + }, + { + "epoch": 0.18959010799309486, + "learning_rate": 0.00016208398570797706, + "loss": 0.7897, + "mean_token_accuracy": 0.7694403171539307, + "num_tokens": 64261670.0, + "step": 18890 + }, + { + "epoch": 0.18969047332289535, + "learning_rate": 0.00016206391264201694, + "loss": 0.7826, + "mean_token_accuracy": 0.7667472302913666, + "num_tokens": 64295493.0, + "step": 18900 + }, + { + "epoch": 0.1897908386526958, + "learning_rate": 0.00016204383957605685, + "loss": 0.7472, + "mean_token_accuracy": 0.7765673577785492, + "num_tokens": 64330705.0, + "step": 18910 + }, + { + "epoch": 0.1898912039824963, + "learning_rate": 0.00016202376651009676, + "loss": 0.7754, + "mean_token_accuracy": 0.7735772848129272, + "num_tokens": 64364839.0, + "step": 18920 + }, + { + "epoch": 0.18999156931229677, + "learning_rate": 0.00016200369344413667, + "loss": 0.7468, + "mean_token_accuracy": 0.7750263512134552, + "num_tokens": 64399309.0, + "step": 18930 + }, + { + "epoch": 0.19009193464209723, + "learning_rate": 0.00016198362037817658, + "loss": 0.7468, + "mean_token_accuracy": 0.7775311589241027, + "num_tokens": 64432659.0, + "step": 18940 + }, + { + "epoch": 0.1901922999718977, + "learning_rate": 0.00016196354731221648, + "loss": 0.7947, + "mean_token_accuracy": 0.7694822609424591, + "num_tokens": 64467264.0, + "step": 18950 + }, + { + "epoch": 0.1902926653016982, + "learning_rate": 0.00016194347424625637, + "loss": 0.7435, + "mean_token_accuracy": 0.7792628645896912, + "num_tokens": 64500619.0, + "step": 18960 + }, + { + "epoch": 0.19039303063149865, + "learning_rate": 0.0001619234011802963, + "loss": 0.7609, + "mean_token_accuracy": 0.7780649542808533, + "num_tokens": 64535044.0, + "step": 18970 + }, + { + "epoch": 0.19049339596129913, + "learning_rate": 0.00016190332811433618, + "loss": 0.7588, + "mean_token_accuracy": 0.7738030016422272, + "num_tokens": 64568192.0, + "step": 18980 + }, + { + "epoch": 0.1905937612910996, + "learning_rate": 0.0001618832550483761, + "loss": 0.7508, + "mean_token_accuracy": 0.7778998613357544, + "num_tokens": 64602388.0, + "step": 18990 + }, + { + "epoch": 0.19069412662090007, + "learning_rate": 0.000161863181982416, + "loss": 0.7433, + "mean_token_accuracy": 0.7757618129253387, + "num_tokens": 64636406.0, + "step": 19000 + }, + { + "epoch": 0.19079449195070056, + "learning_rate": 0.0001618431089164559, + "loss": 0.7362, + "mean_token_accuracy": 0.7791922152042389, + "num_tokens": 64670618.0, + "step": 19010 + }, + { + "epoch": 0.190894857280501, + "learning_rate": 0.00016182303585049582, + "loss": 0.757, + "mean_token_accuracy": 0.7783075511455536, + "num_tokens": 64704532.0, + "step": 19020 + }, + { + "epoch": 0.1909952226103015, + "learning_rate": 0.00016180296278453572, + "loss": 0.7496, + "mean_token_accuracy": 0.7750849246978759, + "num_tokens": 64738653.0, + "step": 19030 + }, + { + "epoch": 0.19109558794010198, + "learning_rate": 0.00016178288971857563, + "loss": 0.7583, + "mean_token_accuracy": 0.7745764195919037, + "num_tokens": 64772906.0, + "step": 19040 + }, + { + "epoch": 0.19119595326990244, + "learning_rate": 0.00016176281665261551, + "loss": 0.7985, + "mean_token_accuracy": 0.765564888715744, + "num_tokens": 64806675.0, + "step": 19050 + }, + { + "epoch": 0.19129631859970292, + "learning_rate": 0.00016174274358665545, + "loss": 0.7547, + "mean_token_accuracy": 0.7681283593177796, + "num_tokens": 64840702.0, + "step": 19060 + }, + { + "epoch": 0.1913966839295034, + "learning_rate": 0.00016172267052069533, + "loss": 0.7764, + "mean_token_accuracy": 0.7724027931690216, + "num_tokens": 64874883.0, + "step": 19070 + }, + { + "epoch": 0.19149704925930386, + "learning_rate": 0.00016170259745473524, + "loss": 0.7713, + "mean_token_accuracy": 0.7691495954990387, + "num_tokens": 64909325.0, + "step": 19080 + }, + { + "epoch": 0.19159741458910434, + "learning_rate": 0.00016168252438877515, + "loss": 0.7723, + "mean_token_accuracy": 0.7718911945819855, + "num_tokens": 64943396.0, + "step": 19090 + }, + { + "epoch": 0.19169777991890483, + "learning_rate": 0.00016166245132281506, + "loss": 0.7724, + "mean_token_accuracy": 0.773424506187439, + "num_tokens": 64976834.0, + "step": 19100 + }, + { + "epoch": 0.19179814524870528, + "learning_rate": 0.00016164237825685496, + "loss": 0.7492, + "mean_token_accuracy": 0.7783820271492005, + "num_tokens": 65011251.0, + "step": 19110 + }, + { + "epoch": 0.19189851057850577, + "learning_rate": 0.00016162230519089487, + "loss": 0.7803, + "mean_token_accuracy": 0.7681094467639923, + "num_tokens": 65045076.0, + "step": 19120 + }, + { + "epoch": 0.19199887590830622, + "learning_rate": 0.00016160223212493478, + "loss": 0.7621, + "mean_token_accuracy": 0.7738582372665406, + "num_tokens": 65079194.0, + "step": 19130 + }, + { + "epoch": 0.1920992412381067, + "learning_rate": 0.00016158215905897466, + "loss": 0.7479, + "mean_token_accuracy": 0.7765959143638611, + "num_tokens": 65113027.0, + "step": 19140 + }, + { + "epoch": 0.1921996065679072, + "learning_rate": 0.0001615620859930146, + "loss": 0.7552, + "mean_token_accuracy": 0.7722527205944061, + "num_tokens": 65147200.0, + "step": 19150 + }, + { + "epoch": 0.19229997189770764, + "learning_rate": 0.00016154201292705448, + "loss": 0.7623, + "mean_token_accuracy": 0.7735209167003632, + "num_tokens": 65181510.0, + "step": 19160 + }, + { + "epoch": 0.19240033722750813, + "learning_rate": 0.0001615219398610944, + "loss": 0.7746, + "mean_token_accuracy": 0.7687154591083527, + "num_tokens": 65216910.0, + "step": 19170 + }, + { + "epoch": 0.1925007025573086, + "learning_rate": 0.0001615018667951343, + "loss": 0.7587, + "mean_token_accuracy": 0.7720073342323304, + "num_tokens": 65250578.0, + "step": 19180 + }, + { + "epoch": 0.19260106788710907, + "learning_rate": 0.0001614817937291742, + "loss": 0.788, + "mean_token_accuracy": 0.7646001219749451, + "num_tokens": 65285306.0, + "step": 19190 + }, + { + "epoch": 0.19270143321690955, + "learning_rate": 0.0001614617206632141, + "loss": 0.7715, + "mean_token_accuracy": 0.7696290969848633, + "num_tokens": 65318962.0, + "step": 19200 + }, + { + "epoch": 0.19280179854671003, + "learning_rate": 0.00016144164759725402, + "loss": 0.7646, + "mean_token_accuracy": 0.7771562337875366, + "num_tokens": 65353318.0, + "step": 19210 + }, + { + "epoch": 0.1929021638765105, + "learning_rate": 0.00016142157453129393, + "loss": 0.7875, + "mean_token_accuracy": 0.7628707885742188, + "num_tokens": 65387345.0, + "step": 19220 + }, + { + "epoch": 0.19300252920631097, + "learning_rate": 0.0001614015014653338, + "loss": 0.7945, + "mean_token_accuracy": 0.7688746809959411, + "num_tokens": 65421580.0, + "step": 19230 + }, + { + "epoch": 0.19310289453611146, + "learning_rate": 0.00016138142839937375, + "loss": 0.7782, + "mean_token_accuracy": 0.7717042803764343, + "num_tokens": 65455984.0, + "step": 19240 + }, + { + "epoch": 0.1932032598659119, + "learning_rate": 0.00016136135533341363, + "loss": 0.7943, + "mean_token_accuracy": 0.759830641746521, + "num_tokens": 65490077.0, + "step": 19250 + }, + { + "epoch": 0.1933036251957124, + "learning_rate": 0.00016134128226745354, + "loss": 0.7432, + "mean_token_accuracy": 0.7727313756942749, + "num_tokens": 65524484.0, + "step": 19260 + }, + { + "epoch": 0.19340399052551285, + "learning_rate": 0.00016132120920149345, + "loss": 0.7773, + "mean_token_accuracy": 0.7688717007637024, + "num_tokens": 65558779.0, + "step": 19270 + }, + { + "epoch": 0.19350435585531334, + "learning_rate": 0.00016130113613553335, + "loss": 0.7565, + "mean_token_accuracy": 0.7738625407218933, + "num_tokens": 65593308.0, + "step": 19280 + }, + { + "epoch": 0.19360472118511382, + "learning_rate": 0.00016128106306957324, + "loss": 0.7559, + "mean_token_accuracy": 0.7738423943519592, + "num_tokens": 65627835.0, + "step": 19290 + }, + { + "epoch": 0.19370508651491428, + "learning_rate": 0.00016126099000361317, + "loss": 0.8207, + "mean_token_accuracy": 0.7625119268894196, + "num_tokens": 65661353.0, + "step": 19300 + }, + { + "epoch": 0.19380545184471476, + "learning_rate": 0.00016124091693765305, + "loss": 0.7023, + "mean_token_accuracy": 0.7863344430923462, + "num_tokens": 65696158.0, + "step": 19310 + }, + { + "epoch": 0.19390581717451524, + "learning_rate": 0.00016122084387169296, + "loss": 0.7513, + "mean_token_accuracy": 0.776838755607605, + "num_tokens": 65730366.0, + "step": 19320 + }, + { + "epoch": 0.1940061825043157, + "learning_rate": 0.00016120077080573287, + "loss": 0.7921, + "mean_token_accuracy": 0.7652410626411438, + "num_tokens": 65764302.0, + "step": 19330 + }, + { + "epoch": 0.19410654783411618, + "learning_rate": 0.00016118069773977278, + "loss": 0.7633, + "mean_token_accuracy": 0.7726734757423401, + "num_tokens": 65798873.0, + "step": 19340 + }, + { + "epoch": 0.19420691316391667, + "learning_rate": 0.00016116062467381269, + "loss": 0.8107, + "mean_token_accuracy": 0.7613295316696167, + "num_tokens": 65833515.0, + "step": 19350 + }, + { + "epoch": 0.19430727849371712, + "learning_rate": 0.0001611405516078526, + "loss": 0.7282, + "mean_token_accuracy": 0.78021360039711, + "num_tokens": 65868430.0, + "step": 19360 + }, + { + "epoch": 0.1944076438235176, + "learning_rate": 0.0001611204785418925, + "loss": 0.7643, + "mean_token_accuracy": 0.773417180776596, + "num_tokens": 65902908.0, + "step": 19370 + }, + { + "epoch": 0.1945080091533181, + "learning_rate": 0.00016110040547593238, + "loss": 0.764, + "mean_token_accuracy": 0.7677555322647095, + "num_tokens": 65937131.0, + "step": 19380 + }, + { + "epoch": 0.19460837448311855, + "learning_rate": 0.00016108033240997232, + "loss": 0.7787, + "mean_token_accuracy": 0.7665543496608734, + "num_tokens": 65971478.0, + "step": 19390 + }, + { + "epoch": 0.19470873981291903, + "learning_rate": 0.0001610602593440122, + "loss": 0.7957, + "mean_token_accuracy": 0.7618605971336365, + "num_tokens": 66006556.0, + "step": 19400 + }, + { + "epoch": 0.19480910514271949, + "learning_rate": 0.0001610401862780521, + "loss": 0.7613, + "mean_token_accuracy": 0.7710905432701111, + "num_tokens": 66041114.0, + "step": 19410 + }, + { + "epoch": 0.19490947047251997, + "learning_rate": 0.00016102011321209202, + "loss": 0.802, + "mean_token_accuracy": 0.7617272436618805, + "num_tokens": 66075592.0, + "step": 19420 + }, + { + "epoch": 0.19500983580232045, + "learning_rate": 0.00016100004014613193, + "loss": 0.7734, + "mean_token_accuracy": 0.7753029108047486, + "num_tokens": 66110273.0, + "step": 19430 + }, + { + "epoch": 0.1951102011321209, + "learning_rate": 0.00016097996708017183, + "loss": 0.7799, + "mean_token_accuracy": 0.7730140388011932, + "num_tokens": 66144736.0, + "step": 19440 + }, + { + "epoch": 0.1952105664619214, + "learning_rate": 0.00016095989401421174, + "loss": 0.8066, + "mean_token_accuracy": 0.7628728866577148, + "num_tokens": 66178161.0, + "step": 19450 + }, + { + "epoch": 0.19531093179172188, + "learning_rate": 0.00016093982094825165, + "loss": 0.7576, + "mean_token_accuracy": 0.7740750789642334, + "num_tokens": 66212869.0, + "step": 19460 + }, + { + "epoch": 0.19541129712152233, + "learning_rate": 0.00016091974788229153, + "loss": 0.7671, + "mean_token_accuracy": 0.7667285203933716, + "num_tokens": 66246749.0, + "step": 19470 + }, + { + "epoch": 0.19551166245132282, + "learning_rate": 0.00016089967481633147, + "loss": 0.7931, + "mean_token_accuracy": 0.7644418716430664, + "num_tokens": 66281090.0, + "step": 19480 + }, + { + "epoch": 0.1956120277811233, + "learning_rate": 0.00016087960175037135, + "loss": 0.7689, + "mean_token_accuracy": 0.7702011048793793, + "num_tokens": 66314725.0, + "step": 19490 + }, + { + "epoch": 0.19571239311092375, + "learning_rate": 0.00016085952868441126, + "loss": 0.7489, + "mean_token_accuracy": 0.7723415434360504, + "num_tokens": 66348900.0, + "step": 19500 + }, + { + "epoch": 0.19581275844072424, + "learning_rate": 0.00016083945561845117, + "loss": 0.7949, + "mean_token_accuracy": 0.764240151643753, + "num_tokens": 66384488.0, + "step": 19510 + }, + { + "epoch": 0.19591312377052472, + "learning_rate": 0.00016081938255249107, + "loss": 0.755, + "mean_token_accuracy": 0.7781309485435486, + "num_tokens": 66417923.0, + "step": 19520 + }, + { + "epoch": 0.19601348910032518, + "learning_rate": 0.00016079930948653098, + "loss": 0.7758, + "mean_token_accuracy": 0.7700519561767578, + "num_tokens": 66451905.0, + "step": 19530 + }, + { + "epoch": 0.19611385443012566, + "learning_rate": 0.0001607792364205709, + "loss": 0.7327, + "mean_token_accuracy": 0.779544734954834, + "num_tokens": 66486623.0, + "step": 19540 + }, + { + "epoch": 0.19621421975992612, + "learning_rate": 0.0001607591633546108, + "loss": 0.8051, + "mean_token_accuracy": 0.7675462424755096, + "num_tokens": 66520599.0, + "step": 19550 + }, + { + "epoch": 0.1963145850897266, + "learning_rate": 0.0001607390902886507, + "loss": 0.7556, + "mean_token_accuracy": 0.7777894735336304, + "num_tokens": 66554324.0, + "step": 19560 + }, + { + "epoch": 0.19641495041952708, + "learning_rate": 0.00016071901722269062, + "loss": 0.8006, + "mean_token_accuracy": 0.7677490472793579, + "num_tokens": 66588213.0, + "step": 19570 + }, + { + "epoch": 0.19651531574932754, + "learning_rate": 0.0001606989441567305, + "loss": 0.7556, + "mean_token_accuracy": 0.7706791758537292, + "num_tokens": 66622343.0, + "step": 19580 + }, + { + "epoch": 0.19661568107912802, + "learning_rate": 0.00016067887109077043, + "loss": 0.7861, + "mean_token_accuracy": 0.7715229392051697, + "num_tokens": 66656268.0, + "step": 19590 + }, + { + "epoch": 0.1967160464089285, + "learning_rate": 0.00016065879802481032, + "loss": 0.7393, + "mean_token_accuracy": 0.775808721780777, + "num_tokens": 66690563.0, + "step": 19600 + }, + { + "epoch": 0.19681641173872896, + "learning_rate": 0.00016063872495885022, + "loss": 0.7681, + "mean_token_accuracy": 0.7682813704013824, + "num_tokens": 66724181.0, + "step": 19610 + }, + { + "epoch": 0.19691677706852945, + "learning_rate": 0.00016061865189289013, + "loss": 0.7803, + "mean_token_accuracy": 0.7706619620323181, + "num_tokens": 66758485.0, + "step": 19620 + }, + { + "epoch": 0.19701714239832993, + "learning_rate": 0.00016059857882693004, + "loss": 0.7465, + "mean_token_accuracy": 0.7719769418239594, + "num_tokens": 66792463.0, + "step": 19630 + }, + { + "epoch": 0.1971175077281304, + "learning_rate": 0.00016057850576096992, + "loss": 0.7843, + "mean_token_accuracy": 0.7723612189292908, + "num_tokens": 66827091.0, + "step": 19640 + }, + { + "epoch": 0.19721787305793087, + "learning_rate": 0.00016055843269500986, + "loss": 0.7754, + "mean_token_accuracy": 0.768305379152298, + "num_tokens": 66861157.0, + "step": 19650 + }, + { + "epoch": 0.19731823838773135, + "learning_rate": 0.00016053835962904974, + "loss": 0.7689, + "mean_token_accuracy": 0.773998099565506, + "num_tokens": 66895205.0, + "step": 19660 + }, + { + "epoch": 0.1974186037175318, + "learning_rate": 0.00016051828656308965, + "loss": 0.8079, + "mean_token_accuracy": 0.7620140492916108, + "num_tokens": 66928321.0, + "step": 19670 + }, + { + "epoch": 0.1975189690473323, + "learning_rate": 0.00016049821349712956, + "loss": 0.7579, + "mean_token_accuracy": 0.7748634397983551, + "num_tokens": 66962433.0, + "step": 19680 + }, + { + "epoch": 0.19761933437713278, + "learning_rate": 0.00016047814043116946, + "loss": 0.7832, + "mean_token_accuracy": 0.7628565311431885, + "num_tokens": 66996228.0, + "step": 19690 + }, + { + "epoch": 0.19771969970693323, + "learning_rate": 0.00016045806736520937, + "loss": 0.7924, + "mean_token_accuracy": 0.7635167181491852, + "num_tokens": 67030281.0, + "step": 19700 + }, + { + "epoch": 0.19782006503673372, + "learning_rate": 0.00016043799429924928, + "loss": 0.7802, + "mean_token_accuracy": 0.7688194334506988, + "num_tokens": 67063354.0, + "step": 19710 + }, + { + "epoch": 0.19792043036653417, + "learning_rate": 0.0001604179212332892, + "loss": 0.7444, + "mean_token_accuracy": 0.7749076604843139, + "num_tokens": 67098215.0, + "step": 19720 + }, + { + "epoch": 0.19802079569633466, + "learning_rate": 0.00016039784816732907, + "loss": 0.7757, + "mean_token_accuracy": 0.7693403422832489, + "num_tokens": 67132673.0, + "step": 19730 + }, + { + "epoch": 0.19812116102613514, + "learning_rate": 0.000160377775101369, + "loss": 0.7756, + "mean_token_accuracy": 0.7703332483768464, + "num_tokens": 67166083.0, + "step": 19740 + }, + { + "epoch": 0.1982215263559356, + "learning_rate": 0.0001603577020354089, + "loss": 0.7883, + "mean_token_accuracy": 0.7647324919700622, + "num_tokens": 67199412.0, + "step": 19750 + }, + { + "epoch": 0.19832189168573608, + "learning_rate": 0.0001603376289694488, + "loss": 0.8099, + "mean_token_accuracy": 0.7631685435771942, + "num_tokens": 67234387.0, + "step": 19760 + }, + { + "epoch": 0.19842225701553656, + "learning_rate": 0.0001603175559034887, + "loss": 0.8004, + "mean_token_accuracy": 0.7648675858974456, + "num_tokens": 67268247.0, + "step": 19770 + }, + { + "epoch": 0.19852262234533702, + "learning_rate": 0.0001602974828375286, + "loss": 0.7787, + "mean_token_accuracy": 0.7660826325416565, + "num_tokens": 67301830.0, + "step": 19780 + }, + { + "epoch": 0.1986229876751375, + "learning_rate": 0.00016027740977156852, + "loss": 0.7433, + "mean_token_accuracy": 0.7775061130523682, + "num_tokens": 67336474.0, + "step": 19790 + }, + { + "epoch": 0.19872335300493799, + "learning_rate": 0.00016025733670560843, + "loss": 0.7207, + "mean_token_accuracy": 0.7795002400875092, + "num_tokens": 67369765.0, + "step": 19800 + }, + { + "epoch": 0.19882371833473844, + "learning_rate": 0.00016023726363964834, + "loss": 0.7399, + "mean_token_accuracy": 0.7733273029327392, + "num_tokens": 67404040.0, + "step": 19810 + }, + { + "epoch": 0.19892408366453893, + "learning_rate": 0.00016021719057368822, + "loss": 0.7694, + "mean_token_accuracy": 0.7676566243171692, + "num_tokens": 67438489.0, + "step": 19820 + }, + { + "epoch": 0.1990244489943394, + "learning_rate": 0.00016019711750772816, + "loss": 0.7759, + "mean_token_accuracy": 0.7730227828025817, + "num_tokens": 67472735.0, + "step": 19830 + }, + { + "epoch": 0.19912481432413986, + "learning_rate": 0.00016017704444176804, + "loss": 0.7815, + "mean_token_accuracy": 0.7656783998012543, + "num_tokens": 67506887.0, + "step": 19840 + }, + { + "epoch": 0.19922517965394035, + "learning_rate": 0.00016015697137580794, + "loss": 0.7802, + "mean_token_accuracy": 0.7670118987560273, + "num_tokens": 67540833.0, + "step": 19850 + }, + { + "epoch": 0.1993255449837408, + "learning_rate": 0.00016013689830984785, + "loss": 0.7698, + "mean_token_accuracy": 0.7682573080062867, + "num_tokens": 67575295.0, + "step": 19860 + }, + { + "epoch": 0.1994259103135413, + "learning_rate": 0.00016011682524388776, + "loss": 0.7702, + "mean_token_accuracy": 0.7683188498020173, + "num_tokens": 67610099.0, + "step": 19870 + }, + { + "epoch": 0.19952627564334177, + "learning_rate": 0.00016009675217792764, + "loss": 0.761, + "mean_token_accuracy": 0.7709443926811218, + "num_tokens": 67644359.0, + "step": 19880 + }, + { + "epoch": 0.19962664097314223, + "learning_rate": 0.00016007667911196758, + "loss": 0.7494, + "mean_token_accuracy": 0.7775312781333923, + "num_tokens": 67678947.0, + "step": 19890 + }, + { + "epoch": 0.1997270063029427, + "learning_rate": 0.00016005660604600746, + "loss": 0.7914, + "mean_token_accuracy": 0.7651115536689759, + "num_tokens": 67714030.0, + "step": 19900 + }, + { + "epoch": 0.1998273716327432, + "learning_rate": 0.00016003653298004737, + "loss": 0.7577, + "mean_token_accuracy": 0.7703204929828644, + "num_tokens": 67749045.0, + "step": 19910 + }, + { + "epoch": 0.19992773696254365, + "learning_rate": 0.0001600164599140873, + "loss": 0.739, + "mean_token_accuracy": 0.7767483949661255, + "num_tokens": 67782181.0, + "step": 19920 + }, + { + "epoch": 0.20002810229234413, + "learning_rate": 0.00015999638684812719, + "loss": 0.767, + "mean_token_accuracy": 0.7694602489471436, + "num_tokens": 67816160.0, + "step": 19930 + }, + { + "epoch": 0.20012846762214462, + "learning_rate": 0.0001599763137821671, + "loss": 0.7796, + "mean_token_accuracy": 0.7599666953086853, + "num_tokens": 67850447.0, + "step": 19940 + }, + { + "epoch": 0.20022883295194507, + "learning_rate": 0.000159956240716207, + "loss": 0.7669, + "mean_token_accuracy": 0.7668049991130829, + "num_tokens": 67883705.0, + "step": 19950 + }, + { + "epoch": 0.20032919828174556, + "learning_rate": 0.0001599361676502469, + "loss": 0.7527, + "mean_token_accuracy": 0.7709909677505493, + "num_tokens": 67917374.0, + "step": 19960 + }, + { + "epoch": 0.20042956361154604, + "learning_rate": 0.0001599160945842868, + "loss": 0.7614, + "mean_token_accuracy": 0.7740794658660889, + "num_tokens": 67951524.0, + "step": 19970 + }, + { + "epoch": 0.2005299289413465, + "learning_rate": 0.00015989602151832673, + "loss": 0.7665, + "mean_token_accuracy": 0.7670549333095551, + "num_tokens": 67985802.0, + "step": 19980 + }, + { + "epoch": 0.20063029427114698, + "learning_rate": 0.0001598759484523666, + "loss": 0.7429, + "mean_token_accuracy": 0.7795494019985199, + "num_tokens": 68019235.0, + "step": 19990 + }, + { + "epoch": 0.20073065960094744, + "learning_rate": 0.00015985587538640652, + "loss": 0.757, + "mean_token_accuracy": 0.7741480469703674, + "num_tokens": 68052749.0, + "step": 20000 + }, + { + "epoch": 0.20083102493074792, + "learning_rate": 0.00015983580232044643, + "loss": 0.7728, + "mean_token_accuracy": 0.7676588833332062, + "num_tokens": 68087359.0, + "step": 20010 + }, + { + "epoch": 0.2009313902605484, + "learning_rate": 0.00015981572925448633, + "loss": 0.7994, + "mean_token_accuracy": 0.7637075424194336, + "num_tokens": 68121983.0, + "step": 20020 + }, + { + "epoch": 0.20103175559034886, + "learning_rate": 0.00015979565618852624, + "loss": 0.7415, + "mean_token_accuracy": 0.7765156745910644, + "num_tokens": 68156097.0, + "step": 20030 + }, + { + "epoch": 0.20113212092014934, + "learning_rate": 0.00015977558312256615, + "loss": 0.7706, + "mean_token_accuracy": 0.7695318102836609, + "num_tokens": 68190128.0, + "step": 20040 + }, + { + "epoch": 0.20123248624994983, + "learning_rate": 0.00015975551005660606, + "loss": 0.7692, + "mean_token_accuracy": 0.7701895475387573, + "num_tokens": 68222825.0, + "step": 20050 + }, + { + "epoch": 0.20133285157975028, + "learning_rate": 0.00015973543699064594, + "loss": 0.7545, + "mean_token_accuracy": 0.7765472412109375, + "num_tokens": 68256662.0, + "step": 20060 + }, + { + "epoch": 0.20143321690955077, + "learning_rate": 0.00015971536392468588, + "loss": 0.7519, + "mean_token_accuracy": 0.7768332183361053, + "num_tokens": 68290858.0, + "step": 20070 + }, + { + "epoch": 0.20153358223935125, + "learning_rate": 0.00015969529085872576, + "loss": 0.79, + "mean_token_accuracy": 0.7622937262058258, + "num_tokens": 68324739.0, + "step": 20080 + }, + { + "epoch": 0.2016339475691517, + "learning_rate": 0.0001596752177927657, + "loss": 0.7529, + "mean_token_accuracy": 0.775265508890152, + "num_tokens": 68359074.0, + "step": 20090 + }, + { + "epoch": 0.2017343128989522, + "learning_rate": 0.00015965514472680557, + "loss": 0.7679, + "mean_token_accuracy": 0.769006222486496, + "num_tokens": 68393197.0, + "step": 20100 + }, + { + "epoch": 0.20183467822875267, + "learning_rate": 0.00015963507166084548, + "loss": 0.7573, + "mean_token_accuracy": 0.7712887763977051, + "num_tokens": 68427457.0, + "step": 20110 + }, + { + "epoch": 0.20193504355855313, + "learning_rate": 0.0001596149985948854, + "loss": 0.7592, + "mean_token_accuracy": 0.7706013262271881, + "num_tokens": 68462288.0, + "step": 20120 + }, + { + "epoch": 0.2020354088883536, + "learning_rate": 0.0001595949255289253, + "loss": 0.7678, + "mean_token_accuracy": 0.7678113400936126, + "num_tokens": 68496126.0, + "step": 20130 + }, + { + "epoch": 0.20213577421815407, + "learning_rate": 0.0001595748524629652, + "loss": 0.784, + "mean_token_accuracy": 0.7700542449951172, + "num_tokens": 68530714.0, + "step": 20140 + }, + { + "epoch": 0.20223613954795455, + "learning_rate": 0.00015955477939700512, + "loss": 0.7465, + "mean_token_accuracy": 0.7755346357822418, + "num_tokens": 68565073.0, + "step": 20150 + }, + { + "epoch": 0.20233650487775504, + "learning_rate": 0.00015953470633104503, + "loss": 0.7371, + "mean_token_accuracy": 0.779209417104721, + "num_tokens": 68598624.0, + "step": 20160 + }, + { + "epoch": 0.2024368702075555, + "learning_rate": 0.0001595146332650849, + "loss": 0.7631, + "mean_token_accuracy": 0.7787334799766541, + "num_tokens": 68632613.0, + "step": 20170 + }, + { + "epoch": 0.20253723553735598, + "learning_rate": 0.00015949456019912484, + "loss": 0.7452, + "mean_token_accuracy": 0.7790575742721557, + "num_tokens": 68666550.0, + "step": 20180 + }, + { + "epoch": 0.20263760086715646, + "learning_rate": 0.00015947448713316472, + "loss": 0.7786, + "mean_token_accuracy": 0.7660065054893493, + "num_tokens": 68700364.0, + "step": 20190 + }, + { + "epoch": 0.20273796619695691, + "learning_rate": 0.00015945441406720463, + "loss": 0.7645, + "mean_token_accuracy": 0.7723218679428101, + "num_tokens": 68734109.0, + "step": 20200 + }, + { + "epoch": 0.2028383315267574, + "learning_rate": 0.00015943434100124454, + "loss": 0.7609, + "mean_token_accuracy": 0.7738436937332154, + "num_tokens": 68768553.0, + "step": 20210 + }, + { + "epoch": 0.20293869685655788, + "learning_rate": 0.00015941426793528445, + "loss": 0.7487, + "mean_token_accuracy": 0.7739782512187958, + "num_tokens": 68802618.0, + "step": 20220 + }, + { + "epoch": 0.20303906218635834, + "learning_rate": 0.00015939419486932433, + "loss": 0.7602, + "mean_token_accuracy": 0.7701372802257538, + "num_tokens": 68837329.0, + "step": 20230 + }, + { + "epoch": 0.20313942751615882, + "learning_rate": 0.00015937412180336427, + "loss": 0.7383, + "mean_token_accuracy": 0.7742105484008789, + "num_tokens": 68870823.0, + "step": 20240 + }, + { + "epoch": 0.2032397928459593, + "learning_rate": 0.00015935404873740415, + "loss": 0.7785, + "mean_token_accuracy": 0.7661495864391327, + "num_tokens": 68905264.0, + "step": 20250 + }, + { + "epoch": 0.20334015817575976, + "learning_rate": 0.00015933397567144406, + "loss": 0.7729, + "mean_token_accuracy": 0.7653391361236572, + "num_tokens": 68939106.0, + "step": 20260 + }, + { + "epoch": 0.20344052350556024, + "learning_rate": 0.000159313902605484, + "loss": 0.8013, + "mean_token_accuracy": 0.7635286152362823, + "num_tokens": 68973161.0, + "step": 20270 + }, + { + "epoch": 0.2035408888353607, + "learning_rate": 0.00015929382953952387, + "loss": 0.7626, + "mean_token_accuracy": 0.7765633702278137, + "num_tokens": 69008120.0, + "step": 20280 + }, + { + "epoch": 0.20364125416516118, + "learning_rate": 0.00015927375647356378, + "loss": 0.7635, + "mean_token_accuracy": 0.7679502248764039, + "num_tokens": 69041517.0, + "step": 20290 + }, + { + "epoch": 0.20374161949496167, + "learning_rate": 0.0001592536834076037, + "loss": 0.7791, + "mean_token_accuracy": 0.7693223118782043, + "num_tokens": 69075388.0, + "step": 20300 + }, + { + "epoch": 0.20384198482476212, + "learning_rate": 0.0001592336103416436, + "loss": 0.7792, + "mean_token_accuracy": 0.7693504750728607, + "num_tokens": 69109863.0, + "step": 20310 + }, + { + "epoch": 0.2039423501545626, + "learning_rate": 0.00015921353727568348, + "loss": 0.7868, + "mean_token_accuracy": 0.7634381890296936, + "num_tokens": 69144241.0, + "step": 20320 + }, + { + "epoch": 0.2040427154843631, + "learning_rate": 0.00015919346420972341, + "loss": 0.7538, + "mean_token_accuracy": 0.7786667466163635, + "num_tokens": 69178931.0, + "step": 20330 + }, + { + "epoch": 0.20414308081416355, + "learning_rate": 0.0001591733911437633, + "loss": 0.7668, + "mean_token_accuracy": 0.7745855212211609, + "num_tokens": 69212797.0, + "step": 20340 + }, + { + "epoch": 0.20424344614396403, + "learning_rate": 0.0001591533180778032, + "loss": 0.7896, + "mean_token_accuracy": 0.7649648904800415, + "num_tokens": 69245945.0, + "step": 20350 + }, + { + "epoch": 0.20434381147376451, + "learning_rate": 0.0001591332450118431, + "loss": 0.7594, + "mean_token_accuracy": 0.7718109905719757, + "num_tokens": 69279613.0, + "step": 20360 + }, + { + "epoch": 0.20444417680356497, + "learning_rate": 0.00015911317194588302, + "loss": 0.7308, + "mean_token_accuracy": 0.7783885061740875, + "num_tokens": 69313556.0, + "step": 20370 + }, + { + "epoch": 0.20454454213336545, + "learning_rate": 0.00015909309887992293, + "loss": 0.7609, + "mean_token_accuracy": 0.7700179278850555, + "num_tokens": 69347036.0, + "step": 20380 + }, + { + "epoch": 0.20464490746316594, + "learning_rate": 0.00015907302581396284, + "loss": 0.7425, + "mean_token_accuracy": 0.7761937737464905, + "num_tokens": 69381310.0, + "step": 20390 + }, + { + "epoch": 0.2047452727929664, + "learning_rate": 0.00015905295274800275, + "loss": 0.7714, + "mean_token_accuracy": 0.7757660686969757, + "num_tokens": 69415250.0, + "step": 20400 + }, + { + "epoch": 0.20484563812276688, + "learning_rate": 0.00015903287968204263, + "loss": 0.7726, + "mean_token_accuracy": 0.7738589107990265, + "num_tokens": 69449151.0, + "step": 20410 + }, + { + "epoch": 0.20494600345256733, + "learning_rate": 0.00015901280661608256, + "loss": 0.7692, + "mean_token_accuracy": 0.7708847939968109, + "num_tokens": 69484146.0, + "step": 20420 + }, + { + "epoch": 0.20504636878236782, + "learning_rate": 0.00015899273355012244, + "loss": 0.7575, + "mean_token_accuracy": 0.7732176184654236, + "num_tokens": 69518455.0, + "step": 20430 + }, + { + "epoch": 0.2051467341121683, + "learning_rate": 0.00015897266048416235, + "loss": 0.741, + "mean_token_accuracy": 0.7802337765693664, + "num_tokens": 69552681.0, + "step": 20440 + }, + { + "epoch": 0.20524709944196876, + "learning_rate": 0.00015895258741820226, + "loss": 0.7632, + "mean_token_accuracy": 0.7741704881191254, + "num_tokens": 69585877.0, + "step": 20450 + }, + { + "epoch": 0.20534746477176924, + "learning_rate": 0.00015893251435224217, + "loss": 0.7792, + "mean_token_accuracy": 0.7710673213005066, + "num_tokens": 69620188.0, + "step": 20460 + }, + { + "epoch": 0.20544783010156972, + "learning_rate": 0.00015891244128628208, + "loss": 0.7827, + "mean_token_accuracy": 0.7680623292922973, + "num_tokens": 69655389.0, + "step": 20470 + }, + { + "epoch": 0.20554819543137018, + "learning_rate": 0.000158892368220322, + "loss": 0.7646, + "mean_token_accuracy": 0.7719215154647827, + "num_tokens": 69688903.0, + "step": 20480 + }, + { + "epoch": 0.20564856076117066, + "learning_rate": 0.0001588722951543619, + "loss": 0.785, + "mean_token_accuracy": 0.7672102153301239, + "num_tokens": 69723016.0, + "step": 20490 + }, + { + "epoch": 0.20574892609097115, + "learning_rate": 0.00015885222208840178, + "loss": 0.7832, + "mean_token_accuracy": 0.7706070244312286, + "num_tokens": 69757382.0, + "step": 20500 + }, + { + "epoch": 0.2058492914207716, + "learning_rate": 0.0001588321490224417, + "loss": 0.7616, + "mean_token_accuracy": 0.7733456909656524, + "num_tokens": 69791715.0, + "step": 20510 + }, + { + "epoch": 0.20594965675057209, + "learning_rate": 0.0001588120759564816, + "loss": 0.7583, + "mean_token_accuracy": 0.7724246740341186, + "num_tokens": 69826059.0, + "step": 20520 + }, + { + "epoch": 0.20605002208037257, + "learning_rate": 0.0001587920028905215, + "loss": 0.7458, + "mean_token_accuracy": 0.7753987908363342, + "num_tokens": 69860872.0, + "step": 20530 + }, + { + "epoch": 0.20615038741017302, + "learning_rate": 0.0001587719298245614, + "loss": 0.7804, + "mean_token_accuracy": 0.7636359870433808, + "num_tokens": 69895328.0, + "step": 20540 + }, + { + "epoch": 0.2062507527399735, + "learning_rate": 0.00015875185675860132, + "loss": 0.8072, + "mean_token_accuracy": 0.767308634519577, + "num_tokens": 69929541.0, + "step": 20550 + }, + { + "epoch": 0.20635111806977396, + "learning_rate": 0.0001587317836926412, + "loss": 0.7573, + "mean_token_accuracy": 0.7705384433269501, + "num_tokens": 69962917.0, + "step": 20560 + }, + { + "epoch": 0.20645148339957445, + "learning_rate": 0.00015871171062668114, + "loss": 0.7707, + "mean_token_accuracy": 0.7707615435123444, + "num_tokens": 69996444.0, + "step": 20570 + }, + { + "epoch": 0.20655184872937493, + "learning_rate": 0.00015869163756072102, + "loss": 0.7804, + "mean_token_accuracy": 0.7686228096485138, + "num_tokens": 70030414.0, + "step": 20580 + }, + { + "epoch": 0.2066522140591754, + "learning_rate": 0.00015867156449476093, + "loss": 0.7433, + "mean_token_accuracy": 0.7765547573566437, + "num_tokens": 70065297.0, + "step": 20590 + }, + { + "epoch": 0.20675257938897587, + "learning_rate": 0.00015865149142880083, + "loss": 0.7711, + "mean_token_accuracy": 0.7739952743053437, + "num_tokens": 70099550.0, + "step": 20600 + }, + { + "epoch": 0.20685294471877635, + "learning_rate": 0.00015863141836284074, + "loss": 0.7765, + "mean_token_accuracy": 0.7641831517219544, + "num_tokens": 70133719.0, + "step": 20610 + }, + { + "epoch": 0.2069533100485768, + "learning_rate": 0.00015861134529688065, + "loss": 0.7923, + "mean_token_accuracy": 0.7672351777553559, + "num_tokens": 70167631.0, + "step": 20620 + }, + { + "epoch": 0.2070536753783773, + "learning_rate": 0.00015859127223092056, + "loss": 0.7472, + "mean_token_accuracy": 0.7753488838672637, + "num_tokens": 70202415.0, + "step": 20630 + }, + { + "epoch": 0.20715404070817778, + "learning_rate": 0.00015857119916496047, + "loss": 0.767, + "mean_token_accuracy": 0.7673940360546112, + "num_tokens": 70236336.0, + "step": 20640 + }, + { + "epoch": 0.20725440603797823, + "learning_rate": 0.00015855112609900038, + "loss": 0.7756, + "mean_token_accuracy": 0.7706686735153199, + "num_tokens": 70269739.0, + "step": 20650 + }, + { + "epoch": 0.20735477136777872, + "learning_rate": 0.00015853105303304028, + "loss": 0.7129, + "mean_token_accuracy": 0.7834236145019531, + "num_tokens": 70303515.0, + "step": 20660 + }, + { + "epoch": 0.2074551366975792, + "learning_rate": 0.00015851097996708017, + "loss": 0.7369, + "mean_token_accuracy": 0.7737632632255554, + "num_tokens": 70336878.0, + "step": 20670 + }, + { + "epoch": 0.20755550202737966, + "learning_rate": 0.0001584909069011201, + "loss": 0.7726, + "mean_token_accuracy": 0.7719765722751617, + "num_tokens": 70370896.0, + "step": 20680 + }, + { + "epoch": 0.20765586735718014, + "learning_rate": 0.00015847083383515998, + "loss": 0.7577, + "mean_token_accuracy": 0.7750647962093353, + "num_tokens": 70404729.0, + "step": 20690 + }, + { + "epoch": 0.2077562326869806, + "learning_rate": 0.0001584507607691999, + "loss": 0.7725, + "mean_token_accuracy": 0.7715784668922424, + "num_tokens": 70439114.0, + "step": 20700 + }, + { + "epoch": 0.20785659801678108, + "learning_rate": 0.0001584306877032398, + "loss": 0.7464, + "mean_token_accuracy": 0.7785567104816437, + "num_tokens": 70472634.0, + "step": 20710 + }, + { + "epoch": 0.20795696334658156, + "learning_rate": 0.0001584106146372797, + "loss": 0.7742, + "mean_token_accuracy": 0.7646165311336517, + "num_tokens": 70506601.0, + "step": 20720 + }, + { + "epoch": 0.20805732867638202, + "learning_rate": 0.00015839054157131962, + "loss": 0.8001, + "mean_token_accuracy": 0.7662071764469147, + "num_tokens": 70540508.0, + "step": 20730 + }, + { + "epoch": 0.2081576940061825, + "learning_rate": 0.00015837046850535952, + "loss": 0.789, + "mean_token_accuracy": 0.7709681332111359, + "num_tokens": 70575172.0, + "step": 20740 + }, + { + "epoch": 0.208258059335983, + "learning_rate": 0.00015835039543939943, + "loss": 0.7394, + "mean_token_accuracy": 0.7774100303649902, + "num_tokens": 70609049.0, + "step": 20750 + }, + { + "epoch": 0.20835842466578344, + "learning_rate": 0.00015833032237343931, + "loss": 0.7373, + "mean_token_accuracy": 0.7811862468719483, + "num_tokens": 70643102.0, + "step": 20760 + }, + { + "epoch": 0.20845878999558393, + "learning_rate": 0.00015831024930747925, + "loss": 0.7404, + "mean_token_accuracy": 0.7779871642589569, + "num_tokens": 70676816.0, + "step": 20770 + }, + { + "epoch": 0.2085591553253844, + "learning_rate": 0.00015829017624151913, + "loss": 0.7756, + "mean_token_accuracy": 0.7701539635658264, + "num_tokens": 70711046.0, + "step": 20780 + }, + { + "epoch": 0.20865952065518487, + "learning_rate": 0.00015827010317555904, + "loss": 0.7852, + "mean_token_accuracy": 0.764276772737503, + "num_tokens": 70744074.0, + "step": 20790 + }, + { + "epoch": 0.20875988598498535, + "learning_rate": 0.00015825003010959895, + "loss": 0.8007, + "mean_token_accuracy": 0.7678519129753113, + "num_tokens": 70777768.0, + "step": 20800 + }, + { + "epoch": 0.20886025131478583, + "learning_rate": 0.00015822995704363886, + "loss": 0.7754, + "mean_token_accuracy": 0.7766441702842712, + "num_tokens": 70810973.0, + "step": 20810 + }, + { + "epoch": 0.2089606166445863, + "learning_rate": 0.00015820988397767876, + "loss": 0.7906, + "mean_token_accuracy": 0.7657183766365051, + "num_tokens": 70844540.0, + "step": 20820 + }, + { + "epoch": 0.20906098197438677, + "learning_rate": 0.00015818981091171867, + "loss": 0.7371, + "mean_token_accuracy": 0.777416217327118, + "num_tokens": 70878634.0, + "step": 20830 + }, + { + "epoch": 0.20916134730418723, + "learning_rate": 0.00015816973784575858, + "loss": 0.7398, + "mean_token_accuracy": 0.7815571427345276, + "num_tokens": 70912370.0, + "step": 20840 + }, + { + "epoch": 0.2092617126339877, + "learning_rate": 0.00015814966477979846, + "loss": 0.7539, + "mean_token_accuracy": 0.7748958528041839, + "num_tokens": 70945512.0, + "step": 20850 + }, + { + "epoch": 0.2093620779637882, + "learning_rate": 0.0001581295917138384, + "loss": 0.7776, + "mean_token_accuracy": 0.7678313195705414, + "num_tokens": 70979404.0, + "step": 20860 + }, + { + "epoch": 0.20946244329358865, + "learning_rate": 0.00015810951864787828, + "loss": 0.7774, + "mean_token_accuracy": 0.7691116333007812, + "num_tokens": 71013184.0, + "step": 20870 + }, + { + "epoch": 0.20956280862338914, + "learning_rate": 0.0001580894455819182, + "loss": 0.7721, + "mean_token_accuracy": 0.7686834394931793, + "num_tokens": 71046758.0, + "step": 20880 + }, + { + "epoch": 0.20966317395318962, + "learning_rate": 0.0001580693725159581, + "loss": 0.7106, + "mean_token_accuracy": 0.7875912904739379, + "num_tokens": 71081019.0, + "step": 20890 + }, + { + "epoch": 0.20976353928299007, + "learning_rate": 0.000158049299449998, + "loss": 0.7555, + "mean_token_accuracy": 0.7696977019309997, + "num_tokens": 71115195.0, + "step": 20900 + }, + { + "epoch": 0.20986390461279056, + "learning_rate": 0.0001580292263840379, + "loss": 0.7546, + "mean_token_accuracy": 0.7728437840938568, + "num_tokens": 71148512.0, + "step": 20910 + }, + { + "epoch": 0.20996426994259104, + "learning_rate": 0.00015800915331807782, + "loss": 0.7693, + "mean_token_accuracy": 0.7716422200202941, + "num_tokens": 71182644.0, + "step": 20920 + }, + { + "epoch": 0.2100646352723915, + "learning_rate": 0.0001579890802521177, + "loss": 0.7809, + "mean_token_accuracy": 0.7700718164443969, + "num_tokens": 71216736.0, + "step": 20930 + }, + { + "epoch": 0.21016500060219198, + "learning_rate": 0.0001579690071861576, + "loss": 0.7831, + "mean_token_accuracy": 0.7644835889339447, + "num_tokens": 71251048.0, + "step": 20940 + }, + { + "epoch": 0.21026536593199247, + "learning_rate": 0.00015794893412019752, + "loss": 0.7408, + "mean_token_accuracy": 0.7768671214580536, + "num_tokens": 71285103.0, + "step": 20950 + }, + { + "epoch": 0.21036573126179292, + "learning_rate": 0.00015792886105423743, + "loss": 0.7712, + "mean_token_accuracy": 0.7657074928283691, + "num_tokens": 71319516.0, + "step": 20960 + }, + { + "epoch": 0.2104660965915934, + "learning_rate": 0.00015790878798827734, + "loss": 0.7708, + "mean_token_accuracy": 0.7705487966537475, + "num_tokens": 71352939.0, + "step": 20970 + }, + { + "epoch": 0.21056646192139386, + "learning_rate": 0.00015788871492231725, + "loss": 0.7799, + "mean_token_accuracy": 0.7726272165775299, + "num_tokens": 71388027.0, + "step": 20980 + }, + { + "epoch": 0.21066682725119434, + "learning_rate": 0.00015786864185635715, + "loss": 0.769, + "mean_token_accuracy": 0.7712588965892792, + "num_tokens": 71421342.0, + "step": 20990 + }, + { + "epoch": 0.21076719258099483, + "learning_rate": 0.00015784856879039704, + "loss": 0.7768, + "mean_token_accuracy": 0.7639996528625488, + "num_tokens": 71455351.0, + "step": 21000 + }, + { + "epoch": 0.21086755791079528, + "learning_rate": 0.00015782849572443697, + "loss": 0.7589, + "mean_token_accuracy": 0.7738116085529327, + "num_tokens": 71489546.0, + "step": 21010 + }, + { + "epoch": 0.21096792324059577, + "learning_rate": 0.00015780842265847685, + "loss": 0.7451, + "mean_token_accuracy": 0.7762113988399506, + "num_tokens": 71522857.0, + "step": 21020 + }, + { + "epoch": 0.21106828857039625, + "learning_rate": 0.00015778834959251676, + "loss": 0.7845, + "mean_token_accuracy": 0.7659790396690369, + "num_tokens": 71556864.0, + "step": 21030 + }, + { + "epoch": 0.2111686539001967, + "learning_rate": 0.00015776827652655667, + "loss": 0.749, + "mean_token_accuracy": 0.7743443191051483, + "num_tokens": 71590124.0, + "step": 21040 + }, + { + "epoch": 0.2112690192299972, + "learning_rate": 0.00015774820346059658, + "loss": 0.7793, + "mean_token_accuracy": 0.7672454655170441, + "num_tokens": 71625632.0, + "step": 21050 + }, + { + "epoch": 0.21136938455979767, + "learning_rate": 0.00015772813039463649, + "loss": 0.736, + "mean_token_accuracy": 0.7821826696395874, + "num_tokens": 71659529.0, + "step": 21060 + }, + { + "epoch": 0.21146974988959813, + "learning_rate": 0.0001577080573286764, + "loss": 0.7416, + "mean_token_accuracy": 0.780550765991211, + "num_tokens": 71693522.0, + "step": 21070 + }, + { + "epoch": 0.2115701152193986, + "learning_rate": 0.0001576879842627163, + "loss": 0.7656, + "mean_token_accuracy": 0.7747459173202514, + "num_tokens": 71727633.0, + "step": 21080 + }, + { + "epoch": 0.2116704805491991, + "learning_rate": 0.00015766791119675618, + "loss": 0.7822, + "mean_token_accuracy": 0.7633500158786773, + "num_tokens": 71761519.0, + "step": 21090 + }, + { + "epoch": 0.21177084587899955, + "learning_rate": 0.00015764783813079612, + "loss": 0.7684, + "mean_token_accuracy": 0.7736807346343995, + "num_tokens": 71795381.0, + "step": 21100 + }, + { + "epoch": 0.21187121120880004, + "learning_rate": 0.000157627765064836, + "loss": 0.7485, + "mean_token_accuracy": 0.7741257667541503, + "num_tokens": 71829951.0, + "step": 21110 + }, + { + "epoch": 0.2119715765386005, + "learning_rate": 0.0001576076919988759, + "loss": 0.7816, + "mean_token_accuracy": 0.7627883315086365, + "num_tokens": 71864229.0, + "step": 21120 + }, + { + "epoch": 0.21207194186840098, + "learning_rate": 0.00015758761893291582, + "loss": 0.769, + "mean_token_accuracy": 0.770053106546402, + "num_tokens": 71898017.0, + "step": 21130 + }, + { + "epoch": 0.21217230719820146, + "learning_rate": 0.00015756754586695573, + "loss": 0.7583, + "mean_token_accuracy": 0.7741436541080475, + "num_tokens": 71932994.0, + "step": 21140 + }, + { + "epoch": 0.21227267252800192, + "learning_rate": 0.00015754747280099563, + "loss": 0.766, + "mean_token_accuracy": 0.7751873314380646, + "num_tokens": 71967639.0, + "step": 21150 + }, + { + "epoch": 0.2123730378578024, + "learning_rate": 0.00015752739973503554, + "loss": 0.7616, + "mean_token_accuracy": 0.7707334399223328, + "num_tokens": 72001602.0, + "step": 21160 + }, + { + "epoch": 0.21247340318760288, + "learning_rate": 0.00015750732666907545, + "loss": 0.7438, + "mean_token_accuracy": 0.7694995701313019, + "num_tokens": 72035995.0, + "step": 21170 + }, + { + "epoch": 0.21257376851740334, + "learning_rate": 0.00015748725360311533, + "loss": 0.7566, + "mean_token_accuracy": 0.7757935225963593, + "num_tokens": 72070180.0, + "step": 21180 + }, + { + "epoch": 0.21267413384720382, + "learning_rate": 0.00015746718053715527, + "loss": 0.7736, + "mean_token_accuracy": 0.7682357907295227, + "num_tokens": 72104000.0, + "step": 21190 + }, + { + "epoch": 0.2127744991770043, + "learning_rate": 0.00015744710747119515, + "loss": 0.7167, + "mean_token_accuracy": 0.7844587206840515, + "num_tokens": 72138835.0, + "step": 21200 + }, + { + "epoch": 0.21287486450680476, + "learning_rate": 0.00015742703440523506, + "loss": 0.7839, + "mean_token_accuracy": 0.7647915065288544, + "num_tokens": 72172464.0, + "step": 21210 + }, + { + "epoch": 0.21297522983660525, + "learning_rate": 0.00015740696133927497, + "loss": 0.778, + "mean_token_accuracy": 0.7714803338050842, + "num_tokens": 72207750.0, + "step": 21220 + }, + { + "epoch": 0.21307559516640573, + "learning_rate": 0.00015738688827331488, + "loss": 0.7477, + "mean_token_accuracy": 0.7713371753692627, + "num_tokens": 72241130.0, + "step": 21230 + }, + { + "epoch": 0.21317596049620618, + "learning_rate": 0.00015736681520735478, + "loss": 0.7772, + "mean_token_accuracy": 0.7683083772659302, + "num_tokens": 72275096.0, + "step": 21240 + }, + { + "epoch": 0.21327632582600667, + "learning_rate": 0.0001573467421413947, + "loss": 0.7589, + "mean_token_accuracy": 0.7768821716308594, + "num_tokens": 72309015.0, + "step": 21250 + }, + { + "epoch": 0.21337669115580712, + "learning_rate": 0.00015732666907543457, + "loss": 0.7583, + "mean_token_accuracy": 0.7699033319950104, + "num_tokens": 72343249.0, + "step": 21260 + }, + { + "epoch": 0.2134770564856076, + "learning_rate": 0.0001573065960094745, + "loss": 0.77, + "mean_token_accuracy": 0.771565067768097, + "num_tokens": 72377915.0, + "step": 21270 + }, + { + "epoch": 0.2135774218154081, + "learning_rate": 0.0001572865229435144, + "loss": 0.7458, + "mean_token_accuracy": 0.7759322106838227, + "num_tokens": 72410908.0, + "step": 21280 + }, + { + "epoch": 0.21367778714520855, + "learning_rate": 0.0001572664498775543, + "loss": 0.7901, + "mean_token_accuracy": 0.7675193965435028, + "num_tokens": 72445208.0, + "step": 21290 + }, + { + "epoch": 0.21377815247500903, + "learning_rate": 0.0001572463768115942, + "loss": 0.7449, + "mean_token_accuracy": 0.7791765749454498, + "num_tokens": 72479582.0, + "step": 21300 + }, + { + "epoch": 0.21387851780480951, + "learning_rate": 0.00015722630374563412, + "loss": 0.7656, + "mean_token_accuracy": 0.7676794767379761, + "num_tokens": 72513685.0, + "step": 21310 + }, + { + "epoch": 0.21397888313460997, + "learning_rate": 0.00015720623067967402, + "loss": 0.7499, + "mean_token_accuracy": 0.7740518152713776, + "num_tokens": 72547705.0, + "step": 21320 + }, + { + "epoch": 0.21407924846441045, + "learning_rate": 0.00015718615761371393, + "loss": 0.7408, + "mean_token_accuracy": 0.7749380826950073, + "num_tokens": 72581639.0, + "step": 21330 + }, + { + "epoch": 0.21417961379421094, + "learning_rate": 0.00015716608454775384, + "loss": 0.759, + "mean_token_accuracy": 0.7758741557598114, + "num_tokens": 72615597.0, + "step": 21340 + }, + { + "epoch": 0.2142799791240114, + "learning_rate": 0.00015714601148179372, + "loss": 0.7965, + "mean_token_accuracy": 0.7671333730220795, + "num_tokens": 72649300.0, + "step": 21350 + }, + { + "epoch": 0.21438034445381188, + "learning_rate": 0.00015712593841583366, + "loss": 0.7664, + "mean_token_accuracy": 0.7697389960289002, + "num_tokens": 72683135.0, + "step": 21360 + }, + { + "epoch": 0.21448070978361236, + "learning_rate": 0.00015710586534987354, + "loss": 0.742, + "mean_token_accuracy": 0.7795991182327271, + "num_tokens": 72717613.0, + "step": 21370 + }, + { + "epoch": 0.21458107511341282, + "learning_rate": 0.00015708579228391345, + "loss": 0.7424, + "mean_token_accuracy": 0.7717825472354889, + "num_tokens": 72751495.0, + "step": 21380 + }, + { + "epoch": 0.2146814404432133, + "learning_rate": 0.00015706571921795336, + "loss": 0.7464, + "mean_token_accuracy": 0.7756230950355529, + "num_tokens": 72785472.0, + "step": 21390 + }, + { + "epoch": 0.21478180577301376, + "learning_rate": 0.00015704564615199326, + "loss": 0.7617, + "mean_token_accuracy": 0.7696384608745575, + "num_tokens": 72819465.0, + "step": 21400 + }, + { + "epoch": 0.21488217110281424, + "learning_rate": 0.00015702557308603317, + "loss": 0.7665, + "mean_token_accuracy": 0.7731923341751099, + "num_tokens": 72852889.0, + "step": 21410 + }, + { + "epoch": 0.21498253643261472, + "learning_rate": 0.00015700550002007308, + "loss": 0.7428, + "mean_token_accuracy": 0.7707126796245575, + "num_tokens": 72886839.0, + "step": 21420 + }, + { + "epoch": 0.21508290176241518, + "learning_rate": 0.000156985426954113, + "loss": 0.7258, + "mean_token_accuracy": 0.7753783881664276, + "num_tokens": 72921136.0, + "step": 21430 + }, + { + "epoch": 0.21518326709221566, + "learning_rate": 0.00015696535388815287, + "loss": 0.7576, + "mean_token_accuracy": 0.7778366923332214, + "num_tokens": 72955468.0, + "step": 21440 + }, + { + "epoch": 0.21528363242201615, + "learning_rate": 0.0001569452808221928, + "loss": 0.7584, + "mean_token_accuracy": 0.770528769493103, + "num_tokens": 72989801.0, + "step": 21450 + }, + { + "epoch": 0.2153839977518166, + "learning_rate": 0.0001569252077562327, + "loss": 0.7724, + "mean_token_accuracy": 0.7657631397247314, + "num_tokens": 73023755.0, + "step": 21460 + }, + { + "epoch": 0.2154843630816171, + "learning_rate": 0.0001569051346902726, + "loss": 0.7782, + "mean_token_accuracy": 0.7705927014350891, + "num_tokens": 73057480.0, + "step": 21470 + }, + { + "epoch": 0.21558472841141757, + "learning_rate": 0.0001568850616243125, + "loss": 0.7788, + "mean_token_accuracy": 0.7675239384174347, + "num_tokens": 73091640.0, + "step": 21480 + }, + { + "epoch": 0.21568509374121803, + "learning_rate": 0.0001568649885583524, + "loss": 0.7724, + "mean_token_accuracy": 0.7599137783050537, + "num_tokens": 73125111.0, + "step": 21490 + }, + { + "epoch": 0.2157854590710185, + "learning_rate": 0.0001568449154923923, + "loss": 0.7513, + "mean_token_accuracy": 0.7712138295173645, + "num_tokens": 73159105.0, + "step": 21500 + }, + { + "epoch": 0.215885824400819, + "learning_rate": 0.00015682484242643223, + "loss": 0.7356, + "mean_token_accuracy": 0.7795074224472046, + "num_tokens": 73192588.0, + "step": 21510 + }, + { + "epoch": 0.21598618973061945, + "learning_rate": 0.00015680476936047214, + "loss": 0.7927, + "mean_token_accuracy": 0.7678205966949463, + "num_tokens": 73225956.0, + "step": 21520 + }, + { + "epoch": 0.21608655506041993, + "learning_rate": 0.00015678469629451202, + "loss": 0.7737, + "mean_token_accuracy": 0.7745775699615478, + "num_tokens": 73259268.0, + "step": 21530 + }, + { + "epoch": 0.2161869203902204, + "learning_rate": 0.00015676462322855196, + "loss": 0.7183, + "mean_token_accuracy": 0.7816416978836059, + "num_tokens": 73293677.0, + "step": 21540 + }, + { + "epoch": 0.21628728572002087, + "learning_rate": 0.00015674455016259184, + "loss": 0.7924, + "mean_token_accuracy": 0.7706844091415406, + "num_tokens": 73327223.0, + "step": 21550 + }, + { + "epoch": 0.21638765104982136, + "learning_rate": 0.00015672447709663175, + "loss": 0.7988, + "mean_token_accuracy": 0.7607482850551606, + "num_tokens": 73361275.0, + "step": 21560 + }, + { + "epoch": 0.2164880163796218, + "learning_rate": 0.00015670440403067165, + "loss": 0.7277, + "mean_token_accuracy": 0.7849364280700684, + "num_tokens": 73395290.0, + "step": 21570 + }, + { + "epoch": 0.2165883817094223, + "learning_rate": 0.00015668433096471156, + "loss": 0.7582, + "mean_token_accuracy": 0.77339026927948, + "num_tokens": 73429209.0, + "step": 21580 + }, + { + "epoch": 0.21668874703922278, + "learning_rate": 0.00015666425789875144, + "loss": 0.766, + "mean_token_accuracy": 0.7696726858615875, + "num_tokens": 73463512.0, + "step": 21590 + }, + { + "epoch": 0.21678911236902323, + "learning_rate": 0.00015664418483279138, + "loss": 0.752, + "mean_token_accuracy": 0.7735897541046143, + "num_tokens": 73497731.0, + "step": 21600 + }, + { + "epoch": 0.21688947769882372, + "learning_rate": 0.00015662411176683126, + "loss": 0.7642, + "mean_token_accuracy": 0.7691661059856415, + "num_tokens": 73532012.0, + "step": 21610 + }, + { + "epoch": 0.2169898430286242, + "learning_rate": 0.00015660403870087117, + "loss": 0.7731, + "mean_token_accuracy": 0.7705914676189423, + "num_tokens": 73566607.0, + "step": 21620 + }, + { + "epoch": 0.21709020835842466, + "learning_rate": 0.00015658396563491108, + "loss": 0.7882, + "mean_token_accuracy": 0.7648298919200898, + "num_tokens": 73601959.0, + "step": 21630 + }, + { + "epoch": 0.21719057368822514, + "learning_rate": 0.00015656389256895099, + "loss": 0.7759, + "mean_token_accuracy": 0.7717965483665467, + "num_tokens": 73635868.0, + "step": 21640 + }, + { + "epoch": 0.21729093901802563, + "learning_rate": 0.0001565438195029909, + "loss": 0.7722, + "mean_token_accuracy": 0.770391458272934, + "num_tokens": 73669533.0, + "step": 21650 + }, + { + "epoch": 0.21739130434782608, + "learning_rate": 0.0001565237464370308, + "loss": 0.7659, + "mean_token_accuracy": 0.7714470684528351, + "num_tokens": 73704028.0, + "step": 21660 + }, + { + "epoch": 0.21749166967762656, + "learning_rate": 0.0001565036733710707, + "loss": 0.7889, + "mean_token_accuracy": 0.7684951424598694, + "num_tokens": 73738628.0, + "step": 21670 + }, + { + "epoch": 0.21759203500742705, + "learning_rate": 0.0001564836003051106, + "loss": 0.7517, + "mean_token_accuracy": 0.7769899666309357, + "num_tokens": 73772208.0, + "step": 21680 + }, + { + "epoch": 0.2176924003372275, + "learning_rate": 0.00015646352723915053, + "loss": 0.7497, + "mean_token_accuracy": 0.7768558323383331, + "num_tokens": 73806372.0, + "step": 21690 + }, + { + "epoch": 0.217792765667028, + "learning_rate": 0.0001564434541731904, + "loss": 0.7573, + "mean_token_accuracy": 0.7735520601272583, + "num_tokens": 73840098.0, + "step": 21700 + }, + { + "epoch": 0.21789313099682844, + "learning_rate": 0.00015642338110723032, + "loss": 0.7249, + "mean_token_accuracy": 0.781202632188797, + "num_tokens": 73873739.0, + "step": 21710 + }, + { + "epoch": 0.21799349632662893, + "learning_rate": 0.00015640330804127023, + "loss": 0.7925, + "mean_token_accuracy": 0.7633719384670258, + "num_tokens": 73907501.0, + "step": 21720 + }, + { + "epoch": 0.2180938616564294, + "learning_rate": 0.00015638323497531013, + "loss": 0.7783, + "mean_token_accuracy": 0.7692427694797516, + "num_tokens": 73941303.0, + "step": 21730 + }, + { + "epoch": 0.21819422698622987, + "learning_rate": 0.00015636316190935004, + "loss": 0.8132, + "mean_token_accuracy": 0.7652038037776947, + "num_tokens": 73975219.0, + "step": 21740 + }, + { + "epoch": 0.21829459231603035, + "learning_rate": 0.00015634308884338995, + "loss": 0.7565, + "mean_token_accuracy": 0.7756443738937377, + "num_tokens": 74009478.0, + "step": 21750 + }, + { + "epoch": 0.21839495764583083, + "learning_rate": 0.00015632301577742986, + "loss": 0.7595, + "mean_token_accuracy": 0.7766941070556641, + "num_tokens": 74043682.0, + "step": 21760 + }, + { + "epoch": 0.2184953229756313, + "learning_rate": 0.00015630294271146974, + "loss": 0.7673, + "mean_token_accuracy": 0.7681203067302704, + "num_tokens": 74077408.0, + "step": 21770 + }, + { + "epoch": 0.21859568830543177, + "learning_rate": 0.00015628286964550968, + "loss": 0.7186, + "mean_token_accuracy": 0.7839077115058899, + "num_tokens": 74111317.0, + "step": 21780 + }, + { + "epoch": 0.21869605363523226, + "learning_rate": 0.00015626279657954956, + "loss": 0.771, + "mean_token_accuracy": 0.7729612588882446, + "num_tokens": 74145562.0, + "step": 21790 + }, + { + "epoch": 0.2187964189650327, + "learning_rate": 0.0001562427235135895, + "loss": 0.7508, + "mean_token_accuracy": 0.7716224253177643, + "num_tokens": 74179412.0, + "step": 21800 + }, + { + "epoch": 0.2188967842948332, + "learning_rate": 0.00015622265044762937, + "loss": 0.7946, + "mean_token_accuracy": 0.7600009620189667, + "num_tokens": 74212780.0, + "step": 21810 + }, + { + "epoch": 0.21899714962463368, + "learning_rate": 0.00015620257738166928, + "loss": 0.7515, + "mean_token_accuracy": 0.7766862094402314, + "num_tokens": 74246670.0, + "step": 21820 + }, + { + "epoch": 0.21909751495443414, + "learning_rate": 0.0001561825043157092, + "loss": 0.7785, + "mean_token_accuracy": 0.7634067952632904, + "num_tokens": 74280425.0, + "step": 21830 + }, + { + "epoch": 0.21919788028423462, + "learning_rate": 0.0001561624312497491, + "loss": 0.7571, + "mean_token_accuracy": 0.772942304611206, + "num_tokens": 74314451.0, + "step": 21840 + }, + { + "epoch": 0.21929824561403508, + "learning_rate": 0.00015614235818378898, + "loss": 0.8118, + "mean_token_accuracy": 0.7635380804538727, + "num_tokens": 74348625.0, + "step": 21850 + }, + { + "epoch": 0.21939861094383556, + "learning_rate": 0.00015612228511782892, + "loss": 0.7621, + "mean_token_accuracy": 0.7696048498153687, + "num_tokens": 74382687.0, + "step": 21860 + }, + { + "epoch": 0.21949897627363604, + "learning_rate": 0.00015610221205186883, + "loss": 0.7441, + "mean_token_accuracy": 0.7728609502315521, + "num_tokens": 74416683.0, + "step": 21870 + }, + { + "epoch": 0.2195993416034365, + "learning_rate": 0.0001560821389859087, + "loss": 0.7681, + "mean_token_accuracy": 0.7727586686611175, + "num_tokens": 74450751.0, + "step": 21880 + }, + { + "epoch": 0.21969970693323698, + "learning_rate": 0.00015606206591994864, + "loss": 0.749, + "mean_token_accuracy": 0.7788787484169006, + "num_tokens": 74484170.0, + "step": 21890 + }, + { + "epoch": 0.21980007226303747, + "learning_rate": 0.00015604199285398852, + "loss": 0.7495, + "mean_token_accuracy": 0.7776457905769348, + "num_tokens": 74518553.0, + "step": 21900 + }, + { + "epoch": 0.21990043759283792, + "learning_rate": 0.00015602191978802843, + "loss": 0.7677, + "mean_token_accuracy": 0.7708371758460999, + "num_tokens": 74553087.0, + "step": 21910 + }, + { + "epoch": 0.2200008029226384, + "learning_rate": 0.00015600184672206834, + "loss": 0.7525, + "mean_token_accuracy": 0.7738921821117402, + "num_tokens": 74587675.0, + "step": 21920 + }, + { + "epoch": 0.2201011682524389, + "learning_rate": 0.00015598177365610825, + "loss": 0.7449, + "mean_token_accuracy": 0.7725287139415741, + "num_tokens": 74621433.0, + "step": 21930 + }, + { + "epoch": 0.22020153358223934, + "learning_rate": 0.00015596170059014813, + "loss": 0.7384, + "mean_token_accuracy": 0.7794537603855133, + "num_tokens": 74655139.0, + "step": 21940 + }, + { + "epoch": 0.22030189891203983, + "learning_rate": 0.00015594162752418807, + "loss": 0.7527, + "mean_token_accuracy": 0.7764513313770294, + "num_tokens": 74689015.0, + "step": 21950 + }, + { + "epoch": 0.2204022642418403, + "learning_rate": 0.00015592155445822795, + "loss": 0.7209, + "mean_token_accuracy": 0.7809753298759461, + "num_tokens": 74722946.0, + "step": 21960 + }, + { + "epoch": 0.22050262957164077, + "learning_rate": 0.00015590148139226786, + "loss": 0.7704, + "mean_token_accuracy": 0.7701947748661041, + "num_tokens": 74756312.0, + "step": 21970 + }, + { + "epoch": 0.22060299490144125, + "learning_rate": 0.00015588140832630776, + "loss": 0.7618, + "mean_token_accuracy": 0.7662958800792694, + "num_tokens": 74790810.0, + "step": 21980 + }, + { + "epoch": 0.2207033602312417, + "learning_rate": 0.00015586133526034767, + "loss": 0.7343, + "mean_token_accuracy": 0.7780974447727204, + "num_tokens": 74825050.0, + "step": 21990 + }, + { + "epoch": 0.2208037255610422, + "learning_rate": 0.00015584126219438758, + "loss": 0.7648, + "mean_token_accuracy": 0.7687854588031768, + "num_tokens": 74858386.0, + "step": 22000 + }, + { + "epoch": 0.22090409089084267, + "learning_rate": 0.0001558211891284275, + "loss": 0.7859, + "mean_token_accuracy": 0.7641824066638947, + "num_tokens": 74892002.0, + "step": 22010 + }, + { + "epoch": 0.22100445622064313, + "learning_rate": 0.0001558011160624674, + "loss": 0.7778, + "mean_token_accuracy": 0.7700320959091187, + "num_tokens": 74926198.0, + "step": 22020 + }, + { + "epoch": 0.22110482155044361, + "learning_rate": 0.00015578104299650728, + "loss": 0.7513, + "mean_token_accuracy": 0.77521892786026, + "num_tokens": 74960848.0, + "step": 22030 + }, + { + "epoch": 0.2212051868802441, + "learning_rate": 0.00015576096993054721, + "loss": 0.7329, + "mean_token_accuracy": 0.7798405706882476, + "num_tokens": 74994390.0, + "step": 22040 + }, + { + "epoch": 0.22130555221004455, + "learning_rate": 0.0001557408968645871, + "loss": 0.7424, + "mean_token_accuracy": 0.7813081204891205, + "num_tokens": 75028365.0, + "step": 22050 + }, + { + "epoch": 0.22140591753984504, + "learning_rate": 0.000155720823798627, + "loss": 0.743, + "mean_token_accuracy": 0.7755156219005584, + "num_tokens": 75062163.0, + "step": 22060 + }, + { + "epoch": 0.22150628286964552, + "learning_rate": 0.0001557007507326669, + "loss": 0.7459, + "mean_token_accuracy": 0.7786991477012635, + "num_tokens": 75095932.0, + "step": 22070 + }, + { + "epoch": 0.22160664819944598, + "learning_rate": 0.00015568067766670682, + "loss": 0.7628, + "mean_token_accuracy": 0.7725139379501342, + "num_tokens": 75130192.0, + "step": 22080 + }, + { + "epoch": 0.22170701352924646, + "learning_rate": 0.00015566060460074673, + "loss": 0.7378, + "mean_token_accuracy": 0.7728904247283935, + "num_tokens": 75163781.0, + "step": 22090 + }, + { + "epoch": 0.22180737885904694, + "learning_rate": 0.00015564053153478664, + "loss": 0.7264, + "mean_token_accuracy": 0.7793911337852478, + "num_tokens": 75197120.0, + "step": 22100 + }, + { + "epoch": 0.2219077441888474, + "learning_rate": 0.00015562045846882655, + "loss": 0.7322, + "mean_token_accuracy": 0.7795130431652069, + "num_tokens": 75230906.0, + "step": 22110 + }, + { + "epoch": 0.22200810951864788, + "learning_rate": 0.00015560038540286643, + "loss": 0.7677, + "mean_token_accuracy": 0.7698107719421386, + "num_tokens": 75264321.0, + "step": 22120 + }, + { + "epoch": 0.22210847484844834, + "learning_rate": 0.00015558031233690636, + "loss": 0.7681, + "mean_token_accuracy": 0.7709541559219361, + "num_tokens": 75298107.0, + "step": 22130 + }, + { + "epoch": 0.22220884017824882, + "learning_rate": 0.00015556023927094624, + "loss": 0.7832, + "mean_token_accuracy": 0.7653647840023041, + "num_tokens": 75332461.0, + "step": 22140 + }, + { + "epoch": 0.2223092055080493, + "learning_rate": 0.00015554016620498615, + "loss": 0.7637, + "mean_token_accuracy": 0.7696703612804413, + "num_tokens": 75366882.0, + "step": 22150 + }, + { + "epoch": 0.22240957083784976, + "learning_rate": 0.00015552009313902606, + "loss": 0.7857, + "mean_token_accuracy": 0.7655081987380982, + "num_tokens": 75401726.0, + "step": 22160 + }, + { + "epoch": 0.22250993616765025, + "learning_rate": 0.00015550002007306597, + "loss": 0.7576, + "mean_token_accuracy": 0.7751639306545257, + "num_tokens": 75435612.0, + "step": 22170 + }, + { + "epoch": 0.22261030149745073, + "learning_rate": 0.00015547994700710585, + "loss": 0.7773, + "mean_token_accuracy": 0.771637785434723, + "num_tokens": 75469010.0, + "step": 22180 + }, + { + "epoch": 0.22271066682725119, + "learning_rate": 0.0001554598739411458, + "loss": 0.7459, + "mean_token_accuracy": 0.7756258308887481, + "num_tokens": 75502834.0, + "step": 22190 + }, + { + "epoch": 0.22281103215705167, + "learning_rate": 0.00015543980087518567, + "loss": 0.7541, + "mean_token_accuracy": 0.7758987307548523, + "num_tokens": 75537291.0, + "step": 22200 + }, + { + "epoch": 0.22291139748685215, + "learning_rate": 0.00015541972780922558, + "loss": 0.7639, + "mean_token_accuracy": 0.7698519408702851, + "num_tokens": 75570830.0, + "step": 22210 + }, + { + "epoch": 0.2230117628166526, + "learning_rate": 0.0001553996547432655, + "loss": 0.7553, + "mean_token_accuracy": 0.7741851449012757, + "num_tokens": 75604702.0, + "step": 22220 + }, + { + "epoch": 0.2231121281464531, + "learning_rate": 0.0001553795816773054, + "loss": 0.7774, + "mean_token_accuracy": 0.7693216919898986, + "num_tokens": 75638956.0, + "step": 22230 + }, + { + "epoch": 0.22321249347625358, + "learning_rate": 0.0001553595086113453, + "loss": 0.7907, + "mean_token_accuracy": 0.7661739885807037, + "num_tokens": 75673235.0, + "step": 22240 + }, + { + "epoch": 0.22331285880605403, + "learning_rate": 0.0001553394355453852, + "loss": 0.7663, + "mean_token_accuracy": 0.776247090101242, + "num_tokens": 75707292.0, + "step": 22250 + }, + { + "epoch": 0.22341322413585452, + "learning_rate": 0.00015531936247942512, + "loss": 0.7721, + "mean_token_accuracy": 0.7690892219543457, + "num_tokens": 75741060.0, + "step": 22260 + }, + { + "epoch": 0.22351358946565497, + "learning_rate": 0.000155299289413465, + "loss": 0.7414, + "mean_token_accuracy": 0.7747559785842896, + "num_tokens": 75775464.0, + "step": 22270 + }, + { + "epoch": 0.22361395479545546, + "learning_rate": 0.00015527921634750494, + "loss": 0.7736, + "mean_token_accuracy": 0.769670695066452, + "num_tokens": 75810173.0, + "step": 22280 + }, + { + "epoch": 0.22371432012525594, + "learning_rate": 0.00015525914328154482, + "loss": 0.7707, + "mean_token_accuracy": 0.7710635662078857, + "num_tokens": 75844231.0, + "step": 22290 + }, + { + "epoch": 0.2238146854550564, + "learning_rate": 0.00015523907021558473, + "loss": 0.7926, + "mean_token_accuracy": 0.7665982961654663, + "num_tokens": 75878387.0, + "step": 22300 + }, + { + "epoch": 0.22391505078485688, + "learning_rate": 0.00015521899714962463, + "loss": 0.7763, + "mean_token_accuracy": 0.7694206535816193, + "num_tokens": 75912285.0, + "step": 22310 + }, + { + "epoch": 0.22401541611465736, + "learning_rate": 0.00015519892408366454, + "loss": 0.7541, + "mean_token_accuracy": 0.7772053599357605, + "num_tokens": 75946814.0, + "step": 22320 + }, + { + "epoch": 0.22411578144445782, + "learning_rate": 0.00015517885101770445, + "loss": 0.7324, + "mean_token_accuracy": 0.7818355023860931, + "num_tokens": 75981088.0, + "step": 22330 + }, + { + "epoch": 0.2242161467742583, + "learning_rate": 0.00015515877795174436, + "loss": 0.76, + "mean_token_accuracy": 0.7736691057682037, + "num_tokens": 76015104.0, + "step": 22340 + }, + { + "epoch": 0.22431651210405879, + "learning_rate": 0.00015513870488578427, + "loss": 0.7855, + "mean_token_accuracy": 0.7721585512161255, + "num_tokens": 76049101.0, + "step": 22350 + }, + { + "epoch": 0.22441687743385924, + "learning_rate": 0.00015511863181982418, + "loss": 0.8257, + "mean_token_accuracy": 0.7583268821239472, + "num_tokens": 76082977.0, + "step": 22360 + }, + { + "epoch": 0.22451724276365972, + "learning_rate": 0.00015509855875386408, + "loss": 0.736, + "mean_token_accuracy": 0.7773957967758178, + "num_tokens": 76116739.0, + "step": 22370 + }, + { + "epoch": 0.2246176080934602, + "learning_rate": 0.00015507848568790397, + "loss": 0.7733, + "mean_token_accuracy": 0.7722367703914642, + "num_tokens": 76151238.0, + "step": 22380 + }, + { + "epoch": 0.22471797342326066, + "learning_rate": 0.0001550584126219439, + "loss": 0.7681, + "mean_token_accuracy": 0.7752468824386597, + "num_tokens": 76185106.0, + "step": 22390 + }, + { + "epoch": 0.22481833875306115, + "learning_rate": 0.00015503833955598378, + "loss": 0.7414, + "mean_token_accuracy": 0.7812665343284607, + "num_tokens": 76219283.0, + "step": 22400 + }, + { + "epoch": 0.2249187040828616, + "learning_rate": 0.0001550182664900237, + "loss": 0.7457, + "mean_token_accuracy": 0.7715763866901397, + "num_tokens": 76254503.0, + "step": 22410 + }, + { + "epoch": 0.2250190694126621, + "learning_rate": 0.0001549981934240636, + "loss": 0.7923, + "mean_token_accuracy": 0.7659672141075134, + "num_tokens": 76288084.0, + "step": 22420 + }, + { + "epoch": 0.22511943474246257, + "learning_rate": 0.0001549781203581035, + "loss": 0.7366, + "mean_token_accuracy": 0.7778996825218201, + "num_tokens": 76322732.0, + "step": 22430 + }, + { + "epoch": 0.22521980007226303, + "learning_rate": 0.00015495804729214342, + "loss": 0.7949, + "mean_token_accuracy": 0.7588162422180176, + "num_tokens": 76357108.0, + "step": 22440 + }, + { + "epoch": 0.2253201654020635, + "learning_rate": 0.00015493797422618332, + "loss": 0.7349, + "mean_token_accuracy": 0.7827002227306366, + "num_tokens": 76391121.0, + "step": 22450 + }, + { + "epoch": 0.225420530731864, + "learning_rate": 0.00015491790116022323, + "loss": 0.7445, + "mean_token_accuracy": 0.7849261403083801, + "num_tokens": 76425458.0, + "step": 22460 + }, + { + "epoch": 0.22552089606166445, + "learning_rate": 0.00015489782809426311, + "loss": 0.7508, + "mean_token_accuracy": 0.7736548244953155, + "num_tokens": 76458851.0, + "step": 22470 + }, + { + "epoch": 0.22562126139146493, + "learning_rate": 0.00015487775502830305, + "loss": 0.764, + "mean_token_accuracy": 0.7733363151550293, + "num_tokens": 76492919.0, + "step": 22480 + }, + { + "epoch": 0.22572162672126542, + "learning_rate": 0.00015485768196234293, + "loss": 0.7402, + "mean_token_accuracy": 0.7776598811149598, + "num_tokens": 76526610.0, + "step": 22490 + }, + { + "epoch": 0.22582199205106587, + "learning_rate": 0.00015483760889638284, + "loss": 0.769, + "mean_token_accuracy": 0.7713018953800201, + "num_tokens": 76560058.0, + "step": 22500 + }, + { + "epoch": 0.22592235738086636, + "learning_rate": 0.00015481753583042275, + "loss": 0.756, + "mean_token_accuracy": 0.7778894782066346, + "num_tokens": 76593949.0, + "step": 22510 + }, + { + "epoch": 0.22602272271066684, + "learning_rate": 0.00015479746276446266, + "loss": 0.7392, + "mean_token_accuracy": 0.7810545206069947, + "num_tokens": 76627038.0, + "step": 22520 + }, + { + "epoch": 0.2261230880404673, + "learning_rate": 0.00015477738969850254, + "loss": 0.7421, + "mean_token_accuracy": 0.7785213947296142, + "num_tokens": 76660999.0, + "step": 22530 + }, + { + "epoch": 0.22622345337026778, + "learning_rate": 0.00015475731663254247, + "loss": 0.7655, + "mean_token_accuracy": 0.7720098912715911, + "num_tokens": 76695646.0, + "step": 22540 + }, + { + "epoch": 0.22632381870006824, + "learning_rate": 0.00015473724356658236, + "loss": 0.7769, + "mean_token_accuracy": 0.7670884728431702, + "num_tokens": 76729311.0, + "step": 22550 + }, + { + "epoch": 0.22642418402986872, + "learning_rate": 0.00015471717050062226, + "loss": 0.7619, + "mean_token_accuracy": 0.7754532396793365, + "num_tokens": 76762880.0, + "step": 22560 + }, + { + "epoch": 0.2265245493596692, + "learning_rate": 0.0001546970974346622, + "loss": 0.7963, + "mean_token_accuracy": 0.7628134310245513, + "num_tokens": 76796916.0, + "step": 22570 + }, + { + "epoch": 0.22662491468946966, + "learning_rate": 0.00015467702436870208, + "loss": 0.7719, + "mean_token_accuracy": 0.765484744310379, + "num_tokens": 76831375.0, + "step": 22580 + }, + { + "epoch": 0.22672528001927014, + "learning_rate": 0.000154656951302742, + "loss": 0.7535, + "mean_token_accuracy": 0.7687456011772156, + "num_tokens": 76864517.0, + "step": 22590 + }, + { + "epoch": 0.22682564534907063, + "learning_rate": 0.0001546368782367819, + "loss": 0.7672, + "mean_token_accuracy": 0.7701222836971283, + "num_tokens": 76900131.0, + "step": 22600 + }, + { + "epoch": 0.22692601067887108, + "learning_rate": 0.0001546168051708218, + "loss": 0.7782, + "mean_token_accuracy": 0.765713906288147, + "num_tokens": 76933999.0, + "step": 22610 + }, + { + "epoch": 0.22702637600867157, + "learning_rate": 0.0001545967321048617, + "loss": 0.7807, + "mean_token_accuracy": 0.7662304699420929, + "num_tokens": 76968304.0, + "step": 22620 + }, + { + "epoch": 0.22712674133847205, + "learning_rate": 0.00015457665903890162, + "loss": 0.7814, + "mean_token_accuracy": 0.7684104800224304, + "num_tokens": 77002282.0, + "step": 22630 + }, + { + "epoch": 0.2272271066682725, + "learning_rate": 0.0001545565859729415, + "loss": 0.8023, + "mean_token_accuracy": 0.7641406416893005, + "num_tokens": 77036795.0, + "step": 22640 + }, + { + "epoch": 0.227327471998073, + "learning_rate": 0.0001545365129069814, + "loss": 0.7435, + "mean_token_accuracy": 0.7800127029418945, + "num_tokens": 77071678.0, + "step": 22650 + }, + { + "epoch": 0.22742783732787347, + "learning_rate": 0.00015451643984102132, + "loss": 0.7705, + "mean_token_accuracy": 0.7709397971630096, + "num_tokens": 77105827.0, + "step": 22660 + }, + { + "epoch": 0.22752820265767393, + "learning_rate": 0.00015449636677506123, + "loss": 0.7517, + "mean_token_accuracy": 0.7780755877494812, + "num_tokens": 77139690.0, + "step": 22670 + }, + { + "epoch": 0.2276285679874744, + "learning_rate": 0.00015447629370910114, + "loss": 0.7468, + "mean_token_accuracy": 0.7782335638999939, + "num_tokens": 77173944.0, + "step": 22680 + }, + { + "epoch": 0.22772893331727487, + "learning_rate": 0.00015445622064314105, + "loss": 0.7776, + "mean_token_accuracy": 0.7662321627140045, + "num_tokens": 77207324.0, + "step": 22690 + }, + { + "epoch": 0.22782929864707535, + "learning_rate": 0.00015443614757718095, + "loss": 0.7143, + "mean_token_accuracy": 0.7842252373695373, + "num_tokens": 77241537.0, + "step": 22700 + }, + { + "epoch": 0.22792966397687583, + "learning_rate": 0.00015441607451122084, + "loss": 0.7524, + "mean_token_accuracy": 0.7744047999382019, + "num_tokens": 77275735.0, + "step": 22710 + }, + { + "epoch": 0.2280300293066763, + "learning_rate": 0.00015439600144526077, + "loss": 0.7689, + "mean_token_accuracy": 0.7665367484092712, + "num_tokens": 77309976.0, + "step": 22720 + }, + { + "epoch": 0.22813039463647677, + "learning_rate": 0.00015437592837930065, + "loss": 0.7763, + "mean_token_accuracy": 0.7648578226566315, + "num_tokens": 77343643.0, + "step": 22730 + }, + { + "epoch": 0.22823075996627726, + "learning_rate": 0.00015435585531334056, + "loss": 0.7909, + "mean_token_accuracy": 0.7639325499534607, + "num_tokens": 77377381.0, + "step": 22740 + }, + { + "epoch": 0.2283311252960777, + "learning_rate": 0.00015433578224738047, + "loss": 0.7579, + "mean_token_accuracy": 0.7704145252704621, + "num_tokens": 77411698.0, + "step": 22750 + }, + { + "epoch": 0.2284314906258782, + "learning_rate": 0.00015431570918142038, + "loss": 0.7714, + "mean_token_accuracy": 0.7725685954093933, + "num_tokens": 77445414.0, + "step": 22760 + }, + { + "epoch": 0.22853185595567868, + "learning_rate": 0.00015429563611546029, + "loss": 0.7976, + "mean_token_accuracy": 0.7643962144851685, + "num_tokens": 77479790.0, + "step": 22770 + }, + { + "epoch": 0.22863222128547914, + "learning_rate": 0.0001542755630495002, + "loss": 0.742, + "mean_token_accuracy": 0.7726198673248291, + "num_tokens": 77513380.0, + "step": 22780 + }, + { + "epoch": 0.22873258661527962, + "learning_rate": 0.0001542554899835401, + "loss": 0.7357, + "mean_token_accuracy": 0.7799278557300567, + "num_tokens": 77547445.0, + "step": 22790 + }, + { + "epoch": 0.2288329519450801, + "learning_rate": 0.00015423541691757998, + "loss": 0.755, + "mean_token_accuracy": 0.7717826008796692, + "num_tokens": 77580805.0, + "step": 22800 + }, + { + "epoch": 0.22893331727488056, + "learning_rate": 0.00015421534385161992, + "loss": 0.7819, + "mean_token_accuracy": 0.7631809949874878, + "num_tokens": 77614939.0, + "step": 22810 + }, + { + "epoch": 0.22903368260468104, + "learning_rate": 0.0001541952707856598, + "loss": 0.765, + "mean_token_accuracy": 0.7719576239585877, + "num_tokens": 77648513.0, + "step": 22820 + }, + { + "epoch": 0.2291340479344815, + "learning_rate": 0.0001541751977196997, + "loss": 0.7378, + "mean_token_accuracy": 0.7783514261245728, + "num_tokens": 77682577.0, + "step": 22830 + }, + { + "epoch": 0.22923441326428198, + "learning_rate": 0.00015415512465373962, + "loss": 0.7595, + "mean_token_accuracy": 0.7713116824626922, + "num_tokens": 77716512.0, + "step": 22840 + }, + { + "epoch": 0.22933477859408247, + "learning_rate": 0.00015413505158777953, + "loss": 0.7539, + "mean_token_accuracy": 0.7750553786754608, + "num_tokens": 77750751.0, + "step": 22850 + }, + { + "epoch": 0.22943514392388292, + "learning_rate": 0.0001541149785218194, + "loss": 0.7468, + "mean_token_accuracy": 0.7759535074234009, + "num_tokens": 77784657.0, + "step": 22860 + }, + { + "epoch": 0.2295355092536834, + "learning_rate": 0.00015409490545585934, + "loss": 0.7643, + "mean_token_accuracy": 0.7716870188713074, + "num_tokens": 77818195.0, + "step": 22870 + }, + { + "epoch": 0.2296358745834839, + "learning_rate": 0.00015407483238989922, + "loss": 0.744, + "mean_token_accuracy": 0.7780516982078552, + "num_tokens": 77852683.0, + "step": 22880 + }, + { + "epoch": 0.22973623991328435, + "learning_rate": 0.00015405475932393913, + "loss": 0.799, + "mean_token_accuracy": 0.763060474395752, + "num_tokens": 77887523.0, + "step": 22890 + }, + { + "epoch": 0.22983660524308483, + "learning_rate": 0.00015403468625797904, + "loss": 0.7758, + "mean_token_accuracy": 0.7726968407630921, + "num_tokens": 77921201.0, + "step": 22900 + }, + { + "epoch": 0.2299369705728853, + "learning_rate": 0.00015401461319201895, + "loss": 0.7513, + "mean_token_accuracy": 0.782043993473053, + "num_tokens": 77955086.0, + "step": 22910 + }, + { + "epoch": 0.23003733590268577, + "learning_rate": 0.00015399454012605889, + "loss": 0.7712, + "mean_token_accuracy": 0.7686130344867707, + "num_tokens": 77989111.0, + "step": 22920 + }, + { + "epoch": 0.23013770123248625, + "learning_rate": 0.00015397446706009877, + "loss": 0.7319, + "mean_token_accuracy": 0.7798277974128723, + "num_tokens": 78022530.0, + "step": 22930 + }, + { + "epoch": 0.23023806656228674, + "learning_rate": 0.00015395439399413868, + "loss": 0.7743, + "mean_token_accuracy": 0.7693477272987366, + "num_tokens": 78057045.0, + "step": 22940 + }, + { + "epoch": 0.2303384318920872, + "learning_rate": 0.00015393432092817858, + "loss": 0.7808, + "mean_token_accuracy": 0.7679920077323914, + "num_tokens": 78091534.0, + "step": 22950 + }, + { + "epoch": 0.23043879722188768, + "learning_rate": 0.0001539142478622185, + "loss": 0.8153, + "mean_token_accuracy": 0.7571540176868439, + "num_tokens": 78124619.0, + "step": 22960 + }, + { + "epoch": 0.23053916255168813, + "learning_rate": 0.00015389417479625837, + "loss": 0.8063, + "mean_token_accuracy": 0.7597503304481507, + "num_tokens": 78158312.0, + "step": 22970 + }, + { + "epoch": 0.23063952788148862, + "learning_rate": 0.0001538741017302983, + "loss": 0.7322, + "mean_token_accuracy": 0.781629455089569, + "num_tokens": 78193093.0, + "step": 22980 + }, + { + "epoch": 0.2307398932112891, + "learning_rate": 0.0001538540286643382, + "loss": 0.7713, + "mean_token_accuracy": 0.7688167214393615, + "num_tokens": 78227432.0, + "step": 22990 + }, + { + "epoch": 0.23084025854108955, + "learning_rate": 0.0001538339555983781, + "loss": 0.7679, + "mean_token_accuracy": 0.772001850605011, + "num_tokens": 78261054.0, + "step": 23000 + }, + { + "epoch": 0.23094062387089004, + "learning_rate": 0.000153813882532418, + "loss": 0.8045, + "mean_token_accuracy": 0.7627824485301972, + "num_tokens": 78294990.0, + "step": 23010 + }, + { + "epoch": 0.23104098920069052, + "learning_rate": 0.00015379380946645792, + "loss": 0.7661, + "mean_token_accuracy": 0.773594182729721, + "num_tokens": 78329086.0, + "step": 23020 + }, + { + "epoch": 0.23114135453049098, + "learning_rate": 0.00015377373640049782, + "loss": 0.7651, + "mean_token_accuracy": 0.7671305358409881, + "num_tokens": 78362541.0, + "step": 23030 + }, + { + "epoch": 0.23124171986029146, + "learning_rate": 0.00015375366333453773, + "loss": 0.7923, + "mean_token_accuracy": 0.7729197859764099, + "num_tokens": 78397177.0, + "step": 23040 + }, + { + "epoch": 0.23134208519009195, + "learning_rate": 0.00015373359026857764, + "loss": 0.7604, + "mean_token_accuracy": 0.7704223334789276, + "num_tokens": 78431194.0, + "step": 23050 + }, + { + "epoch": 0.2314424505198924, + "learning_rate": 0.00015371351720261752, + "loss": 0.7749, + "mean_token_accuracy": 0.7729601800441742, + "num_tokens": 78465215.0, + "step": 23060 + }, + { + "epoch": 0.23154281584969288, + "learning_rate": 0.00015369344413665746, + "loss": 0.7676, + "mean_token_accuracy": 0.7727331995964051, + "num_tokens": 78499820.0, + "step": 23070 + }, + { + "epoch": 0.23164318117949337, + "learning_rate": 0.00015367337107069734, + "loss": 0.7887, + "mean_token_accuracy": 0.7687535941600799, + "num_tokens": 78534030.0, + "step": 23080 + }, + { + "epoch": 0.23174354650929382, + "learning_rate": 0.00015365329800473725, + "loss": 0.76, + "mean_token_accuracy": 0.7724514603614807, + "num_tokens": 78568289.0, + "step": 23090 + }, + { + "epoch": 0.2318439118390943, + "learning_rate": 0.00015363322493877716, + "loss": 0.7763, + "mean_token_accuracy": 0.7684251010417938, + "num_tokens": 78602670.0, + "step": 23100 + }, + { + "epoch": 0.23194427716889476, + "learning_rate": 0.00015361315187281706, + "loss": 0.7717, + "mean_token_accuracy": 0.7708824157714844, + "num_tokens": 78637550.0, + "step": 23110 + }, + { + "epoch": 0.23204464249869525, + "learning_rate": 0.00015359307880685697, + "loss": 0.7743, + "mean_token_accuracy": 0.7683057010173797, + "num_tokens": 78671462.0, + "step": 23120 + }, + { + "epoch": 0.23214500782849573, + "learning_rate": 0.00015357300574089688, + "loss": 0.7418, + "mean_token_accuracy": 0.7737292468547821, + "num_tokens": 78705589.0, + "step": 23130 + }, + { + "epoch": 0.2322453731582962, + "learning_rate": 0.0001535529326749368, + "loss": 0.765, + "mean_token_accuracy": 0.7699859380722046, + "num_tokens": 78739648.0, + "step": 23140 + }, + { + "epoch": 0.23234573848809667, + "learning_rate": 0.00015353285960897667, + "loss": 0.7744, + "mean_token_accuracy": 0.7685719311237336, + "num_tokens": 78773935.0, + "step": 23150 + }, + { + "epoch": 0.23244610381789715, + "learning_rate": 0.0001535127865430166, + "loss": 0.7922, + "mean_token_accuracy": 0.7677593052387237, + "num_tokens": 78808407.0, + "step": 23160 + }, + { + "epoch": 0.2325464691476976, + "learning_rate": 0.0001534927134770565, + "loss": 0.7943, + "mean_token_accuracy": 0.765311723947525, + "num_tokens": 78842722.0, + "step": 23170 + }, + { + "epoch": 0.2326468344774981, + "learning_rate": 0.0001534726404110964, + "loss": 0.7831, + "mean_token_accuracy": 0.7717867314815521, + "num_tokens": 78876265.0, + "step": 23180 + }, + { + "epoch": 0.23274719980729858, + "learning_rate": 0.0001534525673451363, + "loss": 0.7645, + "mean_token_accuracy": 0.7726698100566864, + "num_tokens": 78910424.0, + "step": 23190 + }, + { + "epoch": 0.23284756513709903, + "learning_rate": 0.00015343249427917621, + "loss": 0.7541, + "mean_token_accuracy": 0.7792783617973328, + "num_tokens": 78944040.0, + "step": 23200 + }, + { + "epoch": 0.23294793046689952, + "learning_rate": 0.0001534124212132161, + "loss": 0.7767, + "mean_token_accuracy": 0.7686317384243011, + "num_tokens": 78977131.0, + "step": 23210 + }, + { + "epoch": 0.2330482957967, + "learning_rate": 0.00015339234814725603, + "loss": 0.7369, + "mean_token_accuracy": 0.776541656255722, + "num_tokens": 79011287.0, + "step": 23220 + }, + { + "epoch": 0.23314866112650046, + "learning_rate": 0.0001533722750812959, + "loss": 0.7657, + "mean_token_accuracy": 0.7776280224323273, + "num_tokens": 79044620.0, + "step": 23230 + }, + { + "epoch": 0.23324902645630094, + "learning_rate": 0.00015335220201533582, + "loss": 0.7912, + "mean_token_accuracy": 0.7631687164306641, + "num_tokens": 79078598.0, + "step": 23240 + }, + { + "epoch": 0.2333493917861014, + "learning_rate": 0.00015333212894937573, + "loss": 0.7749, + "mean_token_accuracy": 0.7703653693199157, + "num_tokens": 79112267.0, + "step": 23250 + }, + { + "epoch": 0.23344975711590188, + "learning_rate": 0.00015331205588341564, + "loss": 0.723, + "mean_token_accuracy": 0.7808611869812012, + "num_tokens": 79146140.0, + "step": 23260 + }, + { + "epoch": 0.23355012244570236, + "learning_rate": 0.00015329198281745555, + "loss": 0.7877, + "mean_token_accuracy": 0.7686753094196319, + "num_tokens": 79179376.0, + "step": 23270 + }, + { + "epoch": 0.23365048777550282, + "learning_rate": 0.00015327190975149545, + "loss": 0.7795, + "mean_token_accuracy": 0.7692699015140534, + "num_tokens": 79212928.0, + "step": 23280 + }, + { + "epoch": 0.2337508531053033, + "learning_rate": 0.00015325183668553536, + "loss": 0.7714, + "mean_token_accuracy": 0.7678778171539307, + "num_tokens": 79247276.0, + "step": 23290 + }, + { + "epoch": 0.23385121843510379, + "learning_rate": 0.00015323176361957524, + "loss": 0.7667, + "mean_token_accuracy": 0.7694761216640472, + "num_tokens": 79280809.0, + "step": 23300 + }, + { + "epoch": 0.23395158376490424, + "learning_rate": 0.00015321169055361518, + "loss": 0.7777, + "mean_token_accuracy": 0.7689460635185241, + "num_tokens": 79315215.0, + "step": 23310 + }, + { + "epoch": 0.23405194909470473, + "learning_rate": 0.00015319161748765506, + "loss": 0.7812, + "mean_token_accuracy": 0.7662648558616638, + "num_tokens": 79348428.0, + "step": 23320 + }, + { + "epoch": 0.2341523144245052, + "learning_rate": 0.00015317154442169497, + "loss": 0.7765, + "mean_token_accuracy": 0.7612001657485962, + "num_tokens": 79382310.0, + "step": 23330 + }, + { + "epoch": 0.23425267975430566, + "learning_rate": 0.00015315147135573488, + "loss": 0.7873, + "mean_token_accuracy": 0.7655379593372345, + "num_tokens": 79416640.0, + "step": 23340 + }, + { + "epoch": 0.23435304508410615, + "learning_rate": 0.00015313139828977479, + "loss": 0.7713, + "mean_token_accuracy": 0.7735551476478577, + "num_tokens": 79450449.0, + "step": 23350 + }, + { + "epoch": 0.23445341041390663, + "learning_rate": 0.0001531113252238147, + "loss": 0.7624, + "mean_token_accuracy": 0.7742606103420258, + "num_tokens": 79484109.0, + "step": 23360 + }, + { + "epoch": 0.2345537757437071, + "learning_rate": 0.0001530912521578546, + "loss": 0.7555, + "mean_token_accuracy": 0.7740523397922516, + "num_tokens": 79517766.0, + "step": 23370 + }, + { + "epoch": 0.23465414107350757, + "learning_rate": 0.0001530711790918945, + "loss": 0.7388, + "mean_token_accuracy": 0.7769231557846069, + "num_tokens": 79550985.0, + "step": 23380 + }, + { + "epoch": 0.23475450640330803, + "learning_rate": 0.0001530511060259344, + "loss": 0.7587, + "mean_token_accuracy": 0.7782913088798523, + "num_tokens": 79584552.0, + "step": 23390 + }, + { + "epoch": 0.2348548717331085, + "learning_rate": 0.00015303103295997433, + "loss": 0.8073, + "mean_token_accuracy": 0.7672119975090027, + "num_tokens": 79618051.0, + "step": 23400 + }, + { + "epoch": 0.234955237062909, + "learning_rate": 0.0001530109598940142, + "loss": 0.7406, + "mean_token_accuracy": 0.7801278173923493, + "num_tokens": 79652321.0, + "step": 23410 + }, + { + "epoch": 0.23505560239270945, + "learning_rate": 0.00015299088682805412, + "loss": 0.7625, + "mean_token_accuracy": 0.7745743751525879, + "num_tokens": 79685474.0, + "step": 23420 + }, + { + "epoch": 0.23515596772250993, + "learning_rate": 0.00015297081376209403, + "loss": 0.7483, + "mean_token_accuracy": 0.7806742548942566, + "num_tokens": 79718907.0, + "step": 23430 + }, + { + "epoch": 0.23525633305231042, + "learning_rate": 0.00015295074069613393, + "loss": 0.7707, + "mean_token_accuracy": 0.7705367624759674, + "num_tokens": 79752851.0, + "step": 23440 + }, + { + "epoch": 0.23535669838211087, + "learning_rate": 0.00015293066763017382, + "loss": 0.7445, + "mean_token_accuracy": 0.778471952676773, + "num_tokens": 79786545.0, + "step": 23450 + }, + { + "epoch": 0.23545706371191136, + "learning_rate": 0.00015291059456421375, + "loss": 0.7565, + "mean_token_accuracy": 0.7745211839675903, + "num_tokens": 79820372.0, + "step": 23460 + }, + { + "epoch": 0.23555742904171184, + "learning_rate": 0.00015289052149825366, + "loss": 0.7728, + "mean_token_accuracy": 0.7718680500984192, + "num_tokens": 79854552.0, + "step": 23470 + }, + { + "epoch": 0.2356577943715123, + "learning_rate": 0.00015287044843229354, + "loss": 0.7902, + "mean_token_accuracy": 0.7693752467632293, + "num_tokens": 79888384.0, + "step": 23480 + }, + { + "epoch": 0.23575815970131278, + "learning_rate": 0.00015285037536633348, + "loss": 0.7592, + "mean_token_accuracy": 0.7773387908935547, + "num_tokens": 79921343.0, + "step": 23490 + }, + { + "epoch": 0.23585852503111326, + "learning_rate": 0.00015283030230037336, + "loss": 0.7407, + "mean_token_accuracy": 0.7736146032810212, + "num_tokens": 79954869.0, + "step": 23500 + }, + { + "epoch": 0.23595889036091372, + "learning_rate": 0.0001528102292344133, + "loss": 0.75, + "mean_token_accuracy": 0.7789220571517944, + "num_tokens": 79988787.0, + "step": 23510 + }, + { + "epoch": 0.2360592556907142, + "learning_rate": 0.00015279015616845318, + "loss": 0.748, + "mean_token_accuracy": 0.7819363057613373, + "num_tokens": 80022579.0, + "step": 23520 + }, + { + "epoch": 0.23615962102051466, + "learning_rate": 0.00015277008310249308, + "loss": 0.7716, + "mean_token_accuracy": 0.7654751539230347, + "num_tokens": 80056791.0, + "step": 23530 + }, + { + "epoch": 0.23625998635031514, + "learning_rate": 0.000152750010036533, + "loss": 0.7384, + "mean_token_accuracy": 0.7784739851951599, + "num_tokens": 80091293.0, + "step": 23540 + }, + { + "epoch": 0.23636035168011563, + "learning_rate": 0.0001527299369705729, + "loss": 0.7486, + "mean_token_accuracy": 0.7739460527896881, + "num_tokens": 80125243.0, + "step": 23550 + }, + { + "epoch": 0.23646071700991608, + "learning_rate": 0.00015270986390461278, + "loss": 0.7448, + "mean_token_accuracy": 0.7724997520446777, + "num_tokens": 80159651.0, + "step": 23560 + }, + { + "epoch": 0.23656108233971657, + "learning_rate": 0.00015268979083865272, + "loss": 0.7728, + "mean_token_accuracy": 0.773425680398941, + "num_tokens": 80194166.0, + "step": 23570 + }, + { + "epoch": 0.23666144766951705, + "learning_rate": 0.0001526697177726926, + "loss": 0.7402, + "mean_token_accuracy": 0.7749640464782714, + "num_tokens": 80227835.0, + "step": 23580 + }, + { + "epoch": 0.2367618129993175, + "learning_rate": 0.0001526496447067325, + "loss": 0.7717, + "mean_token_accuracy": 0.7723572850227356, + "num_tokens": 80262461.0, + "step": 23590 + }, + { + "epoch": 0.236862178329118, + "learning_rate": 0.00015262957164077242, + "loss": 0.7917, + "mean_token_accuracy": 0.7664845049381256, + "num_tokens": 80296052.0, + "step": 23600 + }, + { + "epoch": 0.23696254365891847, + "learning_rate": 0.00015260949857481232, + "loss": 0.8065, + "mean_token_accuracy": 0.76147341132164, + "num_tokens": 80329560.0, + "step": 23610 + }, + { + "epoch": 0.23706290898871893, + "learning_rate": 0.00015258942550885223, + "loss": 0.7748, + "mean_token_accuracy": 0.7736762523651123, + "num_tokens": 80364268.0, + "step": 23620 + }, + { + "epoch": 0.2371632743185194, + "learning_rate": 0.00015256935244289214, + "loss": 0.7829, + "mean_token_accuracy": 0.7689502716064454, + "num_tokens": 80398126.0, + "step": 23630 + }, + { + "epoch": 0.2372636396483199, + "learning_rate": 0.00015254927937693205, + "loss": 0.7257, + "mean_token_accuracy": 0.7803487658500672, + "num_tokens": 80431691.0, + "step": 23640 + }, + { + "epoch": 0.23736400497812035, + "learning_rate": 0.00015252920631097193, + "loss": 0.7832, + "mean_token_accuracy": 0.7693206608295441, + "num_tokens": 80464821.0, + "step": 23650 + }, + { + "epoch": 0.23746437030792084, + "learning_rate": 0.00015250913324501187, + "loss": 0.7436, + "mean_token_accuracy": 0.7709475219249725, + "num_tokens": 80499063.0, + "step": 23660 + }, + { + "epoch": 0.23756473563772132, + "learning_rate": 0.00015248906017905175, + "loss": 0.7716, + "mean_token_accuracy": 0.7674477159976959, + "num_tokens": 80533670.0, + "step": 23670 + }, + { + "epoch": 0.23766510096752178, + "learning_rate": 0.00015246898711309166, + "loss": 0.7706, + "mean_token_accuracy": 0.7716367185115814, + "num_tokens": 80567369.0, + "step": 23680 + }, + { + "epoch": 0.23776546629732226, + "learning_rate": 0.00015244891404713156, + "loss": 0.7813, + "mean_token_accuracy": 0.7622873067855835, + "num_tokens": 80601216.0, + "step": 23690 + }, + { + "epoch": 0.23786583162712271, + "learning_rate": 0.00015242884098117147, + "loss": 0.7957, + "mean_token_accuracy": 0.7627099812030792, + "num_tokens": 80634983.0, + "step": 23700 + }, + { + "epoch": 0.2379661969569232, + "learning_rate": 0.00015240876791521138, + "loss": 0.7663, + "mean_token_accuracy": 0.7720392763614654, + "num_tokens": 80668706.0, + "step": 23710 + }, + { + "epoch": 0.23806656228672368, + "learning_rate": 0.0001523886948492513, + "loss": 0.7461, + "mean_token_accuracy": 0.7805128991603851, + "num_tokens": 80702813.0, + "step": 23720 + }, + { + "epoch": 0.23816692761652414, + "learning_rate": 0.0001523686217832912, + "loss": 0.7692, + "mean_token_accuracy": 0.7717490255832672, + "num_tokens": 80736386.0, + "step": 23730 + }, + { + "epoch": 0.23826729294632462, + "learning_rate": 0.00015234854871733108, + "loss": 0.7556, + "mean_token_accuracy": 0.7743633389472961, + "num_tokens": 80769866.0, + "step": 23740 + }, + { + "epoch": 0.2383676582761251, + "learning_rate": 0.00015232847565137101, + "loss": 0.7392, + "mean_token_accuracy": 0.7824662148952484, + "num_tokens": 80804598.0, + "step": 23750 + }, + { + "epoch": 0.23846802360592556, + "learning_rate": 0.0001523084025854109, + "loss": 0.7772, + "mean_token_accuracy": 0.7698829948902131, + "num_tokens": 80839414.0, + "step": 23760 + }, + { + "epoch": 0.23856838893572604, + "learning_rate": 0.0001522883295194508, + "loss": 0.758, + "mean_token_accuracy": 0.7751199185848237, + "num_tokens": 80873310.0, + "step": 23770 + }, + { + "epoch": 0.23866875426552653, + "learning_rate": 0.0001522682564534907, + "loss": 0.7705, + "mean_token_accuracy": 0.7692757785320282, + "num_tokens": 80907353.0, + "step": 23780 + }, + { + "epoch": 0.23876911959532698, + "learning_rate": 0.00015224818338753062, + "loss": 0.7719, + "mean_token_accuracy": 0.7673554956912995, + "num_tokens": 80941677.0, + "step": 23790 + }, + { + "epoch": 0.23886948492512747, + "learning_rate": 0.0001522281103215705, + "loss": 0.7576, + "mean_token_accuracy": 0.7721669137477875, + "num_tokens": 80975300.0, + "step": 23800 + }, + { + "epoch": 0.23896985025492795, + "learning_rate": 0.00015220803725561044, + "loss": 0.7427, + "mean_token_accuracy": 0.7750360429286957, + "num_tokens": 81009743.0, + "step": 23810 + }, + { + "epoch": 0.2390702155847284, + "learning_rate": 0.00015218796418965035, + "loss": 0.7502, + "mean_token_accuracy": 0.7714247167110443, + "num_tokens": 81043156.0, + "step": 23820 + }, + { + "epoch": 0.2391705809145289, + "learning_rate": 0.00015216789112369023, + "loss": 0.7379, + "mean_token_accuracy": 0.7796186149120331, + "num_tokens": 81077157.0, + "step": 23830 + }, + { + "epoch": 0.23927094624432935, + "learning_rate": 0.00015214781805773016, + "loss": 0.7561, + "mean_token_accuracy": 0.7781562328338623, + "num_tokens": 81111061.0, + "step": 23840 + }, + { + "epoch": 0.23937131157412983, + "learning_rate": 0.00015212774499177005, + "loss": 0.7717, + "mean_token_accuracy": 0.7698342204093933, + "num_tokens": 81144849.0, + "step": 23850 + }, + { + "epoch": 0.23947167690393031, + "learning_rate": 0.00015210767192580995, + "loss": 0.7429, + "mean_token_accuracy": 0.7787699818611145, + "num_tokens": 81178995.0, + "step": 23860 + }, + { + "epoch": 0.23957204223373077, + "learning_rate": 0.00015208759885984986, + "loss": 0.7224, + "mean_token_accuracy": 0.7845096230506897, + "num_tokens": 81212540.0, + "step": 23870 + }, + { + "epoch": 0.23967240756353125, + "learning_rate": 0.00015206752579388977, + "loss": 0.7611, + "mean_token_accuracy": 0.7693464875221252, + "num_tokens": 81245572.0, + "step": 23880 + }, + { + "epoch": 0.23977277289333174, + "learning_rate": 0.00015204745272792965, + "loss": 0.7845, + "mean_token_accuracy": 0.7700681567192078, + "num_tokens": 81279958.0, + "step": 23890 + }, + { + "epoch": 0.2398731382231322, + "learning_rate": 0.0001520273796619696, + "loss": 0.7998, + "mean_token_accuracy": 0.7623650908470154, + "num_tokens": 81314120.0, + "step": 23900 + }, + { + "epoch": 0.23997350355293268, + "learning_rate": 0.00015200730659600947, + "loss": 0.7459, + "mean_token_accuracy": 0.7785841584205627, + "num_tokens": 81348417.0, + "step": 23910 + }, + { + "epoch": 0.24007386888273316, + "learning_rate": 0.00015198723353004938, + "loss": 0.7728, + "mean_token_accuracy": 0.7697364985942841, + "num_tokens": 81382691.0, + "step": 23920 + }, + { + "epoch": 0.24017423421253362, + "learning_rate": 0.00015196716046408929, + "loss": 0.7579, + "mean_token_accuracy": 0.7758682548999787, + "num_tokens": 81416407.0, + "step": 23930 + }, + { + "epoch": 0.2402745995423341, + "learning_rate": 0.0001519470873981292, + "loss": 0.758, + "mean_token_accuracy": 0.7686584532260895, + "num_tokens": 81450577.0, + "step": 23940 + }, + { + "epoch": 0.24037496487213458, + "learning_rate": 0.0001519270143321691, + "loss": 0.7846, + "mean_token_accuracy": 0.7708744466304779, + "num_tokens": 81483488.0, + "step": 23950 + }, + { + "epoch": 0.24047533020193504, + "learning_rate": 0.000151906941266209, + "loss": 0.7611, + "mean_token_accuracy": 0.7697698056697846, + "num_tokens": 81517080.0, + "step": 23960 + }, + { + "epoch": 0.24057569553173552, + "learning_rate": 0.00015188686820024892, + "loss": 0.7582, + "mean_token_accuracy": 0.7723502278327942, + "num_tokens": 81550744.0, + "step": 23970 + }, + { + "epoch": 0.24067606086153598, + "learning_rate": 0.0001518667951342888, + "loss": 0.7491, + "mean_token_accuracy": 0.7779267430305481, + "num_tokens": 81583661.0, + "step": 23980 + }, + { + "epoch": 0.24077642619133646, + "learning_rate": 0.00015184672206832874, + "loss": 0.7448, + "mean_token_accuracy": 0.7716735482215882, + "num_tokens": 81617350.0, + "step": 23990 + }, + { + "epoch": 0.24087679152113695, + "learning_rate": 0.00015182664900236862, + "loss": 0.7594, + "mean_token_accuracy": 0.7715551853179932, + "num_tokens": 81652052.0, + "step": 24000 + }, + { + "epoch": 0.2409771568509374, + "learning_rate": 0.00015180657593640853, + "loss": 0.752, + "mean_token_accuracy": 0.7722446501255036, + "num_tokens": 81686582.0, + "step": 24010 + }, + { + "epoch": 0.24107752218073789, + "learning_rate": 0.00015178650287044843, + "loss": 0.7922, + "mean_token_accuracy": 0.7614984273910522, + "num_tokens": 81720532.0, + "step": 24020 + }, + { + "epoch": 0.24117788751053837, + "learning_rate": 0.00015176642980448834, + "loss": 0.7255, + "mean_token_accuracy": 0.7767630457878113, + "num_tokens": 81753436.0, + "step": 24030 + }, + { + "epoch": 0.24127825284033882, + "learning_rate": 0.00015174635673852825, + "loss": 0.7811, + "mean_token_accuracy": 0.7708664476871491, + "num_tokens": 81786624.0, + "step": 24040 + }, + { + "epoch": 0.2413786181701393, + "learning_rate": 0.00015172628367256816, + "loss": 0.7344, + "mean_token_accuracy": 0.7771263420581818, + "num_tokens": 81820742.0, + "step": 24050 + }, + { + "epoch": 0.2414789834999398, + "learning_rate": 0.00015170621060660807, + "loss": 0.7361, + "mean_token_accuracy": 0.7774999976158142, + "num_tokens": 81854862.0, + "step": 24060 + }, + { + "epoch": 0.24157934882974025, + "learning_rate": 0.00015168613754064798, + "loss": 0.7712, + "mean_token_accuracy": 0.7666206061840057, + "num_tokens": 81889274.0, + "step": 24070 + }, + { + "epoch": 0.24167971415954073, + "learning_rate": 0.00015166606447468788, + "loss": 0.7633, + "mean_token_accuracy": 0.7750555813312531, + "num_tokens": 81923286.0, + "step": 24080 + }, + { + "epoch": 0.24178007948934122, + "learning_rate": 0.00015164599140872777, + "loss": 0.7728, + "mean_token_accuracy": 0.7750057756900788, + "num_tokens": 81957647.0, + "step": 24090 + }, + { + "epoch": 0.24188044481914167, + "learning_rate": 0.0001516259183427677, + "loss": 0.7657, + "mean_token_accuracy": 0.7737397193908692, + "num_tokens": 81992262.0, + "step": 24100 + }, + { + "epoch": 0.24198081014894215, + "learning_rate": 0.00015160584527680758, + "loss": 0.7723, + "mean_token_accuracy": 0.7746361017227172, + "num_tokens": 82026134.0, + "step": 24110 + }, + { + "epoch": 0.2420811754787426, + "learning_rate": 0.0001515857722108475, + "loss": 0.7493, + "mean_token_accuracy": 0.7760856509208679, + "num_tokens": 82059412.0, + "step": 24120 + }, + { + "epoch": 0.2421815408085431, + "learning_rate": 0.0001515656991448874, + "loss": 0.7867, + "mean_token_accuracy": 0.7642060816287994, + "num_tokens": 82093614.0, + "step": 24130 + }, + { + "epoch": 0.24228190613834358, + "learning_rate": 0.0001515456260789273, + "loss": 0.7614, + "mean_token_accuracy": 0.7733182191848755, + "num_tokens": 82127152.0, + "step": 24140 + }, + { + "epoch": 0.24238227146814403, + "learning_rate": 0.0001515255530129672, + "loss": 0.7538, + "mean_token_accuracy": 0.7726780831813812, + "num_tokens": 82161045.0, + "step": 24150 + }, + { + "epoch": 0.24248263679794452, + "learning_rate": 0.00015150547994700713, + "loss": 0.7609, + "mean_token_accuracy": 0.7732154488563537, + "num_tokens": 82195039.0, + "step": 24160 + }, + { + "epoch": 0.242583002127745, + "learning_rate": 0.00015148540688104703, + "loss": 0.7853, + "mean_token_accuracy": 0.7675738036632538, + "num_tokens": 82229105.0, + "step": 24170 + }, + { + "epoch": 0.24268336745754546, + "learning_rate": 0.00015146533381508692, + "loss": 0.7686, + "mean_token_accuracy": 0.7697836279869079, + "num_tokens": 82262613.0, + "step": 24180 + }, + { + "epoch": 0.24278373278734594, + "learning_rate": 0.00015144526074912685, + "loss": 0.7689, + "mean_token_accuracy": 0.7739278435707092, + "num_tokens": 82296703.0, + "step": 24190 + }, + { + "epoch": 0.24288409811714642, + "learning_rate": 0.00015142518768316673, + "loss": 0.7673, + "mean_token_accuracy": 0.7727110087871552, + "num_tokens": 82331068.0, + "step": 24200 + }, + { + "epoch": 0.24298446344694688, + "learning_rate": 0.00015140511461720664, + "loss": 0.7503, + "mean_token_accuracy": 0.7769576132297515, + "num_tokens": 82364505.0, + "step": 24210 + }, + { + "epoch": 0.24308482877674736, + "learning_rate": 0.00015138504155124655, + "loss": 0.745, + "mean_token_accuracy": 0.7776174426078797, + "num_tokens": 82398500.0, + "step": 24220 + }, + { + "epoch": 0.24318519410654785, + "learning_rate": 0.00015136496848528646, + "loss": 0.7814, + "mean_token_accuracy": 0.7694048345088959, + "num_tokens": 82431808.0, + "step": 24230 + }, + { + "epoch": 0.2432855594363483, + "learning_rate": 0.00015134489541932634, + "loss": 0.7956, + "mean_token_accuracy": 0.7689190626144409, + "num_tokens": 82466117.0, + "step": 24240 + }, + { + "epoch": 0.2433859247661488, + "learning_rate": 0.00015132482235336627, + "loss": 0.7453, + "mean_token_accuracy": 0.780043751001358, + "num_tokens": 82500190.0, + "step": 24250 + }, + { + "epoch": 0.24348629009594924, + "learning_rate": 0.00015130474928740616, + "loss": 0.7847, + "mean_token_accuracy": 0.7688788890838623, + "num_tokens": 82533370.0, + "step": 24260 + }, + { + "epoch": 0.24358665542574973, + "learning_rate": 0.00015128467622144606, + "loss": 0.7662, + "mean_token_accuracy": 0.7725997388362884, + "num_tokens": 82567679.0, + "step": 24270 + }, + { + "epoch": 0.2436870207555502, + "learning_rate": 0.00015126460315548597, + "loss": 0.7745, + "mean_token_accuracy": 0.77141774892807, + "num_tokens": 82601856.0, + "step": 24280 + }, + { + "epoch": 0.24378738608535067, + "learning_rate": 0.00015124453008952588, + "loss": 0.7621, + "mean_token_accuracy": 0.7707475662231446, + "num_tokens": 82635356.0, + "step": 24290 + }, + { + "epoch": 0.24388775141515115, + "learning_rate": 0.0001512244570235658, + "loss": 0.7545, + "mean_token_accuracy": 0.7701977491378784, + "num_tokens": 82669879.0, + "step": 24300 + }, + { + "epoch": 0.24398811674495163, + "learning_rate": 0.0001512043839576057, + "loss": 0.7599, + "mean_token_accuracy": 0.7706035733222961, + "num_tokens": 82704522.0, + "step": 24310 + }, + { + "epoch": 0.2440884820747521, + "learning_rate": 0.0001511843108916456, + "loss": 0.7971, + "mean_token_accuracy": 0.7634208917617797, + "num_tokens": 82737999.0, + "step": 24320 + }, + { + "epoch": 0.24418884740455257, + "learning_rate": 0.0001511642378256855, + "loss": 0.7596, + "mean_token_accuracy": 0.778376430273056, + "num_tokens": 82771533.0, + "step": 24330 + }, + { + "epoch": 0.24428921273435306, + "learning_rate": 0.00015114416475972542, + "loss": 0.7487, + "mean_token_accuracy": 0.7745313465595245, + "num_tokens": 82805949.0, + "step": 24340 + }, + { + "epoch": 0.2443895780641535, + "learning_rate": 0.0001511240916937653, + "loss": 0.7667, + "mean_token_accuracy": 0.7709367036819458, + "num_tokens": 82840834.0, + "step": 24350 + }, + { + "epoch": 0.244489943393954, + "learning_rate": 0.0001511040186278052, + "loss": 0.7546, + "mean_token_accuracy": 0.7755620777606964, + "num_tokens": 82874182.0, + "step": 24360 + }, + { + "epoch": 0.24459030872375448, + "learning_rate": 0.00015108394556184512, + "loss": 0.7832, + "mean_token_accuracy": 0.7668637633323669, + "num_tokens": 82907934.0, + "step": 24370 + }, + { + "epoch": 0.24469067405355494, + "learning_rate": 0.00015106387249588503, + "loss": 0.7701, + "mean_token_accuracy": 0.7740091979503632, + "num_tokens": 82942363.0, + "step": 24380 + }, + { + "epoch": 0.24479103938335542, + "learning_rate": 0.00015104379942992494, + "loss": 0.7596, + "mean_token_accuracy": 0.775358909368515, + "num_tokens": 82976781.0, + "step": 24390 + }, + { + "epoch": 0.24489140471315587, + "learning_rate": 0.00015102372636396485, + "loss": 0.7905, + "mean_token_accuracy": 0.7667368113994598, + "num_tokens": 83010721.0, + "step": 24400 + }, + { + "epoch": 0.24499177004295636, + "learning_rate": 0.00015100365329800475, + "loss": 0.7485, + "mean_token_accuracy": 0.7746308982372284, + "num_tokens": 83044831.0, + "step": 24410 + }, + { + "epoch": 0.24509213537275684, + "learning_rate": 0.00015098358023204464, + "loss": 0.7526, + "mean_token_accuracy": 0.7761373102664948, + "num_tokens": 83078730.0, + "step": 24420 + }, + { + "epoch": 0.2451925007025573, + "learning_rate": 0.00015096350716608457, + "loss": 0.7553, + "mean_token_accuracy": 0.7750726759433746, + "num_tokens": 83112963.0, + "step": 24430 + }, + { + "epoch": 0.24529286603235778, + "learning_rate": 0.00015094343410012445, + "loss": 0.7528, + "mean_token_accuracy": 0.7696741640567779, + "num_tokens": 83146238.0, + "step": 24440 + }, + { + "epoch": 0.24539323136215827, + "learning_rate": 0.00015092336103416436, + "loss": 0.7571, + "mean_token_accuracy": 0.7693495810031891, + "num_tokens": 83179916.0, + "step": 24450 + }, + { + "epoch": 0.24549359669195872, + "learning_rate": 0.00015090328796820427, + "loss": 0.7639, + "mean_token_accuracy": 0.7746648609638214, + "num_tokens": 83214052.0, + "step": 24460 + }, + { + "epoch": 0.2455939620217592, + "learning_rate": 0.00015088321490224418, + "loss": 0.7327, + "mean_token_accuracy": 0.7817089438438416, + "num_tokens": 83248328.0, + "step": 24470 + }, + { + "epoch": 0.2456943273515597, + "learning_rate": 0.00015086314183628406, + "loss": 0.7763, + "mean_token_accuracy": 0.7671709716320038, + "num_tokens": 83281506.0, + "step": 24480 + }, + { + "epoch": 0.24579469268136014, + "learning_rate": 0.000150843068770324, + "loss": 0.7817, + "mean_token_accuracy": 0.7677108585834503, + "num_tokens": 83315624.0, + "step": 24490 + }, + { + "epoch": 0.24589505801116063, + "learning_rate": 0.00015082299570436388, + "loss": 0.7814, + "mean_token_accuracy": 0.7697063982486725, + "num_tokens": 83349795.0, + "step": 24500 + }, + { + "epoch": 0.2459954233409611, + "learning_rate": 0.00015080292263840378, + "loss": 0.7506, + "mean_token_accuracy": 0.7754936277866363, + "num_tokens": 83383555.0, + "step": 24510 + }, + { + "epoch": 0.24609578867076157, + "learning_rate": 0.00015078284957244372, + "loss": 0.7845, + "mean_token_accuracy": 0.7674134135246277, + "num_tokens": 83417458.0, + "step": 24520 + }, + { + "epoch": 0.24619615400056205, + "learning_rate": 0.0001507627765064836, + "loss": 0.7682, + "mean_token_accuracy": 0.7745970547199249, + "num_tokens": 83452068.0, + "step": 24530 + }, + { + "epoch": 0.2462965193303625, + "learning_rate": 0.0001507427034405235, + "loss": 0.7397, + "mean_token_accuracy": 0.7787245750427246, + "num_tokens": 83486232.0, + "step": 24540 + }, + { + "epoch": 0.246396884660163, + "learning_rate": 0.00015072263037456342, + "loss": 0.7854, + "mean_token_accuracy": 0.7659784495830536, + "num_tokens": 83520412.0, + "step": 24550 + }, + { + "epoch": 0.24649724998996347, + "learning_rate": 0.00015070255730860333, + "loss": 0.7673, + "mean_token_accuracy": 0.7728880882263184, + "num_tokens": 83554383.0, + "step": 24560 + }, + { + "epoch": 0.24659761531976393, + "learning_rate": 0.0001506824842426432, + "loss": 0.7763, + "mean_token_accuracy": 0.7732985317707062, + "num_tokens": 83588112.0, + "step": 24570 + }, + { + "epoch": 0.2466979806495644, + "learning_rate": 0.00015066241117668314, + "loss": 0.7909, + "mean_token_accuracy": 0.7652292132377625, + "num_tokens": 83622427.0, + "step": 24580 + }, + { + "epoch": 0.2467983459793649, + "learning_rate": 0.00015064233811072303, + "loss": 0.7231, + "mean_token_accuracy": 0.7823591709136963, + "num_tokens": 83656834.0, + "step": 24590 + }, + { + "epoch": 0.24689871130916535, + "learning_rate": 0.00015062226504476293, + "loss": 0.7636, + "mean_token_accuracy": 0.7728028655052185, + "num_tokens": 83690537.0, + "step": 24600 + }, + { + "epoch": 0.24699907663896584, + "learning_rate": 0.00015060219197880284, + "loss": 0.7269, + "mean_token_accuracy": 0.7785695910453796, + "num_tokens": 83724980.0, + "step": 24610 + }, + { + "epoch": 0.24709944196876632, + "learning_rate": 0.00015058211891284275, + "loss": 0.7324, + "mean_token_accuracy": 0.7791578233242035, + "num_tokens": 83759574.0, + "step": 24620 + }, + { + "epoch": 0.24719980729856678, + "learning_rate": 0.00015056204584688266, + "loss": 0.7934, + "mean_token_accuracy": 0.7672521889209747, + "num_tokens": 83793398.0, + "step": 24630 + }, + { + "epoch": 0.24730017262836726, + "learning_rate": 0.00015054197278092257, + "loss": 0.7527, + "mean_token_accuracy": 0.7744177103042602, + "num_tokens": 83828140.0, + "step": 24640 + }, + { + "epoch": 0.24740053795816774, + "learning_rate": 0.00015052189971496248, + "loss": 0.7684, + "mean_token_accuracy": 0.768083530664444, + "num_tokens": 83862329.0, + "step": 24650 + }, + { + "epoch": 0.2475009032879682, + "learning_rate": 0.00015050182664900238, + "loss": 0.7745, + "mean_token_accuracy": 0.7712616503238678, + "num_tokens": 83896804.0, + "step": 24660 + }, + { + "epoch": 0.24760126861776868, + "learning_rate": 0.0001504817535830423, + "loss": 0.7643, + "mean_token_accuracy": 0.7727303802967072, + "num_tokens": 83931689.0, + "step": 24670 + }, + { + "epoch": 0.24770163394756914, + "learning_rate": 0.00015046168051708217, + "loss": 0.7554, + "mean_token_accuracy": 0.7718530833721161, + "num_tokens": 83965817.0, + "step": 24680 + }, + { + "epoch": 0.24780199927736962, + "learning_rate": 0.0001504416074511221, + "loss": 0.766, + "mean_token_accuracy": 0.7704915702342987, + "num_tokens": 83999083.0, + "step": 24690 + }, + { + "epoch": 0.2479023646071701, + "learning_rate": 0.000150421534385162, + "loss": 0.7429, + "mean_token_accuracy": 0.7724758744239807, + "num_tokens": 84033306.0, + "step": 24700 + }, + { + "epoch": 0.24800272993697056, + "learning_rate": 0.0001504014613192019, + "loss": 0.7658, + "mean_token_accuracy": 0.7693391263484954, + "num_tokens": 84066880.0, + "step": 24710 + }, + { + "epoch": 0.24810309526677105, + "learning_rate": 0.0001503813882532418, + "loss": 0.7494, + "mean_token_accuracy": 0.770747721195221, + "num_tokens": 84100580.0, + "step": 24720 + }, + { + "epoch": 0.24820346059657153, + "learning_rate": 0.00015036131518728172, + "loss": 0.7875, + "mean_token_accuracy": 0.7645402133464814, + "num_tokens": 84134540.0, + "step": 24730 + }, + { + "epoch": 0.24830382592637198, + "learning_rate": 0.00015034124212132162, + "loss": 0.7692, + "mean_token_accuracy": 0.7743058323860168, + "num_tokens": 84168575.0, + "step": 24740 + }, + { + "epoch": 0.24840419125617247, + "learning_rate": 0.00015032116905536153, + "loss": 0.7812, + "mean_token_accuracy": 0.766360980272293, + "num_tokens": 84202924.0, + "step": 24750 + }, + { + "epoch": 0.24850455658597295, + "learning_rate": 0.00015030109598940144, + "loss": 0.7697, + "mean_token_accuracy": 0.7704414248466491, + "num_tokens": 84237238.0, + "step": 24760 + }, + { + "epoch": 0.2486049219157734, + "learning_rate": 0.00015028102292344132, + "loss": 0.7391, + "mean_token_accuracy": 0.7736336052417755, + "num_tokens": 84271592.0, + "step": 24770 + }, + { + "epoch": 0.2487052872455739, + "learning_rate": 0.00015026094985748126, + "loss": 0.7559, + "mean_token_accuracy": 0.7742735326290131, + "num_tokens": 84305917.0, + "step": 24780 + }, + { + "epoch": 0.24880565257537438, + "learning_rate": 0.00015024087679152114, + "loss": 0.7626, + "mean_token_accuracy": 0.7742458462715149, + "num_tokens": 84339607.0, + "step": 24790 + }, + { + "epoch": 0.24890601790517483, + "learning_rate": 0.00015022080372556105, + "loss": 0.7454, + "mean_token_accuracy": 0.7744569897651672, + "num_tokens": 84374014.0, + "step": 24800 + }, + { + "epoch": 0.24900638323497531, + "learning_rate": 0.00015020073065960096, + "loss": 0.78, + "mean_token_accuracy": 0.7679212808609008, + "num_tokens": 84407966.0, + "step": 24810 + }, + { + "epoch": 0.24910674856477577, + "learning_rate": 0.00015018065759364087, + "loss": 0.7903, + "mean_token_accuracy": 0.7653574228286744, + "num_tokens": 84442126.0, + "step": 24820 + }, + { + "epoch": 0.24920711389457625, + "learning_rate": 0.00015016058452768075, + "loss": 0.7613, + "mean_token_accuracy": 0.7751851081848145, + "num_tokens": 84476405.0, + "step": 24830 + }, + { + "epoch": 0.24930747922437674, + "learning_rate": 0.00015014051146172068, + "loss": 0.7459, + "mean_token_accuracy": 0.7735485136508942, + "num_tokens": 84510655.0, + "step": 24840 + }, + { + "epoch": 0.2494078445541772, + "learning_rate": 0.00015012043839576056, + "loss": 0.7649, + "mean_token_accuracy": 0.7721766114234925, + "num_tokens": 84544543.0, + "step": 24850 + }, + { + "epoch": 0.24950820988397768, + "learning_rate": 0.00015010036532980047, + "loss": 0.7673, + "mean_token_accuracy": 0.7733584702014923, + "num_tokens": 84578016.0, + "step": 24860 + }, + { + "epoch": 0.24960857521377816, + "learning_rate": 0.0001500802922638404, + "loss": 0.7727, + "mean_token_accuracy": 0.7719229996204376, + "num_tokens": 84612899.0, + "step": 24870 + }, + { + "epoch": 0.24970894054357862, + "learning_rate": 0.0001500602191978803, + "loss": 0.7685, + "mean_token_accuracy": 0.769759064912796, + "num_tokens": 84647798.0, + "step": 24880 + }, + { + "epoch": 0.2498093058733791, + "learning_rate": 0.0001500401461319202, + "loss": 0.754, + "mean_token_accuracy": 0.7807211995124816, + "num_tokens": 84682489.0, + "step": 24890 + }, + { + "epoch": 0.24990967120317958, + "learning_rate": 0.0001500200730659601, + "loss": 0.7634, + "mean_token_accuracy": 0.7719671905040741, + "num_tokens": 84716528.0, + "step": 24900 + }, + { + "epoch": 0.25001003653298004, + "learning_rate": 0.00015000000000000001, + "loss": 0.7432, + "mean_token_accuracy": 0.7741679668426513, + "num_tokens": 84750516.0, + "step": 24910 + }, + { + "epoch": 0.2501104018627805, + "learning_rate": 0.0001499799269340399, + "loss": 0.7741, + "mean_token_accuracy": 0.769940984249115, + "num_tokens": 84784272.0, + "step": 24920 + }, + { + "epoch": 0.250210767192581, + "learning_rate": 0.00014995985386807983, + "loss": 0.7687, + "mean_token_accuracy": 0.7691887438297271, + "num_tokens": 84819003.0, + "step": 24930 + }, + { + "epoch": 0.25031113252238146, + "learning_rate": 0.0001499397808021197, + "loss": 0.7266, + "mean_token_accuracy": 0.7773842871189117, + "num_tokens": 84852763.0, + "step": 24940 + }, + { + "epoch": 0.2504114978521819, + "learning_rate": 0.00014991970773615962, + "loss": 0.7593, + "mean_token_accuracy": 0.7744570195674896, + "num_tokens": 84886921.0, + "step": 24950 + }, + { + "epoch": 0.25051186318198243, + "learning_rate": 0.00014989963467019953, + "loss": 0.7699, + "mean_token_accuracy": 0.7752615630626678, + "num_tokens": 84921113.0, + "step": 24960 + }, + { + "epoch": 0.2506122285117829, + "learning_rate": 0.00014987956160423944, + "loss": 0.7212, + "mean_token_accuracy": 0.7837283551692963, + "num_tokens": 84955449.0, + "step": 24970 + }, + { + "epoch": 0.25071259384158334, + "learning_rate": 0.00014985948853827935, + "loss": 0.7636, + "mean_token_accuracy": 0.7748461961746216, + "num_tokens": 84989985.0, + "step": 24980 + }, + { + "epoch": 0.25081295917138385, + "learning_rate": 0.00014983941547231925, + "loss": 0.7679, + "mean_token_accuracy": 0.7788638472557068, + "num_tokens": 85023754.0, + "step": 24990 + }, + { + "epoch": 0.2509133245011843, + "learning_rate": 0.00014981934240635916, + "loss": 0.7541, + "mean_token_accuracy": 0.7738966584205628, + "num_tokens": 85057485.0, + "step": 25000 + }, + { + "epoch": 0.25101368983098477, + "learning_rate": 0.00014979926934039904, + "loss": 0.7717, + "mean_token_accuracy": 0.7705737590789795, + "num_tokens": 85092345.0, + "step": 25010 + }, + { + "epoch": 0.2511140551607853, + "learning_rate": 0.00014977919627443898, + "loss": 0.8036, + "mean_token_accuracy": 0.7606657981872559, + "num_tokens": 85126415.0, + "step": 25020 + }, + { + "epoch": 0.25121442049058573, + "learning_rate": 0.00014975912320847886, + "loss": 0.7839, + "mean_token_accuracy": 0.7678379952907562, + "num_tokens": 85160265.0, + "step": 25030 + }, + { + "epoch": 0.2513147858203862, + "learning_rate": 0.00014973905014251877, + "loss": 0.7654, + "mean_token_accuracy": 0.7709371447563171, + "num_tokens": 85194420.0, + "step": 25040 + }, + { + "epoch": 0.2514151511501867, + "learning_rate": 0.00014971897707655868, + "loss": 0.7382, + "mean_token_accuracy": 0.7809635996818542, + "num_tokens": 85227880.0, + "step": 25050 + }, + { + "epoch": 0.25151551647998716, + "learning_rate": 0.00014969890401059859, + "loss": 0.7632, + "mean_token_accuracy": 0.7718024134635926, + "num_tokens": 85261717.0, + "step": 25060 + }, + { + "epoch": 0.2516158818097876, + "learning_rate": 0.0001496788309446385, + "loss": 0.7702, + "mean_token_accuracy": 0.7697980642318726, + "num_tokens": 85295733.0, + "step": 25070 + }, + { + "epoch": 0.2517162471395881, + "learning_rate": 0.0001496587578786784, + "loss": 0.775, + "mean_token_accuracy": 0.771453458070755, + "num_tokens": 85329861.0, + "step": 25080 + }, + { + "epoch": 0.2518166124693886, + "learning_rate": 0.0001496386848127183, + "loss": 0.7659, + "mean_token_accuracy": 0.7687193214893341, + "num_tokens": 85364228.0, + "step": 25090 + }, + { + "epoch": 0.25191697779918903, + "learning_rate": 0.0001496186117467582, + "loss": 0.745, + "mean_token_accuracy": 0.7802204549312591, + "num_tokens": 85397878.0, + "step": 25100 + }, + { + "epoch": 0.25201734312898955, + "learning_rate": 0.00014959853868079813, + "loss": 0.7364, + "mean_token_accuracy": 0.7754930555820465, + "num_tokens": 85431906.0, + "step": 25110 + }, + { + "epoch": 0.25211770845879, + "learning_rate": 0.000149578465614838, + "loss": 0.8023, + "mean_token_accuracy": 0.7620309591293335, + "num_tokens": 85466672.0, + "step": 25120 + }, + { + "epoch": 0.25221807378859046, + "learning_rate": 0.00014955839254887792, + "loss": 0.7639, + "mean_token_accuracy": 0.7732936799526214, + "num_tokens": 85501948.0, + "step": 25130 + }, + { + "epoch": 0.25231843911839097, + "learning_rate": 0.00014953831948291783, + "loss": 0.7285, + "mean_token_accuracy": 0.7803778707981109, + "num_tokens": 85535594.0, + "step": 25140 + }, + { + "epoch": 0.2524188044481914, + "learning_rate": 0.00014951824641695774, + "loss": 0.7729, + "mean_token_accuracy": 0.7724705159664154, + "num_tokens": 85570745.0, + "step": 25150 + }, + { + "epoch": 0.2525191697779919, + "learning_rate": 0.00014949817335099762, + "loss": 0.7769, + "mean_token_accuracy": 0.7735279023647308, + "num_tokens": 85604587.0, + "step": 25160 + }, + { + "epoch": 0.25261953510779234, + "learning_rate": 0.00014947810028503755, + "loss": 0.7619, + "mean_token_accuracy": 0.7704692482948303, + "num_tokens": 85638073.0, + "step": 25170 + }, + { + "epoch": 0.25271990043759285, + "learning_rate": 0.00014945802721907743, + "loss": 0.7564, + "mean_token_accuracy": 0.7743849337100983, + "num_tokens": 85671963.0, + "step": 25180 + }, + { + "epoch": 0.2528202657673933, + "learning_rate": 0.00014943795415311734, + "loss": 0.7575, + "mean_token_accuracy": 0.774717116355896, + "num_tokens": 85706538.0, + "step": 25190 + }, + { + "epoch": 0.25292063109719376, + "learning_rate": 0.00014941788108715725, + "loss": 0.7468, + "mean_token_accuracy": 0.7788683176040649, + "num_tokens": 85740414.0, + "step": 25200 + }, + { + "epoch": 0.25302099642699427, + "learning_rate": 0.00014939780802119716, + "loss": 0.7752, + "mean_token_accuracy": 0.7676084637641907, + "num_tokens": 85774633.0, + "step": 25210 + }, + { + "epoch": 0.2531213617567947, + "learning_rate": 0.0001493777349552371, + "loss": 0.749, + "mean_token_accuracy": 0.7740694999694824, + "num_tokens": 85808692.0, + "step": 25220 + }, + { + "epoch": 0.2532217270865952, + "learning_rate": 0.00014935766188927698, + "loss": 0.7251, + "mean_token_accuracy": 0.7860980331897736, + "num_tokens": 85842126.0, + "step": 25230 + }, + { + "epoch": 0.2533220924163957, + "learning_rate": 0.00014933758882331688, + "loss": 0.7751, + "mean_token_accuracy": 0.7714491665363312, + "num_tokens": 85875593.0, + "step": 25240 + }, + { + "epoch": 0.25342245774619615, + "learning_rate": 0.0001493175157573568, + "loss": 0.7671, + "mean_token_accuracy": 0.7751310586929321, + "num_tokens": 85909507.0, + "step": 25250 + }, + { + "epoch": 0.2535228230759966, + "learning_rate": 0.0001492974426913967, + "loss": 0.7596, + "mean_token_accuracy": 0.7769211292266845, + "num_tokens": 85943937.0, + "step": 25260 + }, + { + "epoch": 0.2536231884057971, + "learning_rate": 0.00014927736962543658, + "loss": 0.7508, + "mean_token_accuracy": 0.7736414492130279, + "num_tokens": 85977417.0, + "step": 25270 + }, + { + "epoch": 0.2537235537355976, + "learning_rate": 0.00014925729655947652, + "loss": 0.8044, + "mean_token_accuracy": 0.7656659841537475, + "num_tokens": 86010732.0, + "step": 25280 + }, + { + "epoch": 0.25382391906539803, + "learning_rate": 0.0001492372234935164, + "loss": 0.7445, + "mean_token_accuracy": 0.7763683319091796, + "num_tokens": 86044764.0, + "step": 25290 + }, + { + "epoch": 0.25392428439519854, + "learning_rate": 0.0001492171504275563, + "loss": 0.7432, + "mean_token_accuracy": 0.7775234937667846, + "num_tokens": 86078781.0, + "step": 25300 + }, + { + "epoch": 0.254024649724999, + "learning_rate": 0.00014919707736159622, + "loss": 0.7654, + "mean_token_accuracy": 0.7700466334819793, + "num_tokens": 86113326.0, + "step": 25310 + }, + { + "epoch": 0.25412501505479945, + "learning_rate": 0.00014917700429563612, + "loss": 0.7856, + "mean_token_accuracy": 0.7683400988578797, + "num_tokens": 86147025.0, + "step": 25320 + }, + { + "epoch": 0.25422538038459996, + "learning_rate": 0.00014915693122967603, + "loss": 0.7414, + "mean_token_accuracy": 0.7748342633247376, + "num_tokens": 86181539.0, + "step": 25330 + }, + { + "epoch": 0.2543257457144004, + "learning_rate": 0.00014913685816371594, + "loss": 0.7805, + "mean_token_accuracy": 0.768756777048111, + "num_tokens": 86215963.0, + "step": 25340 + }, + { + "epoch": 0.2544261110442009, + "learning_rate": 0.00014911678509775585, + "loss": 0.7576, + "mean_token_accuracy": 0.7703627109527588, + "num_tokens": 86249684.0, + "step": 25350 + }, + { + "epoch": 0.2545264763740014, + "learning_rate": 0.00014909671203179573, + "loss": 0.7637, + "mean_token_accuracy": 0.7684246659278869, + "num_tokens": 86282686.0, + "step": 25360 + }, + { + "epoch": 0.25462684170380184, + "learning_rate": 0.00014907663896583567, + "loss": 0.7586, + "mean_token_accuracy": 0.7752669513225555, + "num_tokens": 86317014.0, + "step": 25370 + }, + { + "epoch": 0.2547272070336023, + "learning_rate": 0.00014905656589987555, + "loss": 0.7911, + "mean_token_accuracy": 0.7662883758544922, + "num_tokens": 86351353.0, + "step": 25380 + }, + { + "epoch": 0.2548275723634028, + "learning_rate": 0.00014903649283391546, + "loss": 0.7546, + "mean_token_accuracy": 0.7772423982620239, + "num_tokens": 86385009.0, + "step": 25390 + }, + { + "epoch": 0.25492793769320327, + "learning_rate": 0.00014901641976795536, + "loss": 0.757, + "mean_token_accuracy": 0.776004284620285, + "num_tokens": 86419271.0, + "step": 25400 + }, + { + "epoch": 0.2550283030230037, + "learning_rate": 0.00014899634670199527, + "loss": 0.756, + "mean_token_accuracy": 0.7729967117309571, + "num_tokens": 86453343.0, + "step": 25410 + }, + { + "epoch": 0.25512866835280423, + "learning_rate": 0.00014897627363603518, + "loss": 0.7826, + "mean_token_accuracy": 0.7646670699119568, + "num_tokens": 86487554.0, + "step": 25420 + }, + { + "epoch": 0.2552290336826047, + "learning_rate": 0.0001489562005700751, + "loss": 0.7624, + "mean_token_accuracy": 0.7803102493286133, + "num_tokens": 86521925.0, + "step": 25430 + }, + { + "epoch": 0.25532939901240514, + "learning_rate": 0.000148936127504115, + "loss": 0.7857, + "mean_token_accuracy": 0.7645636975765229, + "num_tokens": 86555158.0, + "step": 25440 + }, + { + "epoch": 0.2554297643422056, + "learning_rate": 0.00014891605443815488, + "loss": 0.7669, + "mean_token_accuracy": 0.7731352686882019, + "num_tokens": 86589507.0, + "step": 25450 + }, + { + "epoch": 0.2555301296720061, + "learning_rate": 0.00014889598137219482, + "loss": 0.7557, + "mean_token_accuracy": 0.7728032350540162, + "num_tokens": 86622919.0, + "step": 25460 + }, + { + "epoch": 0.25563049500180657, + "learning_rate": 0.0001488759083062347, + "loss": 0.8059, + "mean_token_accuracy": 0.7628725171089172, + "num_tokens": 86656473.0, + "step": 25470 + }, + { + "epoch": 0.255730860331607, + "learning_rate": 0.0001488558352402746, + "loss": 0.7713, + "mean_token_accuracy": 0.7711473762989044, + "num_tokens": 86690523.0, + "step": 25480 + }, + { + "epoch": 0.25583122566140754, + "learning_rate": 0.0001488357621743145, + "loss": 0.7745, + "mean_token_accuracy": 0.7721888720989227, + "num_tokens": 86724478.0, + "step": 25490 + }, + { + "epoch": 0.255931590991208, + "learning_rate": 0.00014881568910835442, + "loss": 0.8016, + "mean_token_accuracy": 0.7639282763004303, + "num_tokens": 86757913.0, + "step": 25500 + }, + { + "epoch": 0.25603195632100845, + "learning_rate": 0.0001487956160423943, + "loss": 0.7672, + "mean_token_accuracy": 0.7748159408569336, + "num_tokens": 86791797.0, + "step": 25510 + }, + { + "epoch": 0.25613232165080896, + "learning_rate": 0.00014877554297643424, + "loss": 0.7705, + "mean_token_accuracy": 0.7691547334194183, + "num_tokens": 86825417.0, + "step": 25520 + }, + { + "epoch": 0.2562326869806094, + "learning_rate": 0.00014875546991047412, + "loss": 0.7442, + "mean_token_accuracy": 0.7793104350566864, + "num_tokens": 86858769.0, + "step": 25530 + }, + { + "epoch": 0.25633305231040987, + "learning_rate": 0.00014873539684451403, + "loss": 0.7636, + "mean_token_accuracy": 0.7719816446304322, + "num_tokens": 86892597.0, + "step": 25540 + }, + { + "epoch": 0.2564334176402104, + "learning_rate": 0.00014871532377855394, + "loss": 0.7282, + "mean_token_accuracy": 0.7823039889335632, + "num_tokens": 86926765.0, + "step": 25550 + }, + { + "epoch": 0.25653378297001084, + "learning_rate": 0.00014869525071259385, + "loss": 0.7331, + "mean_token_accuracy": 0.778553056716919, + "num_tokens": 86962121.0, + "step": 25560 + }, + { + "epoch": 0.2566341482998113, + "learning_rate": 0.00014867517764663375, + "loss": 0.7989, + "mean_token_accuracy": 0.7632017970085144, + "num_tokens": 86996587.0, + "step": 25570 + }, + { + "epoch": 0.2567345136296118, + "learning_rate": 0.00014865510458067366, + "loss": 0.8135, + "mean_token_accuracy": 0.7593931913375854, + "num_tokens": 87029765.0, + "step": 25580 + }, + { + "epoch": 0.25683487895941226, + "learning_rate": 0.00014863503151471357, + "loss": 0.7807, + "mean_token_accuracy": 0.7670421421527862, + "num_tokens": 87063804.0, + "step": 25590 + }, + { + "epoch": 0.2569352442892127, + "learning_rate": 0.00014861495844875345, + "loss": 0.7511, + "mean_token_accuracy": 0.7708527326583863, + "num_tokens": 87098792.0, + "step": 25600 + }, + { + "epoch": 0.25703560961901323, + "learning_rate": 0.0001485948853827934, + "loss": 0.7642, + "mean_token_accuracy": 0.7667521178722382, + "num_tokens": 87133042.0, + "step": 25610 + }, + { + "epoch": 0.2571359749488137, + "learning_rate": 0.00014857481231683327, + "loss": 0.7553, + "mean_token_accuracy": 0.7766914963722229, + "num_tokens": 87166899.0, + "step": 25620 + }, + { + "epoch": 0.25723634027861414, + "learning_rate": 0.00014855473925087318, + "loss": 0.7379, + "mean_token_accuracy": 0.7837460577487946, + "num_tokens": 87201686.0, + "step": 25630 + }, + { + "epoch": 0.25733670560841465, + "learning_rate": 0.00014853466618491309, + "loss": 0.7499, + "mean_token_accuracy": 0.7803411364555359, + "num_tokens": 87235747.0, + "step": 25640 + }, + { + "epoch": 0.2574370709382151, + "learning_rate": 0.000148514593118953, + "loss": 0.7564, + "mean_token_accuracy": 0.7728347659111023, + "num_tokens": 87270207.0, + "step": 25650 + }, + { + "epoch": 0.25753743626801556, + "learning_rate": 0.0001484945200529929, + "loss": 0.7546, + "mean_token_accuracy": 0.7803968906402587, + "num_tokens": 87303823.0, + "step": 25660 + }, + { + "epoch": 0.2576378015978161, + "learning_rate": 0.0001484744469870328, + "loss": 0.7389, + "mean_token_accuracy": 0.7769669115543365, + "num_tokens": 87338022.0, + "step": 25670 + }, + { + "epoch": 0.25773816692761653, + "learning_rate": 0.00014845437392107272, + "loss": 0.7527, + "mean_token_accuracy": 0.7749365508556366, + "num_tokens": 87371875.0, + "step": 25680 + }, + { + "epoch": 0.257838532257417, + "learning_rate": 0.0001484343008551126, + "loss": 0.7358, + "mean_token_accuracy": 0.7795381069183349, + "num_tokens": 87406221.0, + "step": 25690 + }, + { + "epoch": 0.2579388975872175, + "learning_rate": 0.00014841422778915254, + "loss": 0.7875, + "mean_token_accuracy": 0.7627764105796814, + "num_tokens": 87440019.0, + "step": 25700 + }, + { + "epoch": 0.25803926291701795, + "learning_rate": 0.00014839415472319242, + "loss": 0.7575, + "mean_token_accuracy": 0.7729061365127563, + "num_tokens": 87473672.0, + "step": 25710 + }, + { + "epoch": 0.2581396282468184, + "learning_rate": 0.00014837408165723233, + "loss": 0.7385, + "mean_token_accuracy": 0.7753385066986084, + "num_tokens": 87507791.0, + "step": 25720 + }, + { + "epoch": 0.2582399935766189, + "learning_rate": 0.00014835400859127223, + "loss": 0.7725, + "mean_token_accuracy": 0.769771808385849, + "num_tokens": 87541696.0, + "step": 25730 + }, + { + "epoch": 0.2583403589064194, + "learning_rate": 0.00014833393552531214, + "loss": 0.7594, + "mean_token_accuracy": 0.7752532303333283, + "num_tokens": 87575872.0, + "step": 25740 + }, + { + "epoch": 0.25844072423621983, + "learning_rate": 0.00014831386245935202, + "loss": 0.7869, + "mean_token_accuracy": 0.7630620658397674, + "num_tokens": 87609585.0, + "step": 25750 + }, + { + "epoch": 0.2585410895660203, + "learning_rate": 0.00014829378939339196, + "loss": 0.7837, + "mean_token_accuracy": 0.7641562402248383, + "num_tokens": 87642769.0, + "step": 25760 + }, + { + "epoch": 0.2586414548958208, + "learning_rate": 0.00014827371632743187, + "loss": 0.7451, + "mean_token_accuracy": 0.7799721121788025, + "num_tokens": 87677019.0, + "step": 25770 + }, + { + "epoch": 0.25874182022562126, + "learning_rate": 0.00014825364326147178, + "loss": 0.7809, + "mean_token_accuracy": 0.7631854057312012, + "num_tokens": 87710569.0, + "step": 25780 + }, + { + "epoch": 0.2588421855554217, + "learning_rate": 0.00014823357019551169, + "loss": 0.7645, + "mean_token_accuracy": 0.768880182504654, + "num_tokens": 87744559.0, + "step": 25790 + }, + { + "epoch": 0.2589425508852222, + "learning_rate": 0.00014821349712955157, + "loss": 0.7331, + "mean_token_accuracy": 0.7779667556285859, + "num_tokens": 87779111.0, + "step": 25800 + }, + { + "epoch": 0.2590429162150227, + "learning_rate": 0.0001481934240635915, + "loss": 0.7628, + "mean_token_accuracy": 0.7720450103282929, + "num_tokens": 87812979.0, + "step": 25810 + }, + { + "epoch": 0.25914328154482313, + "learning_rate": 0.00014817335099763138, + "loss": 0.7678, + "mean_token_accuracy": 0.7701455950737, + "num_tokens": 87846804.0, + "step": 25820 + }, + { + "epoch": 0.25924364687462365, + "learning_rate": 0.0001481532779316713, + "loss": 0.7376, + "mean_token_accuracy": 0.7828764975070953, + "num_tokens": 87880594.0, + "step": 25830 + }, + { + "epoch": 0.2593440122044241, + "learning_rate": 0.0001481332048657112, + "loss": 0.7419, + "mean_token_accuracy": 0.7778504431247711, + "num_tokens": 87915015.0, + "step": 25840 + }, + { + "epoch": 0.25944437753422456, + "learning_rate": 0.0001481131317997511, + "loss": 0.7597, + "mean_token_accuracy": 0.7739579916000366, + "num_tokens": 87949304.0, + "step": 25850 + }, + { + "epoch": 0.25954474286402507, + "learning_rate": 0.000148093058733791, + "loss": 0.7592, + "mean_token_accuracy": 0.7708935976028443, + "num_tokens": 87984007.0, + "step": 25860 + }, + { + "epoch": 0.2596451081938255, + "learning_rate": 0.00014807298566783093, + "loss": 0.7483, + "mean_token_accuracy": 0.7781088590621948, + "num_tokens": 88017751.0, + "step": 25870 + }, + { + "epoch": 0.259745473523626, + "learning_rate": 0.0001480529126018708, + "loss": 0.7626, + "mean_token_accuracy": 0.7717514097690582, + "num_tokens": 88051964.0, + "step": 25880 + }, + { + "epoch": 0.2598458388534265, + "learning_rate": 0.00014803283953591072, + "loss": 0.7754, + "mean_token_accuracy": 0.7723719537258148, + "num_tokens": 88086205.0, + "step": 25890 + }, + { + "epoch": 0.25994620418322695, + "learning_rate": 0.00014801276646995062, + "loss": 0.7677, + "mean_token_accuracy": 0.7652353048324585, + "num_tokens": 88120072.0, + "step": 25900 + }, + { + "epoch": 0.2600465695130274, + "learning_rate": 0.00014799269340399053, + "loss": 0.7664, + "mean_token_accuracy": 0.7733864307403564, + "num_tokens": 88154084.0, + "step": 25910 + }, + { + "epoch": 0.2601469348428279, + "learning_rate": 0.00014797262033803044, + "loss": 0.7458, + "mean_token_accuracy": 0.7812437653541565, + "num_tokens": 88187507.0, + "step": 25920 + }, + { + "epoch": 0.26024730017262837, + "learning_rate": 0.00014795254727207035, + "loss": 0.7518, + "mean_token_accuracy": 0.781405258178711, + "num_tokens": 88222091.0, + "step": 25930 + }, + { + "epoch": 0.2603476655024288, + "learning_rate": 0.00014793247420611026, + "loss": 0.758, + "mean_token_accuracy": 0.7747311294078827, + "num_tokens": 88256756.0, + "step": 25940 + }, + { + "epoch": 0.26044803083222934, + "learning_rate": 0.00014791240114015014, + "loss": 0.7998, + "mean_token_accuracy": 0.76486234664917, + "num_tokens": 88291051.0, + "step": 25950 + }, + { + "epoch": 0.2605483961620298, + "learning_rate": 0.00014789232807419007, + "loss": 0.7442, + "mean_token_accuracy": 0.774928230047226, + "num_tokens": 88325971.0, + "step": 25960 + }, + { + "epoch": 0.26064876149183025, + "learning_rate": 0.00014787225500822996, + "loss": 0.7897, + "mean_token_accuracy": 0.7625066220760346, + "num_tokens": 88359212.0, + "step": 25970 + }, + { + "epoch": 0.26074912682163076, + "learning_rate": 0.00014785218194226986, + "loss": 0.7635, + "mean_token_accuracy": 0.7737499475479126, + "num_tokens": 88393800.0, + "step": 25980 + }, + { + "epoch": 0.2608494921514312, + "learning_rate": 0.00014783210887630977, + "loss": 0.7666, + "mean_token_accuracy": 0.7730528473854065, + "num_tokens": 88427377.0, + "step": 25990 + }, + { + "epoch": 0.2609498574812317, + "learning_rate": 0.00014781203581034968, + "loss": 0.754, + "mean_token_accuracy": 0.7699731945991516, + "num_tokens": 88461009.0, + "step": 26000 + }, + { + "epoch": 0.2610502228110322, + "learning_rate": 0.0001477919627443896, + "loss": 0.7432, + "mean_token_accuracy": 0.7773293673992157, + "num_tokens": 88495592.0, + "step": 26010 + }, + { + "epoch": 0.26115058814083264, + "learning_rate": 0.0001477718896784295, + "loss": 0.7381, + "mean_token_accuracy": 0.7789890348911286, + "num_tokens": 88529869.0, + "step": 26020 + }, + { + "epoch": 0.2612509534706331, + "learning_rate": 0.0001477518166124694, + "loss": 0.7281, + "mean_token_accuracy": 0.7793543338775635, + "num_tokens": 88564353.0, + "step": 26030 + }, + { + "epoch": 0.26135131880043355, + "learning_rate": 0.0001477317435465093, + "loss": 0.7974, + "mean_token_accuracy": 0.7633599936962128, + "num_tokens": 88597465.0, + "step": 26040 + }, + { + "epoch": 0.26145168413023406, + "learning_rate": 0.00014771167048054922, + "loss": 0.7659, + "mean_token_accuracy": 0.7736822187900543, + "num_tokens": 88632088.0, + "step": 26050 + }, + { + "epoch": 0.2615520494600345, + "learning_rate": 0.0001476915974145891, + "loss": 0.7615, + "mean_token_accuracy": 0.775991004705429, + "num_tokens": 88666349.0, + "step": 26060 + }, + { + "epoch": 0.261652414789835, + "learning_rate": 0.000147671524348629, + "loss": 0.7854, + "mean_token_accuracy": 0.767848151922226, + "num_tokens": 88700496.0, + "step": 26070 + }, + { + "epoch": 0.2617527801196355, + "learning_rate": 0.00014765145128266892, + "loss": 0.7569, + "mean_token_accuracy": 0.7757873892784118, + "num_tokens": 88734242.0, + "step": 26080 + }, + { + "epoch": 0.26185314544943594, + "learning_rate": 0.00014763137821670883, + "loss": 0.7732, + "mean_token_accuracy": 0.7637600004673004, + "num_tokens": 88768767.0, + "step": 26090 + }, + { + "epoch": 0.2619535107792364, + "learning_rate": 0.0001476113051507487, + "loss": 0.7515, + "mean_token_accuracy": 0.7808138072490692, + "num_tokens": 88802694.0, + "step": 26100 + }, + { + "epoch": 0.2620538761090369, + "learning_rate": 0.00014759123208478865, + "loss": 0.7785, + "mean_token_accuracy": 0.7718406736850738, + "num_tokens": 88837667.0, + "step": 26110 + }, + { + "epoch": 0.26215424143883737, + "learning_rate": 0.00014757115901882856, + "loss": 0.7647, + "mean_token_accuracy": 0.7676180183887482, + "num_tokens": 88871970.0, + "step": 26120 + }, + { + "epoch": 0.2622546067686378, + "learning_rate": 0.00014755108595286844, + "loss": 0.763, + "mean_token_accuracy": 0.7729875087738037, + "num_tokens": 88906196.0, + "step": 26130 + }, + { + "epoch": 0.26235497209843833, + "learning_rate": 0.00014753101288690837, + "loss": 0.7668, + "mean_token_accuracy": 0.765146690607071, + "num_tokens": 88940835.0, + "step": 26140 + }, + { + "epoch": 0.2624553374282388, + "learning_rate": 0.00014751093982094825, + "loss": 0.7629, + "mean_token_accuracy": 0.7752687871456146, + "num_tokens": 88974742.0, + "step": 26150 + }, + { + "epoch": 0.26255570275803924, + "learning_rate": 0.00014749086675498816, + "loss": 0.7757, + "mean_token_accuracy": 0.766808158159256, + "num_tokens": 89008704.0, + "step": 26160 + }, + { + "epoch": 0.26265606808783976, + "learning_rate": 0.00014747079368902807, + "loss": 0.7471, + "mean_token_accuracy": 0.7748014807701111, + "num_tokens": 89042137.0, + "step": 26170 + }, + { + "epoch": 0.2627564334176402, + "learning_rate": 0.00014745072062306798, + "loss": 0.777, + "mean_token_accuracy": 0.7709549844264985, + "num_tokens": 89076907.0, + "step": 26180 + }, + { + "epoch": 0.26285679874744067, + "learning_rate": 0.00014743064755710786, + "loss": 0.7771, + "mean_token_accuracy": 0.769685173034668, + "num_tokens": 89111152.0, + "step": 26190 + }, + { + "epoch": 0.2629571640772412, + "learning_rate": 0.0001474105744911478, + "loss": 0.7893, + "mean_token_accuracy": 0.7698112249374389, + "num_tokens": 89144779.0, + "step": 26200 + }, + { + "epoch": 0.26305752940704163, + "learning_rate": 0.00014739050142518768, + "loss": 0.7556, + "mean_token_accuracy": 0.7724555194377899, + "num_tokens": 89179208.0, + "step": 26210 + }, + { + "epoch": 0.2631578947368421, + "learning_rate": 0.00014737042835922759, + "loss": 0.764, + "mean_token_accuracy": 0.7716877400875092, + "num_tokens": 89214342.0, + "step": 26220 + }, + { + "epoch": 0.2632582600666426, + "learning_rate": 0.0001473503552932675, + "loss": 0.7617, + "mean_token_accuracy": 0.7650292932987213, + "num_tokens": 89248605.0, + "step": 26230 + }, + { + "epoch": 0.26335862539644306, + "learning_rate": 0.0001473302822273074, + "loss": 0.7672, + "mean_token_accuracy": 0.7738565146923065, + "num_tokens": 89283124.0, + "step": 26240 + }, + { + "epoch": 0.2634589907262435, + "learning_rate": 0.0001473102091613473, + "loss": 0.7672, + "mean_token_accuracy": 0.7719832837581635, + "num_tokens": 89317935.0, + "step": 26250 + }, + { + "epoch": 0.263559356056044, + "learning_rate": 0.00014729013609538722, + "loss": 0.7356, + "mean_token_accuracy": 0.7735422611236572, + "num_tokens": 89351818.0, + "step": 26260 + }, + { + "epoch": 0.2636597213858445, + "learning_rate": 0.00014727006302942713, + "loss": 0.7358, + "mean_token_accuracy": 0.7762411177158356, + "num_tokens": 89386435.0, + "step": 26270 + }, + { + "epoch": 0.26376008671564494, + "learning_rate": 0.000147249989963467, + "loss": 0.7471, + "mean_token_accuracy": 0.7716344475746155, + "num_tokens": 89419913.0, + "step": 26280 + }, + { + "epoch": 0.26386045204544545, + "learning_rate": 0.00014722991689750694, + "loss": 0.756, + "mean_token_accuracy": 0.7759276568889618, + "num_tokens": 89453983.0, + "step": 26290 + }, + { + "epoch": 0.2639608173752459, + "learning_rate": 0.00014720984383154683, + "loss": 0.7705, + "mean_token_accuracy": 0.7660773396492004, + "num_tokens": 89488193.0, + "step": 26300 + }, + { + "epoch": 0.26406118270504636, + "learning_rate": 0.00014718977076558673, + "loss": 0.7792, + "mean_token_accuracy": 0.7708575546741485, + "num_tokens": 89522827.0, + "step": 26310 + }, + { + "epoch": 0.2641615480348468, + "learning_rate": 0.00014716969769962664, + "loss": 0.7586, + "mean_token_accuracy": 0.7754275083541871, + "num_tokens": 89557222.0, + "step": 26320 + }, + { + "epoch": 0.2642619133646473, + "learning_rate": 0.00014714962463366655, + "loss": 0.7269, + "mean_token_accuracy": 0.7784863173961639, + "num_tokens": 89590824.0, + "step": 26330 + }, + { + "epoch": 0.2643622786944478, + "learning_rate": 0.00014712955156770646, + "loss": 0.7862, + "mean_token_accuracy": 0.7694959044456482, + "num_tokens": 89624242.0, + "step": 26340 + }, + { + "epoch": 0.26446264402424824, + "learning_rate": 0.00014710947850174637, + "loss": 0.774, + "mean_token_accuracy": 0.7698050498962402, + "num_tokens": 89658183.0, + "step": 26350 + }, + { + "epoch": 0.26456300935404875, + "learning_rate": 0.00014708940543578628, + "loss": 0.7435, + "mean_token_accuracy": 0.7790042400360108, + "num_tokens": 89692498.0, + "step": 26360 + }, + { + "epoch": 0.2646633746838492, + "learning_rate": 0.00014706933236982618, + "loss": 0.7808, + "mean_token_accuracy": 0.7702409267425537, + "num_tokens": 89726203.0, + "step": 26370 + }, + { + "epoch": 0.26476374001364966, + "learning_rate": 0.0001470492593038661, + "loss": 0.7667, + "mean_token_accuracy": 0.7702608048915863, + "num_tokens": 89761020.0, + "step": 26380 + }, + { + "epoch": 0.2648641053434502, + "learning_rate": 0.00014702918623790597, + "loss": 0.7636, + "mean_token_accuracy": 0.7724583685398102, + "num_tokens": 89794899.0, + "step": 26390 + }, + { + "epoch": 0.26496447067325063, + "learning_rate": 0.0001470091131719459, + "loss": 0.7647, + "mean_token_accuracy": 0.7716863036155701, + "num_tokens": 89829349.0, + "step": 26400 + }, + { + "epoch": 0.2650648360030511, + "learning_rate": 0.0001469890401059858, + "loss": 0.7896, + "mean_token_accuracy": 0.7599710524082184, + "num_tokens": 89863346.0, + "step": 26410 + }, + { + "epoch": 0.2651652013328516, + "learning_rate": 0.0001469689670400257, + "loss": 0.7805, + "mean_token_accuracy": 0.7709419846534729, + "num_tokens": 89897702.0, + "step": 26420 + }, + { + "epoch": 0.26526556666265205, + "learning_rate": 0.0001469488939740656, + "loss": 0.7534, + "mean_token_accuracy": 0.7745054662227631, + "num_tokens": 89931936.0, + "step": 26430 + }, + { + "epoch": 0.2653659319924525, + "learning_rate": 0.00014692882090810552, + "loss": 0.773, + "mean_token_accuracy": 0.7691297650337219, + "num_tokens": 89965848.0, + "step": 26440 + }, + { + "epoch": 0.265466297322253, + "learning_rate": 0.0001469087478421454, + "loss": 0.7411, + "mean_token_accuracy": 0.7742989897727967, + "num_tokens": 90000381.0, + "step": 26450 + }, + { + "epoch": 0.2655666626520535, + "learning_rate": 0.00014688867477618533, + "loss": 0.7487, + "mean_token_accuracy": 0.7739397466182709, + "num_tokens": 90034983.0, + "step": 26460 + }, + { + "epoch": 0.26566702798185393, + "learning_rate": 0.00014686860171022524, + "loss": 0.7722, + "mean_token_accuracy": 0.7688474774360656, + "num_tokens": 90068902.0, + "step": 26470 + }, + { + "epoch": 0.26576739331165444, + "learning_rate": 0.00014684852864426512, + "loss": 0.7474, + "mean_token_accuracy": 0.7761471569538116, + "num_tokens": 90102872.0, + "step": 26480 + }, + { + "epoch": 0.2658677586414549, + "learning_rate": 0.00014682845557830506, + "loss": 0.75, + "mean_token_accuracy": 0.7720959186553955, + "num_tokens": 90136397.0, + "step": 26490 + }, + { + "epoch": 0.26596812397125535, + "learning_rate": 0.00014680838251234494, + "loss": 0.7705, + "mean_token_accuracy": 0.769785875082016, + "num_tokens": 90169930.0, + "step": 26500 + }, + { + "epoch": 0.26606848930105587, + "learning_rate": 0.00014678830944638485, + "loss": 0.7813, + "mean_token_accuracy": 0.7711447656154633, + "num_tokens": 90204175.0, + "step": 26510 + }, + { + "epoch": 0.2661688546308563, + "learning_rate": 0.00014676823638042476, + "loss": 0.7756, + "mean_token_accuracy": 0.7681370198726654, + "num_tokens": 90238114.0, + "step": 26520 + }, + { + "epoch": 0.2662692199606568, + "learning_rate": 0.00014674816331446467, + "loss": 0.7562, + "mean_token_accuracy": 0.7734508454799652, + "num_tokens": 90272322.0, + "step": 26530 + }, + { + "epoch": 0.2663695852904573, + "learning_rate": 0.00014672809024850455, + "loss": 0.7734, + "mean_token_accuracy": 0.770289134979248, + "num_tokens": 90305800.0, + "step": 26540 + }, + { + "epoch": 0.26646995062025775, + "learning_rate": 0.00014670801718254448, + "loss": 0.7493, + "mean_token_accuracy": 0.7708206474781036, + "num_tokens": 90339684.0, + "step": 26550 + }, + { + "epoch": 0.2665703159500582, + "learning_rate": 0.00014668794411658436, + "loss": 0.7423, + "mean_token_accuracy": 0.7786689579486847, + "num_tokens": 90372906.0, + "step": 26560 + }, + { + "epoch": 0.2666706812798587, + "learning_rate": 0.00014666787105062427, + "loss": 0.7369, + "mean_token_accuracy": 0.7815804660320282, + "num_tokens": 90406942.0, + "step": 26570 + }, + { + "epoch": 0.26677104660965917, + "learning_rate": 0.00014664779798466418, + "loss": 0.776, + "mean_token_accuracy": 0.7725221812725067, + "num_tokens": 90440698.0, + "step": 26580 + }, + { + "epoch": 0.2668714119394596, + "learning_rate": 0.0001466277249187041, + "loss": 0.7444, + "mean_token_accuracy": 0.7757733106613159, + "num_tokens": 90474987.0, + "step": 26590 + }, + { + "epoch": 0.2669717772692601, + "learning_rate": 0.000146607651852744, + "loss": 0.7831, + "mean_token_accuracy": 0.7649937748908997, + "num_tokens": 90508097.0, + "step": 26600 + }, + { + "epoch": 0.2670721425990606, + "learning_rate": 0.0001465875787867839, + "loss": 0.7617, + "mean_token_accuracy": 0.7734456777572631, + "num_tokens": 90542306.0, + "step": 26610 + }, + { + "epoch": 0.26717250792886105, + "learning_rate": 0.00014656750572082381, + "loss": 0.7369, + "mean_token_accuracy": 0.7760408341884613, + "num_tokens": 90576882.0, + "step": 26620 + }, + { + "epoch": 0.2672728732586615, + "learning_rate": 0.0001465474326548637, + "loss": 0.7669, + "mean_token_accuracy": 0.771179610490799, + "num_tokens": 90611481.0, + "step": 26630 + }, + { + "epoch": 0.267373238588462, + "learning_rate": 0.00014652735958890363, + "loss": 0.7684, + "mean_token_accuracy": 0.7678513467311859, + "num_tokens": 90645536.0, + "step": 26640 + }, + { + "epoch": 0.26747360391826247, + "learning_rate": 0.0001465072865229435, + "loss": 0.7648, + "mean_token_accuracy": 0.7721072733402252, + "num_tokens": 90677927.0, + "step": 26650 + }, + { + "epoch": 0.2675739692480629, + "learning_rate": 0.00014648721345698342, + "loss": 0.756, + "mean_token_accuracy": 0.7761224567890167, + "num_tokens": 90711841.0, + "step": 26660 + }, + { + "epoch": 0.26767433457786344, + "learning_rate": 0.00014646714039102333, + "loss": 0.798, + "mean_token_accuracy": 0.7591996788978577, + "num_tokens": 90745399.0, + "step": 26670 + }, + { + "epoch": 0.2677746999076639, + "learning_rate": 0.00014644706732506324, + "loss": 0.7148, + "mean_token_accuracy": 0.7797797799110413, + "num_tokens": 90780285.0, + "step": 26680 + }, + { + "epoch": 0.26787506523746435, + "learning_rate": 0.00014642699425910315, + "loss": 0.7872, + "mean_token_accuracy": 0.7621639013290405, + "num_tokens": 90814627.0, + "step": 26690 + }, + { + "epoch": 0.26797543056726486, + "learning_rate": 0.00014640692119314305, + "loss": 0.748, + "mean_token_accuracy": 0.7777003645896912, + "num_tokens": 90848678.0, + "step": 26700 + }, + { + "epoch": 0.2680757958970653, + "learning_rate": 0.00014638684812718296, + "loss": 0.7405, + "mean_token_accuracy": 0.7803672850131989, + "num_tokens": 90883023.0, + "step": 26710 + }, + { + "epoch": 0.2681761612268658, + "learning_rate": 0.00014636677506122284, + "loss": 0.7517, + "mean_token_accuracy": 0.776670640707016, + "num_tokens": 90916308.0, + "step": 26720 + }, + { + "epoch": 0.2682765265566663, + "learning_rate": 0.00014634670199526278, + "loss": 0.7811, + "mean_token_accuracy": 0.7678254127502442, + "num_tokens": 90950190.0, + "step": 26730 + }, + { + "epoch": 0.26837689188646674, + "learning_rate": 0.00014632662892930266, + "loss": 0.7742, + "mean_token_accuracy": 0.7694431900978088, + "num_tokens": 90984264.0, + "step": 26740 + }, + { + "epoch": 0.2684772572162672, + "learning_rate": 0.00014630655586334257, + "loss": 0.7571, + "mean_token_accuracy": 0.7706903934478759, + "num_tokens": 91018052.0, + "step": 26750 + }, + { + "epoch": 0.2685776225460677, + "learning_rate": 0.00014628648279738248, + "loss": 0.7584, + "mean_token_accuracy": 0.7746901094913483, + "num_tokens": 91051633.0, + "step": 26760 + }, + { + "epoch": 0.26867798787586816, + "learning_rate": 0.0001462664097314224, + "loss": 0.7367, + "mean_token_accuracy": 0.7790070295333862, + "num_tokens": 91085155.0, + "step": 26770 + }, + { + "epoch": 0.2687783532056686, + "learning_rate": 0.00014624633666546227, + "loss": 0.7598, + "mean_token_accuracy": 0.7718618929386138, + "num_tokens": 91119620.0, + "step": 26780 + }, + { + "epoch": 0.26887871853546913, + "learning_rate": 0.0001462262635995022, + "loss": 0.7817, + "mean_token_accuracy": 0.7654790699481964, + "num_tokens": 91153999.0, + "step": 26790 + }, + { + "epoch": 0.2689790838652696, + "learning_rate": 0.00014620619053354208, + "loss": 0.7861, + "mean_token_accuracy": 0.7685680568218232, + "num_tokens": 91188823.0, + "step": 26800 + }, + { + "epoch": 0.26907944919507004, + "learning_rate": 0.000146186117467582, + "loss": 0.7468, + "mean_token_accuracy": 0.7814339876174927, + "num_tokens": 91222517.0, + "step": 26810 + }, + { + "epoch": 0.26917981452487055, + "learning_rate": 0.00014616604440162193, + "loss": 0.7612, + "mean_token_accuracy": 0.7738438963890075, + "num_tokens": 91255788.0, + "step": 26820 + }, + { + "epoch": 0.269280179854671, + "learning_rate": 0.0001461459713356618, + "loss": 0.7524, + "mean_token_accuracy": 0.7798373401165009, + "num_tokens": 91290426.0, + "step": 26830 + }, + { + "epoch": 0.26938054518447146, + "learning_rate": 0.00014612589826970172, + "loss": 0.7551, + "mean_token_accuracy": 0.7722236275672912, + "num_tokens": 91324006.0, + "step": 26840 + }, + { + "epoch": 0.269480910514272, + "learning_rate": 0.00014610582520374163, + "loss": 0.7644, + "mean_token_accuracy": 0.7733603954315186, + "num_tokens": 91358023.0, + "step": 26850 + }, + { + "epoch": 0.26958127584407243, + "learning_rate": 0.00014608575213778154, + "loss": 0.7467, + "mean_token_accuracy": 0.7735972940921784, + "num_tokens": 91391146.0, + "step": 26860 + }, + { + "epoch": 0.2696816411738729, + "learning_rate": 0.00014606567907182142, + "loss": 0.7633, + "mean_token_accuracy": 0.7709302246570587, + "num_tokens": 91424533.0, + "step": 26870 + }, + { + "epoch": 0.26978200650367334, + "learning_rate": 0.00014604560600586135, + "loss": 0.7555, + "mean_token_accuracy": 0.7727507174015045, + "num_tokens": 91459307.0, + "step": 26880 + }, + { + "epoch": 0.26988237183347386, + "learning_rate": 0.00014602553293990123, + "loss": 0.791, + "mean_token_accuracy": 0.7658800482749939, + "num_tokens": 91492206.0, + "step": 26890 + }, + { + "epoch": 0.2699827371632743, + "learning_rate": 0.00014600545987394114, + "loss": 0.7527, + "mean_token_accuracy": 0.7779639959335327, + "num_tokens": 91526738.0, + "step": 26900 + }, + { + "epoch": 0.27008310249307477, + "learning_rate": 0.00014598538680798105, + "loss": 0.8066, + "mean_token_accuracy": 0.7683506786823273, + "num_tokens": 91561481.0, + "step": 26910 + }, + { + "epoch": 0.2701834678228753, + "learning_rate": 0.00014596531374202096, + "loss": 0.7674, + "mean_token_accuracy": 0.7711017251014709, + "num_tokens": 91594524.0, + "step": 26920 + }, + { + "epoch": 0.27028383315267573, + "learning_rate": 0.00014594524067606087, + "loss": 0.7502, + "mean_token_accuracy": 0.7745255947113037, + "num_tokens": 91628790.0, + "step": 26930 + }, + { + "epoch": 0.2703841984824762, + "learning_rate": 0.00014592516761010078, + "loss": 0.7484, + "mean_token_accuracy": 0.7774655818939209, + "num_tokens": 91662405.0, + "step": 26940 + }, + { + "epoch": 0.2704845638122767, + "learning_rate": 0.00014590509454414068, + "loss": 0.7758, + "mean_token_accuracy": 0.7700693845748902, + "num_tokens": 91695910.0, + "step": 26950 + }, + { + "epoch": 0.27058492914207716, + "learning_rate": 0.0001458850214781806, + "loss": 0.7373, + "mean_token_accuracy": 0.7784343719482422, + "num_tokens": 91730220.0, + "step": 26960 + }, + { + "epoch": 0.2706852944718776, + "learning_rate": 0.0001458649484122205, + "loss": 0.77, + "mean_token_accuracy": 0.7710197031497955, + "num_tokens": 91764271.0, + "step": 26970 + }, + { + "epoch": 0.2707856598016781, + "learning_rate": 0.00014584487534626038, + "loss": 0.755, + "mean_token_accuracy": 0.7732560396194458, + "num_tokens": 91798289.0, + "step": 26980 + }, + { + "epoch": 0.2708860251314786, + "learning_rate": 0.00014582480228030032, + "loss": 0.804, + "mean_token_accuracy": 0.7688061237335205, + "num_tokens": 91833897.0, + "step": 26990 + }, + { + "epoch": 0.27098639046127904, + "learning_rate": 0.0001458047292143402, + "loss": 0.7586, + "mean_token_accuracy": 0.7720942556858063, + "num_tokens": 91866369.0, + "step": 27000 + }, + { + "epoch": 0.27108675579107955, + "learning_rate": 0.0001457846561483801, + "loss": 0.7596, + "mean_token_accuracy": 0.7738721609115601, + "num_tokens": 91900038.0, + "step": 27010 + }, + { + "epoch": 0.27118712112088, + "learning_rate": 0.00014576458308242002, + "loss": 0.7948, + "mean_token_accuracy": 0.766669362783432, + "num_tokens": 91933852.0, + "step": 27020 + }, + { + "epoch": 0.27128748645068046, + "learning_rate": 0.00014574451001645992, + "loss": 0.7531, + "mean_token_accuracy": 0.7770777583122254, + "num_tokens": 91968304.0, + "step": 27030 + }, + { + "epoch": 0.27138785178048097, + "learning_rate": 0.00014572443695049983, + "loss": 0.7481, + "mean_token_accuracy": 0.7717696845531463, + "num_tokens": 92001663.0, + "step": 27040 + }, + { + "epoch": 0.2714882171102814, + "learning_rate": 0.00014570436388453974, + "loss": 0.7413, + "mean_token_accuracy": 0.776682448387146, + "num_tokens": 92035535.0, + "step": 27050 + }, + { + "epoch": 0.2715885824400819, + "learning_rate": 0.00014568429081857965, + "loss": 0.7579, + "mean_token_accuracy": 0.7750038385391236, + "num_tokens": 92069123.0, + "step": 27060 + }, + { + "epoch": 0.2716889477698824, + "learning_rate": 0.00014566421775261953, + "loss": 0.7796, + "mean_token_accuracy": 0.769258689880371, + "num_tokens": 92103429.0, + "step": 27070 + }, + { + "epoch": 0.27178931309968285, + "learning_rate": 0.00014564414468665947, + "loss": 0.7679, + "mean_token_accuracy": 0.7737447798252106, + "num_tokens": 92137066.0, + "step": 27080 + }, + { + "epoch": 0.2718896784294833, + "learning_rate": 0.00014562407162069935, + "loss": 0.7683, + "mean_token_accuracy": 0.7694413065910339, + "num_tokens": 92170835.0, + "step": 27090 + }, + { + "epoch": 0.2719900437592838, + "learning_rate": 0.00014560399855473926, + "loss": 0.7937, + "mean_token_accuracy": 0.7688502252101899, + "num_tokens": 92204605.0, + "step": 27100 + }, + { + "epoch": 0.2720904090890843, + "learning_rate": 0.00014558392548877917, + "loss": 0.7626, + "mean_token_accuracy": 0.7689731538295745, + "num_tokens": 92238421.0, + "step": 27110 + }, + { + "epoch": 0.27219077441888473, + "learning_rate": 0.00014556385242281907, + "loss": 0.7851, + "mean_token_accuracy": 0.7678522109985352, + "num_tokens": 92271632.0, + "step": 27120 + }, + { + "epoch": 0.27229113974868524, + "learning_rate": 0.00014554377935685895, + "loss": 0.7798, + "mean_token_accuracy": 0.7715808153152466, + "num_tokens": 92306359.0, + "step": 27130 + }, + { + "epoch": 0.2723915050784857, + "learning_rate": 0.0001455237062908989, + "loss": 0.749, + "mean_token_accuracy": 0.7793966174125672, + "num_tokens": 92340190.0, + "step": 27140 + }, + { + "epoch": 0.27249187040828615, + "learning_rate": 0.00014550363322493877, + "loss": 0.7427, + "mean_token_accuracy": 0.7762248814105988, + "num_tokens": 92374829.0, + "step": 27150 + }, + { + "epoch": 0.2725922357380866, + "learning_rate": 0.00014548356015897868, + "loss": 0.7611, + "mean_token_accuracy": 0.774640703201294, + "num_tokens": 92408164.0, + "step": 27160 + }, + { + "epoch": 0.2726926010678871, + "learning_rate": 0.00014546348709301862, + "loss": 0.7566, + "mean_token_accuracy": 0.769939798116684, + "num_tokens": 92441790.0, + "step": 27170 + }, + { + "epoch": 0.2727929663976876, + "learning_rate": 0.0001454434140270585, + "loss": 0.7516, + "mean_token_accuracy": 0.7719286739826202, + "num_tokens": 92475623.0, + "step": 27180 + }, + { + "epoch": 0.27289333172748803, + "learning_rate": 0.0001454233409610984, + "loss": 0.759, + "mean_token_accuracy": 0.7721605718135833, + "num_tokens": 92509903.0, + "step": 27190 + }, + { + "epoch": 0.27299369705728854, + "learning_rate": 0.00014540326789513831, + "loss": 0.7858, + "mean_token_accuracy": 0.769053041934967, + "num_tokens": 92543066.0, + "step": 27200 + }, + { + "epoch": 0.273094062387089, + "learning_rate": 0.00014538319482917822, + "loss": 0.7449, + "mean_token_accuracy": 0.7751676380634308, + "num_tokens": 92577254.0, + "step": 27210 + }, + { + "epoch": 0.27319442771688945, + "learning_rate": 0.0001453631217632181, + "loss": 0.7531, + "mean_token_accuracy": 0.7739300549030304, + "num_tokens": 92611429.0, + "step": 27220 + }, + { + "epoch": 0.27329479304668997, + "learning_rate": 0.00014534304869725804, + "loss": 0.7595, + "mean_token_accuracy": 0.7717872381210327, + "num_tokens": 92645621.0, + "step": 27230 + }, + { + "epoch": 0.2733951583764904, + "learning_rate": 0.00014532297563129792, + "loss": 0.7555, + "mean_token_accuracy": 0.7736692726612091, + "num_tokens": 92679943.0, + "step": 27240 + }, + { + "epoch": 0.2734955237062909, + "learning_rate": 0.00014530290256533783, + "loss": 0.7526, + "mean_token_accuracy": 0.7769086182117462, + "num_tokens": 92714044.0, + "step": 27250 + }, + { + "epoch": 0.2735958890360914, + "learning_rate": 0.00014528282949937774, + "loss": 0.7704, + "mean_token_accuracy": 0.7706098198890686, + "num_tokens": 92747702.0, + "step": 27260 + }, + { + "epoch": 0.27369625436589184, + "learning_rate": 0.00014526275643341765, + "loss": 0.758, + "mean_token_accuracy": 0.7733682990074158, + "num_tokens": 92781472.0, + "step": 27270 + }, + { + "epoch": 0.2737966196956923, + "learning_rate": 0.00014524268336745755, + "loss": 0.7782, + "mean_token_accuracy": 0.7743779301643372, + "num_tokens": 92815143.0, + "step": 27280 + }, + { + "epoch": 0.2738969850254928, + "learning_rate": 0.00014522261030149746, + "loss": 0.772, + "mean_token_accuracy": 0.7625142872333527, + "num_tokens": 92849414.0, + "step": 27290 + }, + { + "epoch": 0.27399735035529327, + "learning_rate": 0.00014520253723553737, + "loss": 0.7282, + "mean_token_accuracy": 0.7782218098640442, + "num_tokens": 92883309.0, + "step": 27300 + }, + { + "epoch": 0.2740977156850937, + "learning_rate": 0.00014518246416957725, + "loss": 0.7501, + "mean_token_accuracy": 0.7723683476448059, + "num_tokens": 92917119.0, + "step": 27310 + }, + { + "epoch": 0.27419808101489423, + "learning_rate": 0.0001451623911036172, + "loss": 0.7795, + "mean_token_accuracy": 0.7603408515453338, + "num_tokens": 92951054.0, + "step": 27320 + }, + { + "epoch": 0.2742984463446947, + "learning_rate": 0.00014514231803765707, + "loss": 0.7496, + "mean_token_accuracy": 0.7706218063831329, + "num_tokens": 92985246.0, + "step": 27330 + }, + { + "epoch": 0.27439881167449515, + "learning_rate": 0.00014512224497169698, + "loss": 0.7861, + "mean_token_accuracy": 0.7647865056991577, + "num_tokens": 93019185.0, + "step": 27340 + }, + { + "epoch": 0.27449917700429566, + "learning_rate": 0.00014510217190573689, + "loss": 0.7869, + "mean_token_accuracy": 0.7622201561927795, + "num_tokens": 93052004.0, + "step": 27350 + }, + { + "epoch": 0.2745995423340961, + "learning_rate": 0.0001450820988397768, + "loss": 0.7667, + "mean_token_accuracy": 0.7691390633583068, + "num_tokens": 93085775.0, + "step": 27360 + }, + { + "epoch": 0.27469990766389657, + "learning_rate": 0.0001450620257738167, + "loss": 0.7774, + "mean_token_accuracy": 0.7697662651538849, + "num_tokens": 93119339.0, + "step": 27370 + }, + { + "epoch": 0.2748002729936971, + "learning_rate": 0.0001450419527078566, + "loss": 0.7812, + "mean_token_accuracy": 0.7708326518535614, + "num_tokens": 93152624.0, + "step": 27380 + }, + { + "epoch": 0.27490063832349754, + "learning_rate": 0.00014502187964189652, + "loss": 0.7749, + "mean_token_accuracy": 0.773492568731308, + "num_tokens": 93187350.0, + "step": 27390 + }, + { + "epoch": 0.275001003653298, + "learning_rate": 0.0001450018065759364, + "loss": 0.7615, + "mean_token_accuracy": 0.7714549422264099, + "num_tokens": 93221486.0, + "step": 27400 + }, + { + "epoch": 0.2751013689830985, + "learning_rate": 0.00014498173350997634, + "loss": 0.7441, + "mean_token_accuracy": 0.7719537556171417, + "num_tokens": 93255173.0, + "step": 27410 + }, + { + "epoch": 0.27520173431289896, + "learning_rate": 0.00014496166044401622, + "loss": 0.7648, + "mean_token_accuracy": 0.7742453396320343, + "num_tokens": 93287585.0, + "step": 27420 + }, + { + "epoch": 0.2753020996426994, + "learning_rate": 0.00014494158737805613, + "loss": 0.788, + "mean_token_accuracy": 0.7616688489913941, + "num_tokens": 93321191.0, + "step": 27430 + }, + { + "epoch": 0.27540246497249987, + "learning_rate": 0.00014492151431209603, + "loss": 0.7625, + "mean_token_accuracy": 0.7683378040790558, + "num_tokens": 93354782.0, + "step": 27440 + }, + { + "epoch": 0.2755028303023004, + "learning_rate": 0.00014490144124613594, + "loss": 0.7866, + "mean_token_accuracy": 0.7675630867481231, + "num_tokens": 93388494.0, + "step": 27450 + }, + { + "epoch": 0.27560319563210084, + "learning_rate": 0.00014488136818017582, + "loss": 0.7565, + "mean_token_accuracy": 0.7782629013061524, + "num_tokens": 93422181.0, + "step": 27460 + }, + { + "epoch": 0.2757035609619013, + "learning_rate": 0.00014486129511421576, + "loss": 0.7416, + "mean_token_accuracy": 0.7764272034168244, + "num_tokens": 93456328.0, + "step": 27470 + }, + { + "epoch": 0.2758039262917018, + "learning_rate": 0.00014484122204825564, + "loss": 0.7569, + "mean_token_accuracy": 0.7699039518833161, + "num_tokens": 93490705.0, + "step": 27480 + }, + { + "epoch": 0.27590429162150226, + "learning_rate": 0.00014482114898229558, + "loss": 0.7709, + "mean_token_accuracy": 0.773164016008377, + "num_tokens": 93524210.0, + "step": 27490 + }, + { + "epoch": 0.2760046569513027, + "learning_rate": 0.00014480107591633546, + "loss": 0.7364, + "mean_token_accuracy": 0.7783370196819306, + "num_tokens": 93558061.0, + "step": 27500 + }, + { + "epoch": 0.27610502228110323, + "learning_rate": 0.00014478100285037537, + "loss": 0.7507, + "mean_token_accuracy": 0.7777692973613739, + "num_tokens": 93593033.0, + "step": 27510 + }, + { + "epoch": 0.2762053876109037, + "learning_rate": 0.0001447609297844153, + "loss": 0.7486, + "mean_token_accuracy": 0.7742154121398925, + "num_tokens": 93626303.0, + "step": 27520 + }, + { + "epoch": 0.27630575294070414, + "learning_rate": 0.00014474085671845518, + "loss": 0.7917, + "mean_token_accuracy": 0.76452516913414, + "num_tokens": 93661039.0, + "step": 27530 + }, + { + "epoch": 0.27640611827050465, + "learning_rate": 0.0001447207836524951, + "loss": 0.7643, + "mean_token_accuracy": 0.7712850332260132, + "num_tokens": 93694127.0, + "step": 27540 + }, + { + "epoch": 0.2765064836003051, + "learning_rate": 0.000144700710586535, + "loss": 0.7515, + "mean_token_accuracy": 0.7779252588748932, + "num_tokens": 93727570.0, + "step": 27550 + }, + { + "epoch": 0.27660684893010556, + "learning_rate": 0.0001446806375205749, + "loss": 0.7731, + "mean_token_accuracy": 0.7694986999034882, + "num_tokens": 93761211.0, + "step": 27560 + }, + { + "epoch": 0.2767072142599061, + "learning_rate": 0.0001446605644546148, + "loss": 0.7703, + "mean_token_accuracy": 0.7661393880844116, + "num_tokens": 93794623.0, + "step": 27570 + }, + { + "epoch": 0.27680757958970653, + "learning_rate": 0.00014464049138865473, + "loss": 0.7699, + "mean_token_accuracy": 0.7691900432109833, + "num_tokens": 93828423.0, + "step": 27580 + }, + { + "epoch": 0.276907944919507, + "learning_rate": 0.0001446204183226946, + "loss": 0.7637, + "mean_token_accuracy": 0.7683387637138367, + "num_tokens": 93861875.0, + "step": 27590 + }, + { + "epoch": 0.2770083102493075, + "learning_rate": 0.00014460034525673452, + "loss": 0.7609, + "mean_token_accuracy": 0.7742133915424347, + "num_tokens": 93895356.0, + "step": 27600 + }, + { + "epoch": 0.27710867557910795, + "learning_rate": 0.00014458027219077442, + "loss": 0.7438, + "mean_token_accuracy": 0.7763895392417908, + "num_tokens": 93929096.0, + "step": 27610 + }, + { + "epoch": 0.2772090409089084, + "learning_rate": 0.00014456019912481433, + "loss": 0.7544, + "mean_token_accuracy": 0.7730475723743438, + "num_tokens": 93962868.0, + "step": 27620 + }, + { + "epoch": 0.2773094062387089, + "learning_rate": 0.00014454012605885424, + "loss": 0.7662, + "mean_token_accuracy": 0.7731011271476745, + "num_tokens": 93997156.0, + "step": 27630 + }, + { + "epoch": 0.2774097715685094, + "learning_rate": 0.00014452005299289415, + "loss": 0.7569, + "mean_token_accuracy": 0.7725311994552613, + "num_tokens": 94031395.0, + "step": 27640 + }, + { + "epoch": 0.27751013689830983, + "learning_rate": 0.00014449997992693406, + "loss": 0.7388, + "mean_token_accuracy": 0.7824570715427399, + "num_tokens": 94065614.0, + "step": 27650 + }, + { + "epoch": 0.27761050222811035, + "learning_rate": 0.00014447990686097394, + "loss": 0.735, + "mean_token_accuracy": 0.7755841255187989, + "num_tokens": 94099789.0, + "step": 27660 + }, + { + "epoch": 0.2777108675579108, + "learning_rate": 0.00014445983379501387, + "loss": 0.7411, + "mean_token_accuracy": 0.7816408157348633, + "num_tokens": 94133642.0, + "step": 27670 + }, + { + "epoch": 0.27781123288771126, + "learning_rate": 0.00014443976072905376, + "loss": 0.7383, + "mean_token_accuracy": 0.7797886252403259, + "num_tokens": 94167582.0, + "step": 27680 + }, + { + "epoch": 0.27791159821751177, + "learning_rate": 0.00014441968766309366, + "loss": 0.7522, + "mean_token_accuracy": 0.7724378883838654, + "num_tokens": 94202495.0, + "step": 27690 + }, + { + "epoch": 0.2780119635473122, + "learning_rate": 0.00014439961459713357, + "loss": 0.7833, + "mean_token_accuracy": 0.7701262414455414, + "num_tokens": 94236805.0, + "step": 27700 + }, + { + "epoch": 0.2781123288771127, + "learning_rate": 0.00014437954153117348, + "loss": 0.802, + "mean_token_accuracy": 0.7600609242916108, + "num_tokens": 94270099.0, + "step": 27710 + }, + { + "epoch": 0.2782126942069132, + "learning_rate": 0.0001443594684652134, + "loss": 0.7378, + "mean_token_accuracy": 0.7771346986293792, + "num_tokens": 94304587.0, + "step": 27720 + }, + { + "epoch": 0.27831305953671365, + "learning_rate": 0.0001443393953992533, + "loss": 0.7512, + "mean_token_accuracy": 0.7794571101665497, + "num_tokens": 94338925.0, + "step": 27730 + }, + { + "epoch": 0.2784134248665141, + "learning_rate": 0.0001443193223332932, + "loss": 0.7579, + "mean_token_accuracy": 0.7762793719768524, + "num_tokens": 94373156.0, + "step": 27740 + }, + { + "epoch": 0.27851379019631456, + "learning_rate": 0.0001442992492673331, + "loss": 0.7466, + "mean_token_accuracy": 0.7774362564086914, + "num_tokens": 94407745.0, + "step": 27750 + }, + { + "epoch": 0.27861415552611507, + "learning_rate": 0.00014427917620137302, + "loss": 0.7695, + "mean_token_accuracy": 0.7731296360492707, + "num_tokens": 94441357.0, + "step": 27760 + }, + { + "epoch": 0.2787145208559155, + "learning_rate": 0.0001442591031354129, + "loss": 0.7778, + "mean_token_accuracy": 0.772819846868515, + "num_tokens": 94474707.0, + "step": 27770 + }, + { + "epoch": 0.278814886185716, + "learning_rate": 0.0001442390300694528, + "loss": 0.7193, + "mean_token_accuracy": 0.7839652538299561, + "num_tokens": 94509157.0, + "step": 27780 + }, + { + "epoch": 0.2789152515155165, + "learning_rate": 0.00014421895700349272, + "loss": 0.7626, + "mean_token_accuracy": 0.7695025742053986, + "num_tokens": 94542957.0, + "step": 27790 + }, + { + "epoch": 0.27901561684531695, + "learning_rate": 0.00014419888393753263, + "loss": 0.772, + "mean_token_accuracy": 0.7738290429115295, + "num_tokens": 94577156.0, + "step": 27800 + }, + { + "epoch": 0.2791159821751174, + "learning_rate": 0.0001441788108715725, + "loss": 0.7546, + "mean_token_accuracy": 0.779708981513977, + "num_tokens": 94610412.0, + "step": 27810 + }, + { + "epoch": 0.2792163475049179, + "learning_rate": 0.00014415873780561245, + "loss": 0.7716, + "mean_token_accuracy": 0.7689424514770508, + "num_tokens": 94644339.0, + "step": 27820 + }, + { + "epoch": 0.2793167128347184, + "learning_rate": 0.00014413866473965233, + "loss": 0.7807, + "mean_token_accuracy": 0.7719169199466706, + "num_tokens": 94678212.0, + "step": 27830 + }, + { + "epoch": 0.27941707816451883, + "learning_rate": 0.00014411859167369224, + "loss": 0.8012, + "mean_token_accuracy": 0.7627018094062805, + "num_tokens": 94711572.0, + "step": 27840 + }, + { + "epoch": 0.27951744349431934, + "learning_rate": 0.00014409851860773215, + "loss": 0.7563, + "mean_token_accuracy": 0.7732181370258331, + "num_tokens": 94746210.0, + "step": 27850 + }, + { + "epoch": 0.2796178088241198, + "learning_rate": 0.00014407844554177205, + "loss": 0.7649, + "mean_token_accuracy": 0.77310009598732, + "num_tokens": 94780684.0, + "step": 27860 + }, + { + "epoch": 0.27971817415392025, + "learning_rate": 0.00014405837247581196, + "loss": 0.7802, + "mean_token_accuracy": 0.7678790330886841, + "num_tokens": 94814629.0, + "step": 27870 + }, + { + "epoch": 0.27981853948372076, + "learning_rate": 0.00014403829940985187, + "loss": 0.7699, + "mean_token_accuracy": 0.7725537121295929, + "num_tokens": 94848391.0, + "step": 27880 + }, + { + "epoch": 0.2799189048135212, + "learning_rate": 0.00014401822634389178, + "loss": 0.7663, + "mean_token_accuracy": 0.7687770128250122, + "num_tokens": 94882450.0, + "step": 27890 + }, + { + "epoch": 0.2800192701433217, + "learning_rate": 0.00014399815327793166, + "loss": 0.7744, + "mean_token_accuracy": 0.7670266807079316, + "num_tokens": 94916523.0, + "step": 27900 + }, + { + "epoch": 0.2801196354731222, + "learning_rate": 0.0001439780802119716, + "loss": 0.7619, + "mean_token_accuracy": 0.7759920358657837, + "num_tokens": 94950511.0, + "step": 27910 + }, + { + "epoch": 0.28022000080292264, + "learning_rate": 0.00014395800714601148, + "loss": 0.7888, + "mean_token_accuracy": 0.770870441198349, + "num_tokens": 94984809.0, + "step": 27920 + }, + { + "epoch": 0.2803203661327231, + "learning_rate": 0.00014393793408005139, + "loss": 0.7339, + "mean_token_accuracy": 0.7784211814403534, + "num_tokens": 95018325.0, + "step": 27930 + }, + { + "epoch": 0.2804207314625236, + "learning_rate": 0.0001439178610140913, + "loss": 0.7914, + "mean_token_accuracy": 0.7643942356109619, + "num_tokens": 95052556.0, + "step": 27940 + }, + { + "epoch": 0.28052109679232407, + "learning_rate": 0.0001438977879481312, + "loss": 0.779, + "mean_token_accuracy": 0.7691850602626801, + "num_tokens": 95086818.0, + "step": 27950 + }, + { + "epoch": 0.2806214621221245, + "learning_rate": 0.0001438777148821711, + "loss": 0.78, + "mean_token_accuracy": 0.7732650637626648, + "num_tokens": 95121026.0, + "step": 27960 + }, + { + "epoch": 0.28072182745192503, + "learning_rate": 0.00014385764181621102, + "loss": 0.7607, + "mean_token_accuracy": 0.7753560781478882, + "num_tokens": 95154968.0, + "step": 27970 + }, + { + "epoch": 0.2808221927817255, + "learning_rate": 0.00014383756875025093, + "loss": 0.7465, + "mean_token_accuracy": 0.7759646117687226, + "num_tokens": 95187520.0, + "step": 27980 + }, + { + "epoch": 0.28092255811152594, + "learning_rate": 0.0001438174956842908, + "loss": 0.7325, + "mean_token_accuracy": 0.7718597769737243, + "num_tokens": 95221151.0, + "step": 27990 + }, + { + "epoch": 0.28102292344132646, + "learning_rate": 0.00014379742261833074, + "loss": 0.738, + "mean_token_accuracy": 0.7761099696159363, + "num_tokens": 95254573.0, + "step": 28000 + }, + { + "epoch": 0.2811232887711269, + "learning_rate": 0.00014377734955237063, + "loss": 0.7829, + "mean_token_accuracy": 0.7705293476581574, + "num_tokens": 95289084.0, + "step": 28010 + }, + { + "epoch": 0.28122365410092737, + "learning_rate": 0.00014375727648641053, + "loss": 0.7435, + "mean_token_accuracy": 0.775824499130249, + "num_tokens": 95323588.0, + "step": 28020 + }, + { + "epoch": 0.2813240194307278, + "learning_rate": 0.00014373720342045044, + "loss": 0.7628, + "mean_token_accuracy": 0.7712218165397644, + "num_tokens": 95357591.0, + "step": 28030 + }, + { + "epoch": 0.28142438476052833, + "learning_rate": 0.00014371713035449035, + "loss": 0.7541, + "mean_token_accuracy": 0.7757143259048462, + "num_tokens": 95391528.0, + "step": 28040 + }, + { + "epoch": 0.2815247500903288, + "learning_rate": 0.00014369705728853026, + "loss": 0.7729, + "mean_token_accuracy": 0.7702911853790283, + "num_tokens": 95426526.0, + "step": 28050 + }, + { + "epoch": 0.28162511542012925, + "learning_rate": 0.00014367698422257017, + "loss": 0.7534, + "mean_token_accuracy": 0.7716615200042725, + "num_tokens": 95460919.0, + "step": 28060 + }, + { + "epoch": 0.28172548074992976, + "learning_rate": 0.00014365691115661008, + "loss": 0.7908, + "mean_token_accuracy": 0.7679134845733643, + "num_tokens": 95495023.0, + "step": 28070 + }, + { + "epoch": 0.2818258460797302, + "learning_rate": 0.00014363683809064999, + "loss": 0.7572, + "mean_token_accuracy": 0.7714826464653015, + "num_tokens": 95528809.0, + "step": 28080 + }, + { + "epoch": 0.28192621140953067, + "learning_rate": 0.0001436167650246899, + "loss": 0.7317, + "mean_token_accuracy": 0.7837158501148224, + "num_tokens": 95561932.0, + "step": 28090 + }, + { + "epoch": 0.2820265767393312, + "learning_rate": 0.00014359669195872977, + "loss": 0.7395, + "mean_token_accuracy": 0.7799531280994415, + "num_tokens": 95595828.0, + "step": 28100 + }, + { + "epoch": 0.28212694206913164, + "learning_rate": 0.0001435766188927697, + "loss": 0.7409, + "mean_token_accuracy": 0.7749620318412781, + "num_tokens": 95629727.0, + "step": 28110 + }, + { + "epoch": 0.2822273073989321, + "learning_rate": 0.0001435565458268096, + "loss": 0.7538, + "mean_token_accuracy": 0.7765342891216278, + "num_tokens": 95663466.0, + "step": 28120 + }, + { + "epoch": 0.2823276727287326, + "learning_rate": 0.0001435364727608495, + "loss": 0.7656, + "mean_token_accuracy": 0.7728769242763519, + "num_tokens": 95697934.0, + "step": 28130 + }, + { + "epoch": 0.28242803805853306, + "learning_rate": 0.0001435163996948894, + "loss": 0.774, + "mean_token_accuracy": 0.7711954891681672, + "num_tokens": 95731856.0, + "step": 28140 + }, + { + "epoch": 0.2825284033883335, + "learning_rate": 0.00014349632662892932, + "loss": 0.7526, + "mean_token_accuracy": 0.7742810428142548, + "num_tokens": 95766197.0, + "step": 28150 + }, + { + "epoch": 0.282628768718134, + "learning_rate": 0.0001434762535629692, + "loss": 0.7757, + "mean_token_accuracy": 0.7725955188274384, + "num_tokens": 95800956.0, + "step": 28160 + }, + { + "epoch": 0.2827291340479345, + "learning_rate": 0.00014345618049700913, + "loss": 0.7657, + "mean_token_accuracy": 0.7697532892227172, + "num_tokens": 95834567.0, + "step": 28170 + }, + { + "epoch": 0.28282949937773494, + "learning_rate": 0.00014343610743104902, + "loss": 0.7459, + "mean_token_accuracy": 0.7763911068439484, + "num_tokens": 95869011.0, + "step": 28180 + }, + { + "epoch": 0.28292986470753545, + "learning_rate": 0.00014341603436508892, + "loss": 0.7782, + "mean_token_accuracy": 0.7635152816772461, + "num_tokens": 95903302.0, + "step": 28190 + }, + { + "epoch": 0.2830302300373359, + "learning_rate": 0.00014339596129912883, + "loss": 0.7643, + "mean_token_accuracy": 0.7720817685127258, + "num_tokens": 95936762.0, + "step": 28200 + }, + { + "epoch": 0.28313059536713636, + "learning_rate": 0.00014337588823316874, + "loss": 0.7494, + "mean_token_accuracy": 0.7792890071868896, + "num_tokens": 95971551.0, + "step": 28210 + }, + { + "epoch": 0.2832309606969369, + "learning_rate": 0.00014335581516720865, + "loss": 0.7348, + "mean_token_accuracy": 0.7871302604675293, + "num_tokens": 96006501.0, + "step": 28220 + }, + { + "epoch": 0.28333132602673733, + "learning_rate": 0.00014333574210124856, + "loss": 0.7858, + "mean_token_accuracy": 0.7612696290016174, + "num_tokens": 96040332.0, + "step": 28230 + }, + { + "epoch": 0.2834316913565378, + "learning_rate": 0.00014331566903528847, + "loss": 0.7609, + "mean_token_accuracy": 0.7700464427471161, + "num_tokens": 96075156.0, + "step": 28240 + }, + { + "epoch": 0.2835320566863383, + "learning_rate": 0.00014329559596932835, + "loss": 0.7595, + "mean_token_accuracy": 0.7754449605941772, + "num_tokens": 96108056.0, + "step": 28250 + }, + { + "epoch": 0.28363242201613875, + "learning_rate": 0.00014327552290336828, + "loss": 0.8003, + "mean_token_accuracy": 0.7639413118362427, + "num_tokens": 96142646.0, + "step": 28260 + }, + { + "epoch": 0.2837327873459392, + "learning_rate": 0.00014325544983740816, + "loss": 0.7905, + "mean_token_accuracy": 0.7684699833393097, + "num_tokens": 96176728.0, + "step": 28270 + }, + { + "epoch": 0.2838331526757397, + "learning_rate": 0.00014323537677144807, + "loss": 0.7795, + "mean_token_accuracy": 0.7639523983001709, + "num_tokens": 96212312.0, + "step": 28280 + }, + { + "epoch": 0.2839335180055402, + "learning_rate": 0.00014321530370548798, + "loss": 0.7493, + "mean_token_accuracy": 0.7776244401931762, + "num_tokens": 96246642.0, + "step": 28290 + }, + { + "epoch": 0.28403388333534063, + "learning_rate": 0.0001431952306395279, + "loss": 0.7831, + "mean_token_accuracy": 0.7680910229682922, + "num_tokens": 96279819.0, + "step": 28300 + }, + { + "epoch": 0.2841342486651411, + "learning_rate": 0.0001431751575735678, + "loss": 0.7555, + "mean_token_accuracy": 0.7736326217651367, + "num_tokens": 96313203.0, + "step": 28310 + }, + { + "epoch": 0.2842346139949416, + "learning_rate": 0.0001431550845076077, + "loss": 0.7262, + "mean_token_accuracy": 0.7782347440719605, + "num_tokens": 96347472.0, + "step": 28320 + }, + { + "epoch": 0.28433497932474205, + "learning_rate": 0.00014313501144164761, + "loss": 0.7408, + "mean_token_accuracy": 0.7803001344203949, + "num_tokens": 96381772.0, + "step": 28330 + }, + { + "epoch": 0.2844353446545425, + "learning_rate": 0.0001431149383756875, + "loss": 0.7964, + "mean_token_accuracy": 0.7637731015682221, + "num_tokens": 96415551.0, + "step": 28340 + }, + { + "epoch": 0.284535709984343, + "learning_rate": 0.00014309486530972743, + "loss": 0.786, + "mean_token_accuracy": 0.76785329580307, + "num_tokens": 96448445.0, + "step": 28350 + }, + { + "epoch": 0.2846360753141435, + "learning_rate": 0.0001430747922437673, + "loss": 0.7455, + "mean_token_accuracy": 0.7801205277442932, + "num_tokens": 96483007.0, + "step": 28360 + }, + { + "epoch": 0.28473644064394393, + "learning_rate": 0.00014305471917780722, + "loss": 0.7391, + "mean_token_accuracy": 0.7741820096969605, + "num_tokens": 96517006.0, + "step": 28370 + }, + { + "epoch": 0.28483680597374444, + "learning_rate": 0.00014303464611184713, + "loss": 0.7697, + "mean_token_accuracy": 0.7698454201221466, + "num_tokens": 96550991.0, + "step": 28380 + }, + { + "epoch": 0.2849371713035449, + "learning_rate": 0.00014301457304588704, + "loss": 0.7568, + "mean_token_accuracy": 0.7713454842567444, + "num_tokens": 96585415.0, + "step": 28390 + }, + { + "epoch": 0.28503753663334536, + "learning_rate": 0.00014299449997992692, + "loss": 0.7779, + "mean_token_accuracy": 0.7706193685531616, + "num_tokens": 96620165.0, + "step": 28400 + }, + { + "epoch": 0.28513790196314587, + "learning_rate": 0.00014297442691396686, + "loss": 0.7399, + "mean_token_accuracy": 0.7788212418556213, + "num_tokens": 96653482.0, + "step": 28410 + }, + { + "epoch": 0.2852382672929463, + "learning_rate": 0.00014295435384800676, + "loss": 0.7192, + "mean_token_accuracy": 0.7818759381771088, + "num_tokens": 96687630.0, + "step": 28420 + }, + { + "epoch": 0.2853386326227468, + "learning_rate": 0.00014293428078204664, + "loss": 0.7786, + "mean_token_accuracy": 0.7628415882587433, + "num_tokens": 96722395.0, + "step": 28430 + }, + { + "epoch": 0.2854389979525473, + "learning_rate": 0.00014291420771608658, + "loss": 0.7831, + "mean_token_accuracy": 0.7688349485397339, + "num_tokens": 96756837.0, + "step": 28440 + }, + { + "epoch": 0.28553936328234775, + "learning_rate": 0.00014289413465012646, + "loss": 0.7745, + "mean_token_accuracy": 0.7714909553527832, + "num_tokens": 96791139.0, + "step": 28450 + }, + { + "epoch": 0.2856397286121482, + "learning_rate": 0.00014287406158416637, + "loss": 0.7824, + "mean_token_accuracy": 0.7721018195152283, + "num_tokens": 96825362.0, + "step": 28460 + }, + { + "epoch": 0.2857400939419487, + "learning_rate": 0.00014285398851820628, + "loss": 0.7156, + "mean_token_accuracy": 0.7840331375598908, + "num_tokens": 96859324.0, + "step": 28470 + }, + { + "epoch": 0.28584045927174917, + "learning_rate": 0.0001428339154522462, + "loss": 0.7609, + "mean_token_accuracy": 0.773687344789505, + "num_tokens": 96892927.0, + "step": 28480 + }, + { + "epoch": 0.2859408246015496, + "learning_rate": 0.00014281384238628607, + "loss": 0.7696, + "mean_token_accuracy": 0.7728011250495911, + "num_tokens": 96926712.0, + "step": 28490 + }, + { + "epoch": 0.28604118993135014, + "learning_rate": 0.000142793769320326, + "loss": 0.7451, + "mean_token_accuracy": 0.7809718906879425, + "num_tokens": 96960701.0, + "step": 28500 + }, + { + "epoch": 0.2861415552611506, + "learning_rate": 0.00014277369625436589, + "loss": 0.7744, + "mean_token_accuracy": 0.7736421167850495, + "num_tokens": 96995049.0, + "step": 28510 + }, + { + "epoch": 0.28624192059095105, + "learning_rate": 0.0001427536231884058, + "loss": 0.7453, + "mean_token_accuracy": 0.7792791187763214, + "num_tokens": 97028900.0, + "step": 28520 + }, + { + "epoch": 0.28634228592075156, + "learning_rate": 0.0001427335501224457, + "loss": 0.7736, + "mean_token_accuracy": 0.770075649023056, + "num_tokens": 97062735.0, + "step": 28530 + }, + { + "epoch": 0.286442651250552, + "learning_rate": 0.0001427134770564856, + "loss": 0.7898, + "mean_token_accuracy": 0.7700929760932922, + "num_tokens": 97097572.0, + "step": 28540 + }, + { + "epoch": 0.28654301658035247, + "learning_rate": 0.00014269340399052552, + "loss": 0.7687, + "mean_token_accuracy": 0.7669449508190155, + "num_tokens": 97131601.0, + "step": 28550 + }, + { + "epoch": 0.286643381910153, + "learning_rate": 0.00014267333092456543, + "loss": 0.7908, + "mean_token_accuracy": 0.7685792148113251, + "num_tokens": 97166226.0, + "step": 28560 + }, + { + "epoch": 0.28674374723995344, + "learning_rate": 0.00014265325785860534, + "loss": 0.7688, + "mean_token_accuracy": 0.7743170499801636, + "num_tokens": 97200126.0, + "step": 28570 + }, + { + "epoch": 0.2868441125697539, + "learning_rate": 0.00014263318479264522, + "loss": 0.7925, + "mean_token_accuracy": 0.7632998406887055, + "num_tokens": 97234143.0, + "step": 28580 + }, + { + "epoch": 0.28694447789955435, + "learning_rate": 0.00014261311172668515, + "loss": 0.811, + "mean_token_accuracy": 0.7661246061325073, + "num_tokens": 97268940.0, + "step": 28590 + }, + { + "epoch": 0.28704484322935486, + "learning_rate": 0.00014259303866072503, + "loss": 0.77, + "mean_token_accuracy": 0.7769502639770508, + "num_tokens": 97303733.0, + "step": 28600 + }, + { + "epoch": 0.2871452085591553, + "learning_rate": 0.00014257296559476497, + "loss": 0.7538, + "mean_token_accuracy": 0.7684979557991027, + "num_tokens": 97337759.0, + "step": 28610 + }, + { + "epoch": 0.2872455738889558, + "learning_rate": 0.00014255289252880485, + "loss": 0.7318, + "mean_token_accuracy": 0.7757490456104279, + "num_tokens": 97371306.0, + "step": 28620 + }, + { + "epoch": 0.2873459392187563, + "learning_rate": 0.00014253281946284476, + "loss": 0.7584, + "mean_token_accuracy": 0.7712860763072967, + "num_tokens": 97404592.0, + "step": 28630 + }, + { + "epoch": 0.28744630454855674, + "learning_rate": 0.00014251274639688467, + "loss": 0.7659, + "mean_token_accuracy": 0.7660297691822052, + "num_tokens": 97438537.0, + "step": 28640 + }, + { + "epoch": 0.2875466698783572, + "learning_rate": 0.00014249267333092458, + "loss": 0.7588, + "mean_token_accuracy": 0.7710791051387786, + "num_tokens": 97473717.0, + "step": 28650 + }, + { + "epoch": 0.2876470352081577, + "learning_rate": 0.00014247260026496448, + "loss": 0.7729, + "mean_token_accuracy": 0.7716709733009338, + "num_tokens": 97508297.0, + "step": 28660 + }, + { + "epoch": 0.28774740053795816, + "learning_rate": 0.0001424525271990044, + "loss": 0.7825, + "mean_token_accuracy": 0.7744401037693024, + "num_tokens": 97541722.0, + "step": 28670 + }, + { + "epoch": 0.2878477658677586, + "learning_rate": 0.0001424324541330443, + "loss": 0.7743, + "mean_token_accuracy": 0.7714649736881256, + "num_tokens": 97576189.0, + "step": 28680 + }, + { + "epoch": 0.28794813119755913, + "learning_rate": 0.00014241238106708418, + "loss": 0.7725, + "mean_token_accuracy": 0.7723775625228881, + "num_tokens": 97610364.0, + "step": 28690 + }, + { + "epoch": 0.2880484965273596, + "learning_rate": 0.00014239230800112412, + "loss": 0.7923, + "mean_token_accuracy": 0.7643298923969268, + "num_tokens": 97644164.0, + "step": 28700 + }, + { + "epoch": 0.28814886185716004, + "learning_rate": 0.000142372234935164, + "loss": 0.7296, + "mean_token_accuracy": 0.7828871130943298, + "num_tokens": 97677997.0, + "step": 28710 + }, + { + "epoch": 0.28824922718696055, + "learning_rate": 0.0001423521618692039, + "loss": 0.7556, + "mean_token_accuracy": 0.7748179018497467, + "num_tokens": 97712317.0, + "step": 28720 + }, + { + "epoch": 0.288349592516761, + "learning_rate": 0.00014233208880324382, + "loss": 0.7743, + "mean_token_accuracy": 0.7652441620826721, + "num_tokens": 97746507.0, + "step": 28730 + }, + { + "epoch": 0.28844995784656147, + "learning_rate": 0.00014231201573728372, + "loss": 0.7736, + "mean_token_accuracy": 0.7693808436393738, + "num_tokens": 97780635.0, + "step": 28740 + }, + { + "epoch": 0.288550323176362, + "learning_rate": 0.0001422919426713236, + "loss": 0.7729, + "mean_token_accuracy": 0.7710655629634857, + "num_tokens": 97813917.0, + "step": 28750 + }, + { + "epoch": 0.28865068850616243, + "learning_rate": 0.00014227186960536354, + "loss": 0.7773, + "mean_token_accuracy": 0.7683239877223969, + "num_tokens": 97847757.0, + "step": 28760 + }, + { + "epoch": 0.2887510538359629, + "learning_rate": 0.00014225179653940345, + "loss": 0.7899, + "mean_token_accuracy": 0.7675133168697357, + "num_tokens": 97881711.0, + "step": 28770 + }, + { + "epoch": 0.2888514191657634, + "learning_rate": 0.00014223172347344333, + "loss": 0.737, + "mean_token_accuracy": 0.7838814437389374, + "num_tokens": 97915644.0, + "step": 28780 + }, + { + "epoch": 0.28895178449556386, + "learning_rate": 0.00014221165040748327, + "loss": 0.7471, + "mean_token_accuracy": 0.7744276881217956, + "num_tokens": 97950484.0, + "step": 28790 + }, + { + "epoch": 0.2890521498253643, + "learning_rate": 0.00014219157734152315, + "loss": 0.7635, + "mean_token_accuracy": 0.7697767615318298, + "num_tokens": 97985047.0, + "step": 28800 + }, + { + "epoch": 0.2891525151551648, + "learning_rate": 0.00014217150427556306, + "loss": 0.7477, + "mean_token_accuracy": 0.781688803434372, + "num_tokens": 98019137.0, + "step": 28810 + }, + { + "epoch": 0.2892528804849653, + "learning_rate": 0.00014215143120960297, + "loss": 0.7424, + "mean_token_accuracy": 0.7789560616016388, + "num_tokens": 98053377.0, + "step": 28820 + }, + { + "epoch": 0.28935324581476574, + "learning_rate": 0.00014213135814364287, + "loss": 0.7792, + "mean_token_accuracy": 0.7686887979507446, + "num_tokens": 98087491.0, + "step": 28830 + }, + { + "epoch": 0.28945361114456625, + "learning_rate": 0.00014211128507768276, + "loss": 0.7418, + "mean_token_accuracy": 0.7751915872097015, + "num_tokens": 98121681.0, + "step": 28840 + }, + { + "epoch": 0.2895539764743667, + "learning_rate": 0.0001420912120117227, + "loss": 0.7228, + "mean_token_accuracy": 0.7830632448196411, + "num_tokens": 98155558.0, + "step": 28850 + }, + { + "epoch": 0.28965434180416716, + "learning_rate": 0.00014207113894576257, + "loss": 0.7255, + "mean_token_accuracy": 0.7823713898658753, + "num_tokens": 98189916.0, + "step": 28860 + }, + { + "epoch": 0.2897547071339676, + "learning_rate": 0.00014205106587980248, + "loss": 0.7819, + "mean_token_accuracy": 0.7697534620761871, + "num_tokens": 98223477.0, + "step": 28870 + }, + { + "epoch": 0.2898550724637681, + "learning_rate": 0.0001420309928138424, + "loss": 0.7167, + "mean_token_accuracy": 0.781836849451065, + "num_tokens": 98257219.0, + "step": 28880 + }, + { + "epoch": 0.2899554377935686, + "learning_rate": 0.0001420109197478823, + "loss": 0.7227, + "mean_token_accuracy": 0.7811435163021088, + "num_tokens": 98291835.0, + "step": 28890 + }, + { + "epoch": 0.29005580312336904, + "learning_rate": 0.0001419908466819222, + "loss": 0.7484, + "mean_token_accuracy": 0.7724690556526184, + "num_tokens": 98325991.0, + "step": 28900 + }, + { + "epoch": 0.29015616845316955, + "learning_rate": 0.00014197077361596211, + "loss": 0.7015, + "mean_token_accuracy": 0.7852222204208374, + "num_tokens": 98360498.0, + "step": 28910 + }, + { + "epoch": 0.29025653378297, + "learning_rate": 0.00014195070055000202, + "loss": 0.7659, + "mean_token_accuracy": 0.7725250482559204, + "num_tokens": 98395355.0, + "step": 28920 + }, + { + "epoch": 0.29035689911277046, + "learning_rate": 0.0001419306274840419, + "loss": 0.7502, + "mean_token_accuracy": 0.781274002790451, + "num_tokens": 98428841.0, + "step": 28930 + }, + { + "epoch": 0.290457264442571, + "learning_rate": 0.00014191055441808184, + "loss": 0.7604, + "mean_token_accuracy": 0.7756985306739808, + "num_tokens": 98462247.0, + "step": 28940 + }, + { + "epoch": 0.29055762977237143, + "learning_rate": 0.00014189048135212172, + "loss": 0.7858, + "mean_token_accuracy": 0.7663555085659027, + "num_tokens": 98496044.0, + "step": 28950 + }, + { + "epoch": 0.2906579951021719, + "learning_rate": 0.00014187040828616163, + "loss": 0.7511, + "mean_token_accuracy": 0.7796390414237976, + "num_tokens": 98529092.0, + "step": 28960 + }, + { + "epoch": 0.2907583604319724, + "learning_rate": 0.00014185033522020154, + "loss": 0.7276, + "mean_token_accuracy": 0.7819804608821869, + "num_tokens": 98563656.0, + "step": 28970 + }, + { + "epoch": 0.29085872576177285, + "learning_rate": 0.00014183026215424145, + "loss": 0.78, + "mean_token_accuracy": 0.7645665585994721, + "num_tokens": 98596523.0, + "step": 28980 + }, + { + "epoch": 0.2909590910915733, + "learning_rate": 0.00014181018908828135, + "loss": 0.7637, + "mean_token_accuracy": 0.772081583738327, + "num_tokens": 98630427.0, + "step": 28990 + }, + { + "epoch": 0.2910594564213738, + "learning_rate": 0.00014179011602232126, + "loss": 0.7434, + "mean_token_accuracy": 0.7764184951782227, + "num_tokens": 98663817.0, + "step": 29000 + }, + { + "epoch": 0.2911598217511743, + "learning_rate": 0.00014177004295636117, + "loss": 0.7724, + "mean_token_accuracy": 0.7713199734687806, + "num_tokens": 98697541.0, + "step": 29010 + }, + { + "epoch": 0.29126018708097473, + "learning_rate": 0.00014174996989040105, + "loss": 0.7531, + "mean_token_accuracy": 0.7737714588642121, + "num_tokens": 98731366.0, + "step": 29020 + }, + { + "epoch": 0.29136055241077524, + "learning_rate": 0.000141729896824441, + "loss": 0.728, + "mean_token_accuracy": 0.7822924375534057, + "num_tokens": 98765363.0, + "step": 29030 + }, + { + "epoch": 0.2914609177405757, + "learning_rate": 0.00014170982375848087, + "loss": 0.7612, + "mean_token_accuracy": 0.7754798293113708, + "num_tokens": 98799259.0, + "step": 29040 + }, + { + "epoch": 0.29156128307037615, + "learning_rate": 0.00014168975069252078, + "loss": 0.7352, + "mean_token_accuracy": 0.7805355131626129, + "num_tokens": 98832864.0, + "step": 29050 + }, + { + "epoch": 0.29166164840017667, + "learning_rate": 0.0001416696776265607, + "loss": 0.762, + "mean_token_accuracy": 0.7746479451656342, + "num_tokens": 98867332.0, + "step": 29060 + }, + { + "epoch": 0.2917620137299771, + "learning_rate": 0.0001416496045606006, + "loss": 0.797, + "mean_token_accuracy": 0.7642375528812408, + "num_tokens": 98901255.0, + "step": 29070 + }, + { + "epoch": 0.2918623790597776, + "learning_rate": 0.00014162953149464048, + "loss": 0.708, + "mean_token_accuracy": 0.7842754781246185, + "num_tokens": 98935116.0, + "step": 29080 + }, + { + "epoch": 0.2919627443895781, + "learning_rate": 0.0001416094584286804, + "loss": 0.7592, + "mean_token_accuracy": 0.7736884295940399, + "num_tokens": 98969475.0, + "step": 29090 + }, + { + "epoch": 0.29206310971937854, + "learning_rate": 0.0001415893853627203, + "loss": 0.7473, + "mean_token_accuracy": 0.7742801606655121, + "num_tokens": 99003262.0, + "step": 29100 + }, + { + "epoch": 0.292163475049179, + "learning_rate": 0.0001415693122967602, + "loss": 0.7715, + "mean_token_accuracy": 0.7666668891906738, + "num_tokens": 99037582.0, + "step": 29110 + }, + { + "epoch": 0.2922638403789795, + "learning_rate": 0.00014154923923080014, + "loss": 0.7807, + "mean_token_accuracy": 0.770354300737381, + "num_tokens": 99071947.0, + "step": 29120 + }, + { + "epoch": 0.29236420570877997, + "learning_rate": 0.00014152916616484002, + "loss": 0.7485, + "mean_token_accuracy": 0.7715291023254395, + "num_tokens": 99106290.0, + "step": 29130 + }, + { + "epoch": 0.2924645710385804, + "learning_rate": 0.00014150909309887993, + "loss": 0.7623, + "mean_token_accuracy": 0.7719914376735687, + "num_tokens": 99141141.0, + "step": 29140 + }, + { + "epoch": 0.2925649363683809, + "learning_rate": 0.00014148902003291984, + "loss": 0.7776, + "mean_token_accuracy": 0.7699817597866059, + "num_tokens": 99175816.0, + "step": 29150 + }, + { + "epoch": 0.2926653016981814, + "learning_rate": 0.00014146894696695974, + "loss": 0.7173, + "mean_token_accuracy": 0.7794719636440277, + "num_tokens": 99210735.0, + "step": 29160 + }, + { + "epoch": 0.29276566702798185, + "learning_rate": 0.00014144887390099963, + "loss": 0.7402, + "mean_token_accuracy": 0.7780381441116333, + "num_tokens": 99244651.0, + "step": 29170 + }, + { + "epoch": 0.2928660323577823, + "learning_rate": 0.00014142880083503956, + "loss": 0.7765, + "mean_token_accuracy": 0.7682926177978515, + "num_tokens": 99278357.0, + "step": 29180 + }, + { + "epoch": 0.2929663976875828, + "learning_rate": 0.00014140872776907944, + "loss": 0.7646, + "mean_token_accuracy": 0.7708244085311889, + "num_tokens": 99311832.0, + "step": 29190 + }, + { + "epoch": 0.29306676301738327, + "learning_rate": 0.00014138865470311938, + "loss": 0.7416, + "mean_token_accuracy": 0.7788143336772919, + "num_tokens": 99346131.0, + "step": 29200 + }, + { + "epoch": 0.2931671283471837, + "learning_rate": 0.00014136858163715926, + "loss": 0.7569, + "mean_token_accuracy": 0.7704828321933747, + "num_tokens": 99380558.0, + "step": 29210 + }, + { + "epoch": 0.29326749367698424, + "learning_rate": 0.00014134850857119917, + "loss": 0.755, + "mean_token_accuracy": 0.7756388902664184, + "num_tokens": 99414723.0, + "step": 29220 + }, + { + "epoch": 0.2933678590067847, + "learning_rate": 0.00014132843550523908, + "loss": 0.7468, + "mean_token_accuracy": 0.7792263329029083, + "num_tokens": 99448669.0, + "step": 29230 + }, + { + "epoch": 0.29346822433658515, + "learning_rate": 0.00014130836243927898, + "loss": 0.7497, + "mean_token_accuracy": 0.7784649908542634, + "num_tokens": 99482972.0, + "step": 29240 + }, + { + "epoch": 0.29356858966638566, + "learning_rate": 0.0001412882893733189, + "loss": 0.7427, + "mean_token_accuracy": 0.7733777105808258, + "num_tokens": 99517517.0, + "step": 29250 + }, + { + "epoch": 0.2936689549961861, + "learning_rate": 0.0001412682163073588, + "loss": 0.7199, + "mean_token_accuracy": 0.7836706876754761, + "num_tokens": 99552197.0, + "step": 29260 + }, + { + "epoch": 0.29376932032598657, + "learning_rate": 0.0001412481432413987, + "loss": 0.7555, + "mean_token_accuracy": 0.7785599768161774, + "num_tokens": 99585933.0, + "step": 29270 + }, + { + "epoch": 0.2938696856557871, + "learning_rate": 0.0001412280701754386, + "loss": 0.7682, + "mean_token_accuracy": 0.7654083967208862, + "num_tokens": 99619927.0, + "step": 29280 + }, + { + "epoch": 0.29397005098558754, + "learning_rate": 0.00014120799710947853, + "loss": 0.762, + "mean_token_accuracy": 0.769352251291275, + "num_tokens": 99654333.0, + "step": 29290 + }, + { + "epoch": 0.294070416315388, + "learning_rate": 0.0001411879240435184, + "loss": 0.7675, + "mean_token_accuracy": 0.7726259291172027, + "num_tokens": 99688347.0, + "step": 29300 + }, + { + "epoch": 0.2941707816451885, + "learning_rate": 0.00014116785097755832, + "loss": 0.7247, + "mean_token_accuracy": 0.7817895948886872, + "num_tokens": 99722710.0, + "step": 29310 + }, + { + "epoch": 0.29427114697498896, + "learning_rate": 0.00014114777791159822, + "loss": 0.7616, + "mean_token_accuracy": 0.7785114288330078, + "num_tokens": 99756516.0, + "step": 29320 + }, + { + "epoch": 0.2943715123047894, + "learning_rate": 0.00014112770484563813, + "loss": 0.7895, + "mean_token_accuracy": 0.7688580214977264, + "num_tokens": 99790753.0, + "step": 29330 + }, + { + "epoch": 0.29447187763458993, + "learning_rate": 0.00014110763177967804, + "loss": 0.7288, + "mean_token_accuracy": 0.7836663603782654, + "num_tokens": 99824741.0, + "step": 29340 + }, + { + "epoch": 0.2945722429643904, + "learning_rate": 0.00014108755871371795, + "loss": 0.7933, + "mean_token_accuracy": 0.7669318795204163, + "num_tokens": 99858920.0, + "step": 29350 + }, + { + "epoch": 0.29467260829419084, + "learning_rate": 0.00014106748564775786, + "loss": 0.7384, + "mean_token_accuracy": 0.7750026464462281, + "num_tokens": 99892374.0, + "step": 29360 + }, + { + "epoch": 0.29477297362399135, + "learning_rate": 0.00014104741258179774, + "loss": 0.7601, + "mean_token_accuracy": 0.7714162588119506, + "num_tokens": 99927242.0, + "step": 29370 + }, + { + "epoch": 0.2948733389537918, + "learning_rate": 0.00014102733951583768, + "loss": 0.7441, + "mean_token_accuracy": 0.7752436697483063, + "num_tokens": 99962405.0, + "step": 29380 + }, + { + "epoch": 0.29497370428359226, + "learning_rate": 0.00014100726644987756, + "loss": 0.7622, + "mean_token_accuracy": 0.7726584315299988, + "num_tokens": 99995965.0, + "step": 29390 + }, + { + "epoch": 0.2950740696133928, + "learning_rate": 0.00014098719338391746, + "loss": 0.7422, + "mean_token_accuracy": 0.7753499388694763, + "num_tokens": 100029884.0, + "step": 29400 + }, + { + "epoch": 0.29517443494319323, + "learning_rate": 0.00014096712031795737, + "loss": 0.7576, + "mean_token_accuracy": 0.7731671333312988, + "num_tokens": 100064293.0, + "step": 29410 + }, + { + "epoch": 0.2952748002729937, + "learning_rate": 0.00014094704725199728, + "loss": 0.7929, + "mean_token_accuracy": 0.769537627696991, + "num_tokens": 100098475.0, + "step": 29420 + }, + { + "epoch": 0.2953751656027942, + "learning_rate": 0.00014092697418603716, + "loss": 0.7344, + "mean_token_accuracy": 0.7775164842605591, + "num_tokens": 100133249.0, + "step": 29430 + }, + { + "epoch": 0.29547553093259465, + "learning_rate": 0.0001409069011200771, + "loss": 0.7214, + "mean_token_accuracy": 0.779714035987854, + "num_tokens": 100167512.0, + "step": 29440 + }, + { + "epoch": 0.2955758962623951, + "learning_rate": 0.00014088682805411698, + "loss": 0.7678, + "mean_token_accuracy": 0.7712717652320862, + "num_tokens": 100202601.0, + "step": 29450 + }, + { + "epoch": 0.29567626159219557, + "learning_rate": 0.0001408667549881569, + "loss": 0.7705, + "mean_token_accuracy": 0.7723312854766846, + "num_tokens": 100236753.0, + "step": 29460 + }, + { + "epoch": 0.2957766269219961, + "learning_rate": 0.0001408466819221968, + "loss": 0.7199, + "mean_token_accuracy": 0.7800745785236358, + "num_tokens": 100271362.0, + "step": 29470 + }, + { + "epoch": 0.29587699225179653, + "learning_rate": 0.0001408266088562367, + "loss": 0.7353, + "mean_token_accuracy": 0.77441685795784, + "num_tokens": 100305577.0, + "step": 29480 + }, + { + "epoch": 0.295977357581597, + "learning_rate": 0.00014080653579027661, + "loss": 0.7574, + "mean_token_accuracy": 0.7717891931533813, + "num_tokens": 100339939.0, + "step": 29490 + }, + { + "epoch": 0.2960777229113975, + "learning_rate": 0.00014078646272431652, + "loss": 0.7527, + "mean_token_accuracy": 0.7759120404720307, + "num_tokens": 100374633.0, + "step": 29500 + }, + { + "epoch": 0.29617808824119796, + "learning_rate": 0.00014076638965835643, + "loss": 0.7529, + "mean_token_accuracy": 0.7745722115039826, + "num_tokens": 100409806.0, + "step": 29510 + }, + { + "epoch": 0.2962784535709984, + "learning_rate": 0.0001407463165923963, + "loss": 0.6996, + "mean_token_accuracy": 0.7888730943202973, + "num_tokens": 100443260.0, + "step": 29520 + }, + { + "epoch": 0.2963788189007989, + "learning_rate": 0.00014072624352643625, + "loss": 0.6948, + "mean_token_accuracy": 0.7858321964740753, + "num_tokens": 100477022.0, + "step": 29530 + }, + { + "epoch": 0.2964791842305994, + "learning_rate": 0.00014070617046047613, + "loss": 0.759, + "mean_token_accuracy": 0.771923303604126, + "num_tokens": 100511138.0, + "step": 29540 + }, + { + "epoch": 0.29657954956039984, + "learning_rate": 0.00014068609739451604, + "loss": 0.7333, + "mean_token_accuracy": 0.7735685169696808, + "num_tokens": 100545533.0, + "step": 29550 + }, + { + "epoch": 0.29667991489020035, + "learning_rate": 0.00014066602432855595, + "loss": 0.7196, + "mean_token_accuracy": 0.7803890228271484, + "num_tokens": 100579346.0, + "step": 29560 + }, + { + "epoch": 0.2967802802200008, + "learning_rate": 0.00014064595126259585, + "loss": 0.7514, + "mean_token_accuracy": 0.7723907589912414, + "num_tokens": 100613387.0, + "step": 29570 + }, + { + "epoch": 0.29688064554980126, + "learning_rate": 0.00014062587819663576, + "loss": 0.7193, + "mean_token_accuracy": 0.7758615255355835, + "num_tokens": 100647040.0, + "step": 29580 + }, + { + "epoch": 0.29698101087960177, + "learning_rate": 0.00014060580513067567, + "loss": 0.7482, + "mean_token_accuracy": 0.7730087757110595, + "num_tokens": 100680660.0, + "step": 29590 + }, + { + "epoch": 0.2970813762094022, + "learning_rate": 0.00014058573206471558, + "loss": 0.7461, + "mean_token_accuracy": 0.7728002905845642, + "num_tokens": 100714616.0, + "step": 29600 + }, + { + "epoch": 0.2971817415392027, + "learning_rate": 0.00014056565899875546, + "loss": 0.7692, + "mean_token_accuracy": 0.7765908062458038, + "num_tokens": 100748952.0, + "step": 29610 + }, + { + "epoch": 0.2972821068690032, + "learning_rate": 0.0001405455859327954, + "loss": 0.7341, + "mean_token_accuracy": 0.7805267155170441, + "num_tokens": 100782497.0, + "step": 29620 + }, + { + "epoch": 0.29738247219880365, + "learning_rate": 0.00014052551286683528, + "loss": 0.7531, + "mean_token_accuracy": 0.7727090954780579, + "num_tokens": 100816702.0, + "step": 29630 + }, + { + "epoch": 0.2974828375286041, + "learning_rate": 0.00014050543980087519, + "loss": 0.7204, + "mean_token_accuracy": 0.7859593152999877, + "num_tokens": 100850951.0, + "step": 29640 + }, + { + "epoch": 0.2975832028584046, + "learning_rate": 0.0001404853667349151, + "loss": 0.7352, + "mean_token_accuracy": 0.7814213275909424, + "num_tokens": 100885330.0, + "step": 29650 + }, + { + "epoch": 0.29768356818820507, + "learning_rate": 0.000140465293668955, + "loss": 0.7652, + "mean_token_accuracy": 0.7715207993984222, + "num_tokens": 100919542.0, + "step": 29660 + }, + { + "epoch": 0.29778393351800553, + "learning_rate": 0.0001404452206029949, + "loss": 0.7558, + "mean_token_accuracy": 0.772058779001236, + "num_tokens": 100953203.0, + "step": 29670 + }, + { + "epoch": 0.29788429884780604, + "learning_rate": 0.00014042514753703482, + "loss": 0.7221, + "mean_token_accuracy": 0.781199312210083, + "num_tokens": 100987335.0, + "step": 29680 + }, + { + "epoch": 0.2979846641776065, + "learning_rate": 0.00014040507447107473, + "loss": 0.7492, + "mean_token_accuracy": 0.7747159957885742, + "num_tokens": 101022161.0, + "step": 29690 + }, + { + "epoch": 0.29808502950740695, + "learning_rate": 0.0001403850014051146, + "loss": 0.7362, + "mean_token_accuracy": 0.7758022427558899, + "num_tokens": 101056388.0, + "step": 29700 + }, + { + "epoch": 0.29818539483720746, + "learning_rate": 0.00014036492833915455, + "loss": 0.7661, + "mean_token_accuracy": 0.7724496126174927, + "num_tokens": 101090576.0, + "step": 29710 + }, + { + "epoch": 0.2982857601670079, + "learning_rate": 0.00014034485527319443, + "loss": 0.7649, + "mean_token_accuracy": 0.7721573054790497, + "num_tokens": 101124962.0, + "step": 29720 + }, + { + "epoch": 0.2983861254968084, + "learning_rate": 0.00014032478220723433, + "loss": 0.7833, + "mean_token_accuracy": 0.7669749796390534, + "num_tokens": 101159222.0, + "step": 29730 + }, + { + "epoch": 0.29848649082660883, + "learning_rate": 0.00014030470914127424, + "loss": 0.7649, + "mean_token_accuracy": 0.7715265154838562, + "num_tokens": 101192782.0, + "step": 29740 + }, + { + "epoch": 0.29858685615640934, + "learning_rate": 0.00014028463607531415, + "loss": 0.7386, + "mean_token_accuracy": 0.7763209939002991, + "num_tokens": 101227386.0, + "step": 29750 + }, + { + "epoch": 0.2986872214862098, + "learning_rate": 0.00014026456300935406, + "loss": 0.7645, + "mean_token_accuracy": 0.7729579210281372, + "num_tokens": 101261496.0, + "step": 29760 + }, + { + "epoch": 0.29878758681601025, + "learning_rate": 0.00014024448994339397, + "loss": 0.7807, + "mean_token_accuracy": 0.7649962842464447, + "num_tokens": 101294541.0, + "step": 29770 + }, + { + "epoch": 0.29888795214581076, + "learning_rate": 0.00014022441687743385, + "loss": 0.7569, + "mean_token_accuracy": 0.7742062866687774, + "num_tokens": 101328027.0, + "step": 29780 + }, + { + "epoch": 0.2989883174756112, + "learning_rate": 0.00014020434381147379, + "loss": 0.7641, + "mean_token_accuracy": 0.7726384162902832, + "num_tokens": 101362470.0, + "step": 29790 + }, + { + "epoch": 0.2990886828054117, + "learning_rate": 0.00014018427074551367, + "loss": 0.7501, + "mean_token_accuracy": 0.7763361215591431, + "num_tokens": 101397922.0, + "step": 29800 + }, + { + "epoch": 0.2991890481352122, + "learning_rate": 0.00014016419767955358, + "loss": 0.744, + "mean_token_accuracy": 0.77735715508461, + "num_tokens": 101432261.0, + "step": 29810 + }, + { + "epoch": 0.29928941346501264, + "learning_rate": 0.00014014412461359348, + "loss": 0.7689, + "mean_token_accuracy": 0.768517005443573, + "num_tokens": 101466295.0, + "step": 29820 + }, + { + "epoch": 0.2993897787948131, + "learning_rate": 0.0001401240515476334, + "loss": 0.7406, + "mean_token_accuracy": 0.7753639459609986, + "num_tokens": 101499988.0, + "step": 29830 + }, + { + "epoch": 0.2994901441246136, + "learning_rate": 0.0001401039784816733, + "loss": 0.7789, + "mean_token_accuracy": 0.7696060717105866, + "num_tokens": 101534045.0, + "step": 29840 + }, + { + "epoch": 0.29959050945441407, + "learning_rate": 0.0001400839054157132, + "loss": 0.7292, + "mean_token_accuracy": 0.783731073141098, + "num_tokens": 101568206.0, + "step": 29850 + }, + { + "epoch": 0.2996908747842145, + "learning_rate": 0.00014006383234975312, + "loss": 0.762, + "mean_token_accuracy": 0.7774661183357239, + "num_tokens": 101602848.0, + "step": 29860 + }, + { + "epoch": 0.29979124011401503, + "learning_rate": 0.000140043759283793, + "loss": 0.7366, + "mean_token_accuracy": 0.7775753319263459, + "num_tokens": 101637417.0, + "step": 29870 + }, + { + "epoch": 0.2998916054438155, + "learning_rate": 0.00014002368621783293, + "loss": 0.7471, + "mean_token_accuracy": 0.7773273289203644, + "num_tokens": 101671036.0, + "step": 29880 + }, + { + "epoch": 0.29999197077361595, + "learning_rate": 0.00014000361315187282, + "loss": 0.761, + "mean_token_accuracy": 0.7722024261951447, + "num_tokens": 101704395.0, + "step": 29890 + }, + { + "epoch": 0.30009233610341646, + "learning_rate": 0.00013998354008591272, + "loss": 0.7846, + "mean_token_accuracy": 0.7594796240329742, + "num_tokens": 101739177.0, + "step": 29900 + }, + { + "epoch": 0.3001927014332169, + "learning_rate": 0.00013996346701995263, + "loss": 0.7551, + "mean_token_accuracy": 0.7724564135074615, + "num_tokens": 101773232.0, + "step": 29910 + }, + { + "epoch": 0.30029306676301737, + "learning_rate": 0.00013994339395399254, + "loss": 0.7756, + "mean_token_accuracy": 0.7685364961624146, + "num_tokens": 101806573.0, + "step": 29920 + }, + { + "epoch": 0.3003934320928179, + "learning_rate": 0.00013992332088803245, + "loss": 0.7848, + "mean_token_accuracy": 0.7614635407924653, + "num_tokens": 101840236.0, + "step": 29930 + }, + { + "epoch": 0.30049379742261834, + "learning_rate": 0.00013990324782207236, + "loss": 0.7807, + "mean_token_accuracy": 0.767466914653778, + "num_tokens": 101874586.0, + "step": 29940 + }, + { + "epoch": 0.3005941627524188, + "learning_rate": 0.00013988317475611227, + "loss": 0.7185, + "mean_token_accuracy": 0.7807386338710784, + "num_tokens": 101908606.0, + "step": 29950 + }, + { + "epoch": 0.3006945280822193, + "learning_rate": 0.00013986310169015215, + "loss": 0.76, + "mean_token_accuracy": 0.7769132673740387, + "num_tokens": 101942444.0, + "step": 29960 + }, + { + "epoch": 0.30079489341201976, + "learning_rate": 0.00013984302862419208, + "loss": 0.7468, + "mean_token_accuracy": 0.771494460105896, + "num_tokens": 101976158.0, + "step": 29970 + }, + { + "epoch": 0.3008952587418202, + "learning_rate": 0.00013982295555823196, + "loss": 0.7816, + "mean_token_accuracy": 0.7671621084213257, + "num_tokens": 102009545.0, + "step": 29980 + }, + { + "epoch": 0.3009956240716207, + "learning_rate": 0.00013980288249227187, + "loss": 0.7547, + "mean_token_accuracy": 0.7769341826438904, + "num_tokens": 102044039.0, + "step": 29990 + }, + { + "epoch": 0.3010959894014212, + "learning_rate": 0.00013978280942631178, + "loss": 0.7284, + "mean_token_accuracy": 0.779939603805542, + "num_tokens": 102077900.0, + "step": 30000 + }, + { + "epoch": 0.30119635473122164, + "learning_rate": 0.0001397627363603517, + "loss": 0.7558, + "mean_token_accuracy": 0.7702864706516266, + "num_tokens": 102112192.0, + "step": 30010 + }, + { + "epoch": 0.3012967200610221, + "learning_rate": 0.0001397426632943916, + "loss": 0.742, + "mean_token_accuracy": 0.7804159045219421, + "num_tokens": 102145289.0, + "step": 30020 + }, + { + "epoch": 0.3013970853908226, + "learning_rate": 0.0001397225902284315, + "loss": 0.7393, + "mean_token_accuracy": 0.7782248795032501, + "num_tokens": 102179561.0, + "step": 30030 + }, + { + "epoch": 0.30149745072062306, + "learning_rate": 0.00013970251716247142, + "loss": 0.7637, + "mean_token_accuracy": 0.7731903374195099, + "num_tokens": 102214258.0, + "step": 30040 + }, + { + "epoch": 0.3015978160504235, + "learning_rate": 0.0001396824440965113, + "loss": 0.7254, + "mean_token_accuracy": 0.7820830702781677, + "num_tokens": 102248720.0, + "step": 30050 + }, + { + "epoch": 0.30169818138022403, + "learning_rate": 0.00013966237103055123, + "loss": 0.7759, + "mean_token_accuracy": 0.7698108375072479, + "num_tokens": 102282978.0, + "step": 30060 + }, + { + "epoch": 0.3017985467100245, + "learning_rate": 0.0001396422979645911, + "loss": 0.7759, + "mean_token_accuracy": 0.7666373908519745, + "num_tokens": 102316762.0, + "step": 30070 + }, + { + "epoch": 0.30189891203982494, + "learning_rate": 0.00013962222489863102, + "loss": 0.7706, + "mean_token_accuracy": 0.7717369139194489, + "num_tokens": 102350881.0, + "step": 30080 + }, + { + "epoch": 0.30199927736962545, + "learning_rate": 0.00013960215183267093, + "loss": 0.7883, + "mean_token_accuracy": 0.7646639883518219, + "num_tokens": 102385177.0, + "step": 30090 + }, + { + "epoch": 0.3020996426994259, + "learning_rate": 0.00013958207876671084, + "loss": 0.729, + "mean_token_accuracy": 0.7823030114173889, + "num_tokens": 102418790.0, + "step": 30100 + }, + { + "epoch": 0.30220000802922636, + "learning_rate": 0.00013956200570075072, + "loss": 0.7357, + "mean_token_accuracy": 0.7797044217586517, + "num_tokens": 102453132.0, + "step": 30110 + }, + { + "epoch": 0.3023003733590269, + "learning_rate": 0.00013954193263479066, + "loss": 0.8085, + "mean_token_accuracy": 0.7604319095611572, + "num_tokens": 102486414.0, + "step": 30120 + }, + { + "epoch": 0.30240073868882733, + "learning_rate": 0.00013952185956883054, + "loss": 0.7597, + "mean_token_accuracy": 0.7722374677658081, + "num_tokens": 102520116.0, + "step": 30130 + }, + { + "epoch": 0.3025011040186278, + "learning_rate": 0.00013950178650287045, + "loss": 0.7408, + "mean_token_accuracy": 0.7763288021087646, + "num_tokens": 102554004.0, + "step": 30140 + }, + { + "epoch": 0.3026014693484283, + "learning_rate": 0.00013948171343691035, + "loss": 0.8025, + "mean_token_accuracy": 0.7670863509178162, + "num_tokens": 102588513.0, + "step": 30150 + }, + { + "epoch": 0.30270183467822875, + "learning_rate": 0.00013946164037095026, + "loss": 0.7587, + "mean_token_accuracy": 0.7740037620067597, + "num_tokens": 102623041.0, + "step": 30160 + }, + { + "epoch": 0.3028022000080292, + "learning_rate": 0.00013944156730499017, + "loss": 0.7721, + "mean_token_accuracy": 0.7665294706821442, + "num_tokens": 102657413.0, + "step": 30170 + }, + { + "epoch": 0.3029025653378297, + "learning_rate": 0.00013942149423903008, + "loss": 0.7335, + "mean_token_accuracy": 0.7742194294929504, + "num_tokens": 102691460.0, + "step": 30180 + }, + { + "epoch": 0.3030029306676302, + "learning_rate": 0.00013940142117307, + "loss": 0.7599, + "mean_token_accuracy": 0.7743681907653809, + "num_tokens": 102725438.0, + "step": 30190 + }, + { + "epoch": 0.30310329599743063, + "learning_rate": 0.00013938134810710987, + "loss": 0.767, + "mean_token_accuracy": 0.7699396669864654, + "num_tokens": 102760347.0, + "step": 30200 + }, + { + "epoch": 0.30320366132723114, + "learning_rate": 0.0001393612750411498, + "loss": 0.7362, + "mean_token_accuracy": 0.7853947639465332, + "num_tokens": 102795404.0, + "step": 30210 + }, + { + "epoch": 0.3033040266570316, + "learning_rate": 0.00013934120197518969, + "loss": 0.743, + "mean_token_accuracy": 0.7780166029930115, + "num_tokens": 102828487.0, + "step": 30220 + }, + { + "epoch": 0.30340439198683206, + "learning_rate": 0.0001393211289092296, + "loss": 0.7794, + "mean_token_accuracy": 0.7706028580665588, + "num_tokens": 102863431.0, + "step": 30230 + }, + { + "epoch": 0.30350475731663257, + "learning_rate": 0.0001393010558432695, + "loss": 0.776, + "mean_token_accuracy": 0.7714719414710999, + "num_tokens": 102898248.0, + "step": 30240 + }, + { + "epoch": 0.303605122646433, + "learning_rate": 0.0001392809827773094, + "loss": 0.7756, + "mean_token_accuracy": 0.7676347851753235, + "num_tokens": 102932695.0, + "step": 30250 + }, + { + "epoch": 0.3037054879762335, + "learning_rate": 0.00013926090971134932, + "loss": 0.7732, + "mean_token_accuracy": 0.7656772911548615, + "num_tokens": 102966717.0, + "step": 30260 + }, + { + "epoch": 0.303805853306034, + "learning_rate": 0.00013924083664538923, + "loss": 0.826, + "mean_token_accuracy": 0.7555188834667206, + "num_tokens": 102999671.0, + "step": 30270 + }, + { + "epoch": 0.30390621863583445, + "learning_rate": 0.00013922076357942914, + "loss": 0.7552, + "mean_token_accuracy": 0.7759094893932342, + "num_tokens": 103033895.0, + "step": 30280 + }, + { + "epoch": 0.3040065839656349, + "learning_rate": 0.00013920069051346902, + "loss": 0.7419, + "mean_token_accuracy": 0.775572144985199, + "num_tokens": 103067820.0, + "step": 30290 + }, + { + "epoch": 0.30410694929543536, + "learning_rate": 0.00013918061744750895, + "loss": 0.7392, + "mean_token_accuracy": 0.7811022341251374, + "num_tokens": 103102289.0, + "step": 30300 + }, + { + "epoch": 0.30420731462523587, + "learning_rate": 0.00013916054438154883, + "loss": 0.7273, + "mean_token_accuracy": 0.7775943994522094, + "num_tokens": 103136433.0, + "step": 30310 + }, + { + "epoch": 0.3043076799550363, + "learning_rate": 0.00013914047131558877, + "loss": 0.733, + "mean_token_accuracy": 0.7790721535682679, + "num_tokens": 103170299.0, + "step": 30320 + }, + { + "epoch": 0.3044080452848368, + "learning_rate": 0.00013912039824962865, + "loss": 0.7854, + "mean_token_accuracy": 0.7666976571083068, + "num_tokens": 103204040.0, + "step": 30330 + }, + { + "epoch": 0.3045084106146373, + "learning_rate": 0.00013910032518366856, + "loss": 0.7398, + "mean_token_accuracy": 0.7777034878730774, + "num_tokens": 103237977.0, + "step": 30340 + }, + { + "epoch": 0.30460877594443775, + "learning_rate": 0.00013908025211770847, + "loss": 0.7711, + "mean_token_accuracy": 0.7719676792621613, + "num_tokens": 103272465.0, + "step": 30350 + }, + { + "epoch": 0.3047091412742382, + "learning_rate": 0.00013906017905174838, + "loss": 0.7599, + "mean_token_accuracy": 0.7756696701049804, + "num_tokens": 103306302.0, + "step": 30360 + }, + { + "epoch": 0.3048095066040387, + "learning_rate": 0.00013904010598578828, + "loss": 0.7459, + "mean_token_accuracy": 0.7794725835323334, + "num_tokens": 103340295.0, + "step": 30370 + }, + { + "epoch": 0.30490987193383917, + "learning_rate": 0.0001390200329198282, + "loss": 0.7594, + "mean_token_accuracy": 0.7782514810562133, + "num_tokens": 103374872.0, + "step": 30380 + }, + { + "epoch": 0.3050102372636396, + "learning_rate": 0.0001389999598538681, + "loss": 0.7999, + "mean_token_accuracy": 0.7694885909557343, + "num_tokens": 103408841.0, + "step": 30390 + }, + { + "epoch": 0.30511060259344014, + "learning_rate": 0.00013897988678790798, + "loss": 0.7787, + "mean_token_accuracy": 0.7691689252853393, + "num_tokens": 103443503.0, + "step": 30400 + }, + { + "epoch": 0.3052109679232406, + "learning_rate": 0.00013895981372194792, + "loss": 0.746, + "mean_token_accuracy": 0.7696506142616272, + "num_tokens": 103477779.0, + "step": 30410 + }, + { + "epoch": 0.30531133325304105, + "learning_rate": 0.0001389397406559878, + "loss": 0.7598, + "mean_token_accuracy": 0.7774660527706146, + "num_tokens": 103511407.0, + "step": 30420 + }, + { + "epoch": 0.30541169858284156, + "learning_rate": 0.0001389196675900277, + "loss": 0.7576, + "mean_token_accuracy": 0.7759681701660156, + "num_tokens": 103545543.0, + "step": 30430 + }, + { + "epoch": 0.305512063912642, + "learning_rate": 0.00013889959452406762, + "loss": 0.7486, + "mean_token_accuracy": 0.7778256833553314, + "num_tokens": 103579468.0, + "step": 30440 + }, + { + "epoch": 0.3056124292424425, + "learning_rate": 0.00013887952145810753, + "loss": 0.7532, + "mean_token_accuracy": 0.7719829618930817, + "num_tokens": 103613942.0, + "step": 30450 + }, + { + "epoch": 0.305712794572243, + "learning_rate": 0.0001388594483921474, + "loss": 0.7545, + "mean_token_accuracy": 0.7741083145141602, + "num_tokens": 103647817.0, + "step": 30460 + }, + { + "epoch": 0.30581315990204344, + "learning_rate": 0.00013883937532618734, + "loss": 0.7698, + "mean_token_accuracy": 0.7674217760562897, + "num_tokens": 103681743.0, + "step": 30470 + }, + { + "epoch": 0.3059135252318439, + "learning_rate": 0.00013881930226022722, + "loss": 0.7816, + "mean_token_accuracy": 0.7681707978248596, + "num_tokens": 103715424.0, + "step": 30480 + }, + { + "epoch": 0.3060138905616444, + "learning_rate": 0.00013879922919426713, + "loss": 0.7705, + "mean_token_accuracy": 0.7729944229125977, + "num_tokens": 103749449.0, + "step": 30490 + }, + { + "epoch": 0.30611425589144486, + "learning_rate": 0.00013877915612830704, + "loss": 0.7347, + "mean_token_accuracy": 0.7809194803237915, + "num_tokens": 103784175.0, + "step": 30500 + }, + { + "epoch": 0.3062146212212453, + "learning_rate": 0.00013875908306234695, + "loss": 0.7738, + "mean_token_accuracy": 0.7669017791748047, + "num_tokens": 103818085.0, + "step": 30510 + }, + { + "epoch": 0.30631498655104583, + "learning_rate": 0.00013873900999638686, + "loss": 0.7881, + "mean_token_accuracy": 0.7695654451847076, + "num_tokens": 103851803.0, + "step": 30520 + }, + { + "epoch": 0.3064153518808463, + "learning_rate": 0.00013871893693042677, + "loss": 0.7747, + "mean_token_accuracy": 0.7680711686611176, + "num_tokens": 103886459.0, + "step": 30530 + }, + { + "epoch": 0.30651571721064674, + "learning_rate": 0.00013869886386446667, + "loss": 0.7481, + "mean_token_accuracy": 0.7746942222118378, + "num_tokens": 103920953.0, + "step": 30540 + }, + { + "epoch": 0.30661608254044725, + "learning_rate": 0.00013867879079850656, + "loss": 0.793, + "mean_token_accuracy": 0.763790887594223, + "num_tokens": 103954390.0, + "step": 30550 + }, + { + "epoch": 0.3067164478702477, + "learning_rate": 0.0001386587177325465, + "loss": 0.7995, + "mean_token_accuracy": 0.7638724386692047, + "num_tokens": 103988371.0, + "step": 30560 + }, + { + "epoch": 0.30681681320004817, + "learning_rate": 0.00013863864466658637, + "loss": 0.7561, + "mean_token_accuracy": 0.774150276184082, + "num_tokens": 104021981.0, + "step": 30570 + }, + { + "epoch": 0.3069171785298486, + "learning_rate": 0.00013861857160062628, + "loss": 0.7588, + "mean_token_accuracy": 0.7727494657039642, + "num_tokens": 104055285.0, + "step": 30580 + }, + { + "epoch": 0.30701754385964913, + "learning_rate": 0.0001385984985346662, + "loss": 0.7524, + "mean_token_accuracy": 0.7772042453289032, + "num_tokens": 104089263.0, + "step": 30590 + }, + { + "epoch": 0.3071179091894496, + "learning_rate": 0.0001385784254687061, + "loss": 0.765, + "mean_token_accuracy": 0.7683424353599548, + "num_tokens": 104123211.0, + "step": 30600 + }, + { + "epoch": 0.30721827451925005, + "learning_rate": 0.000138558352402746, + "loss": 0.7288, + "mean_token_accuracy": 0.7830067038536072, + "num_tokens": 104157222.0, + "step": 30610 + }, + { + "epoch": 0.30731863984905056, + "learning_rate": 0.00013853827933678591, + "loss": 0.7709, + "mean_token_accuracy": 0.7685743570327759, + "num_tokens": 104190522.0, + "step": 30620 + }, + { + "epoch": 0.307419005178851, + "learning_rate": 0.00013851820627082582, + "loss": 0.7614, + "mean_token_accuracy": 0.7725608289241791, + "num_tokens": 104224983.0, + "step": 30630 + }, + { + "epoch": 0.30751937050865147, + "learning_rate": 0.0001384981332048657, + "loss": 0.7824, + "mean_token_accuracy": 0.7672821164131165, + "num_tokens": 104259059.0, + "step": 30640 + }, + { + "epoch": 0.307619735838452, + "learning_rate": 0.00013847806013890564, + "loss": 0.7438, + "mean_token_accuracy": 0.7788600921630859, + "num_tokens": 104292259.0, + "step": 30650 + }, + { + "epoch": 0.30772010116825244, + "learning_rate": 0.00013845798707294552, + "loss": 0.8073, + "mean_token_accuracy": 0.76075199842453, + "num_tokens": 104326183.0, + "step": 30660 + }, + { + "epoch": 0.3078204664980529, + "learning_rate": 0.00013843791400698543, + "loss": 0.8143, + "mean_token_accuracy": 0.7618832290172577, + "num_tokens": 104360667.0, + "step": 30670 + }, + { + "epoch": 0.3079208318278534, + "learning_rate": 0.00013841784094102534, + "loss": 0.7751, + "mean_token_accuracy": 0.7713720083236695, + "num_tokens": 104395892.0, + "step": 30680 + }, + { + "epoch": 0.30802119715765386, + "learning_rate": 0.00013839776787506525, + "loss": 0.747, + "mean_token_accuracy": 0.7763884246349335, + "num_tokens": 104429388.0, + "step": 30690 + }, + { + "epoch": 0.3081215624874543, + "learning_rate": 0.00013837769480910513, + "loss": 0.7482, + "mean_token_accuracy": 0.7765169620513916, + "num_tokens": 104463555.0, + "step": 30700 + }, + { + "epoch": 0.3082219278172548, + "learning_rate": 0.00013835762174314506, + "loss": 0.7702, + "mean_token_accuracy": 0.7701191127300262, + "num_tokens": 104497207.0, + "step": 30710 + }, + { + "epoch": 0.3083222931470553, + "learning_rate": 0.00013833754867718497, + "loss": 0.7945, + "mean_token_accuracy": 0.7636801123619079, + "num_tokens": 104531413.0, + "step": 30720 + }, + { + "epoch": 0.30842265847685574, + "learning_rate": 0.00013831747561122485, + "loss": 0.7868, + "mean_token_accuracy": 0.7641001880168915, + "num_tokens": 104565304.0, + "step": 30730 + }, + { + "epoch": 0.30852302380665625, + "learning_rate": 0.0001382974025452648, + "loss": 0.7358, + "mean_token_accuracy": 0.7806992888450622, + "num_tokens": 104599197.0, + "step": 30740 + }, + { + "epoch": 0.3086233891364567, + "learning_rate": 0.00013827732947930467, + "loss": 0.7734, + "mean_token_accuracy": 0.767440915107727, + "num_tokens": 104633950.0, + "step": 30750 + }, + { + "epoch": 0.30872375446625716, + "learning_rate": 0.00013825725641334458, + "loss": 0.7815, + "mean_token_accuracy": 0.7703138053417206, + "num_tokens": 104667636.0, + "step": 30760 + }, + { + "epoch": 0.3088241197960577, + "learning_rate": 0.0001382371833473845, + "loss": 0.7899, + "mean_token_accuracy": 0.7707507610321045, + "num_tokens": 104701907.0, + "step": 30770 + }, + { + "epoch": 0.30892448512585813, + "learning_rate": 0.0001382171102814244, + "loss": 0.7455, + "mean_token_accuracy": 0.7727533578872681, + "num_tokens": 104735953.0, + "step": 30780 + }, + { + "epoch": 0.3090248504556586, + "learning_rate": 0.00013819703721546428, + "loss": 0.7535, + "mean_token_accuracy": 0.7779163002967835, + "num_tokens": 104770245.0, + "step": 30790 + }, + { + "epoch": 0.3091252157854591, + "learning_rate": 0.0001381769641495042, + "loss": 0.7664, + "mean_token_accuracy": 0.7698115825653076, + "num_tokens": 104804162.0, + "step": 30800 + }, + { + "epoch": 0.30922558111525955, + "learning_rate": 0.0001381568910835441, + "loss": 0.7567, + "mean_token_accuracy": 0.7743724882602692, + "num_tokens": 104838125.0, + "step": 30810 + }, + { + "epoch": 0.30932594644506, + "learning_rate": 0.000138136818017584, + "loss": 0.7572, + "mean_token_accuracy": 0.7760859906673432, + "num_tokens": 104871914.0, + "step": 30820 + }, + { + "epoch": 0.3094263117748605, + "learning_rate": 0.0001381167449516239, + "loss": 0.7655, + "mean_token_accuracy": 0.7666561007499695, + "num_tokens": 104905686.0, + "step": 30830 + }, + { + "epoch": 0.309526677104661, + "learning_rate": 0.00013809667188566382, + "loss": 0.7541, + "mean_token_accuracy": 0.7743497550487518, + "num_tokens": 104939031.0, + "step": 30840 + }, + { + "epoch": 0.30962704243446143, + "learning_rate": 0.00013807659881970373, + "loss": 0.754, + "mean_token_accuracy": 0.7771598994731903, + "num_tokens": 104972478.0, + "step": 30850 + }, + { + "epoch": 0.3097274077642619, + "learning_rate": 0.00013805652575374364, + "loss": 0.7577, + "mean_token_accuracy": 0.7708552062511445, + "num_tokens": 105006288.0, + "step": 30860 + }, + { + "epoch": 0.3098277730940624, + "learning_rate": 0.00013803645268778354, + "loss": 0.7704, + "mean_token_accuracy": 0.7731885015964508, + "num_tokens": 105040326.0, + "step": 30870 + }, + { + "epoch": 0.30992813842386285, + "learning_rate": 0.00013801637962182343, + "loss": 0.7555, + "mean_token_accuracy": 0.7685849487781524, + "num_tokens": 105074608.0, + "step": 30880 + }, + { + "epoch": 0.3100285037536633, + "learning_rate": 0.00013799630655586336, + "loss": 0.7669, + "mean_token_accuracy": 0.768442940711975, + "num_tokens": 105108269.0, + "step": 30890 + }, + { + "epoch": 0.3101288690834638, + "learning_rate": 0.00013797623348990324, + "loss": 0.7628, + "mean_token_accuracy": 0.7735085904598236, + "num_tokens": 105142180.0, + "step": 30900 + }, + { + "epoch": 0.3102292344132643, + "learning_rate": 0.00013795616042394318, + "loss": 0.7409, + "mean_token_accuracy": 0.7764650583267212, + "num_tokens": 105177116.0, + "step": 30910 + }, + { + "epoch": 0.31032959974306473, + "learning_rate": 0.00013793608735798306, + "loss": 0.7345, + "mean_token_accuracy": 0.777233612537384, + "num_tokens": 105211607.0, + "step": 30920 + }, + { + "epoch": 0.31042996507286524, + "learning_rate": 0.00013791601429202297, + "loss": 0.7477, + "mean_token_accuracy": 0.7734798491001129, + "num_tokens": 105245472.0, + "step": 30930 + }, + { + "epoch": 0.3105303304026657, + "learning_rate": 0.00013789594122606288, + "loss": 0.7583, + "mean_token_accuracy": 0.7751196205615998, + "num_tokens": 105280064.0, + "step": 30940 + }, + { + "epoch": 0.31063069573246616, + "learning_rate": 0.00013787586816010278, + "loss": 0.7634, + "mean_token_accuracy": 0.7729607403278351, + "num_tokens": 105313611.0, + "step": 30950 + }, + { + "epoch": 0.31073106106226667, + "learning_rate": 0.0001378557950941427, + "loss": 0.7604, + "mean_token_accuracy": 0.7732480943202973, + "num_tokens": 105347185.0, + "step": 30960 + }, + { + "epoch": 0.3108314263920671, + "learning_rate": 0.0001378357220281826, + "loss": 0.7643, + "mean_token_accuracy": 0.7731426000595093, + "num_tokens": 105381308.0, + "step": 30970 + }, + { + "epoch": 0.3109317917218676, + "learning_rate": 0.0001378156489622225, + "loss": 0.7839, + "mean_token_accuracy": 0.7677311778068543, + "num_tokens": 105415510.0, + "step": 30980 + }, + { + "epoch": 0.3110321570516681, + "learning_rate": 0.0001377955758962624, + "loss": 0.7344, + "mean_token_accuracy": 0.7777604460716248, + "num_tokens": 105448862.0, + "step": 30990 + }, + { + "epoch": 0.31113252238146855, + "learning_rate": 0.00013777550283030233, + "loss": 0.7904, + "mean_token_accuracy": 0.7629985630512237, + "num_tokens": 105483254.0, + "step": 31000 + }, + { + "epoch": 0.311232887711269, + "learning_rate": 0.0001377554297643422, + "loss": 0.7454, + "mean_token_accuracy": 0.7740285396575928, + "num_tokens": 105516709.0, + "step": 31010 + }, + { + "epoch": 0.3113332530410695, + "learning_rate": 0.00013773535669838212, + "loss": 0.7731, + "mean_token_accuracy": 0.7723234176635743, + "num_tokens": 105551036.0, + "step": 31020 + }, + { + "epoch": 0.31143361837086997, + "learning_rate": 0.00013771528363242202, + "loss": 0.7744, + "mean_token_accuracy": 0.7675805270671845, + "num_tokens": 105585587.0, + "step": 31030 + }, + { + "epoch": 0.3115339837006704, + "learning_rate": 0.00013769521056646193, + "loss": 0.7659, + "mean_token_accuracy": 0.7708247542381287, + "num_tokens": 105619742.0, + "step": 31040 + }, + { + "epoch": 0.31163434903047094, + "learning_rate": 0.00013767513750050181, + "loss": 0.7634, + "mean_token_accuracy": 0.7713421285152435, + "num_tokens": 105653638.0, + "step": 31050 + }, + { + "epoch": 0.3117347143602714, + "learning_rate": 0.00013765506443454175, + "loss": 0.7852, + "mean_token_accuracy": 0.7653680384159088, + "num_tokens": 105687649.0, + "step": 31060 + }, + { + "epoch": 0.31183507969007185, + "learning_rate": 0.00013763499136858163, + "loss": 0.7616, + "mean_token_accuracy": 0.7732458889484406, + "num_tokens": 105721675.0, + "step": 31070 + }, + { + "epoch": 0.31193544501987236, + "learning_rate": 0.00013761491830262154, + "loss": 0.7867, + "mean_token_accuracy": 0.7689832389354706, + "num_tokens": 105755249.0, + "step": 31080 + }, + { + "epoch": 0.3120358103496728, + "learning_rate": 0.00013759484523666148, + "loss": 0.7403, + "mean_token_accuracy": 0.7799917042255402, + "num_tokens": 105788421.0, + "step": 31090 + }, + { + "epoch": 0.31213617567947327, + "learning_rate": 0.00013757477217070136, + "loss": 0.7231, + "mean_token_accuracy": 0.7802851498126984, + "num_tokens": 105822170.0, + "step": 31100 + }, + { + "epoch": 0.3122365410092738, + "learning_rate": 0.00013755469910474127, + "loss": 0.7707, + "mean_token_accuracy": 0.7696276247501374, + "num_tokens": 105856158.0, + "step": 31110 + }, + { + "epoch": 0.31233690633907424, + "learning_rate": 0.00013753462603878117, + "loss": 0.7574, + "mean_token_accuracy": 0.773821359872818, + "num_tokens": 105890198.0, + "step": 31120 + }, + { + "epoch": 0.3124372716688747, + "learning_rate": 0.00013751455297282108, + "loss": 0.7371, + "mean_token_accuracy": 0.7768973231315612, + "num_tokens": 105923800.0, + "step": 31130 + }, + { + "epoch": 0.31253763699867515, + "learning_rate": 0.00013749447990686096, + "loss": 0.7404, + "mean_token_accuracy": 0.7785003006458282, + "num_tokens": 105957717.0, + "step": 31140 + }, + { + "epoch": 0.31263800232847566, + "learning_rate": 0.0001374744068409009, + "loss": 0.7529, + "mean_token_accuracy": 0.7759685933589935, + "num_tokens": 105992243.0, + "step": 31150 + }, + { + "epoch": 0.3127383676582761, + "learning_rate": 0.00013745433377494078, + "loss": 0.7903, + "mean_token_accuracy": 0.7654335021972656, + "num_tokens": 106026004.0, + "step": 31160 + }, + { + "epoch": 0.3128387329880766, + "learning_rate": 0.0001374342607089807, + "loss": 0.8104, + "mean_token_accuracy": 0.7664890110492706, + "num_tokens": 106059229.0, + "step": 31170 + }, + { + "epoch": 0.3129390983178771, + "learning_rate": 0.0001374141876430206, + "loss": 0.7665, + "mean_token_accuracy": 0.7725627541542053, + "num_tokens": 106093422.0, + "step": 31180 + }, + { + "epoch": 0.31303946364767754, + "learning_rate": 0.0001373941145770605, + "loss": 0.7356, + "mean_token_accuracy": 0.7773735344409942, + "num_tokens": 106127644.0, + "step": 31190 + }, + { + "epoch": 0.313139828977478, + "learning_rate": 0.00013737404151110041, + "loss": 0.7087, + "mean_token_accuracy": 0.7839349806308746, + "num_tokens": 106161610.0, + "step": 31200 + }, + { + "epoch": 0.3132401943072785, + "learning_rate": 0.00013735396844514032, + "loss": 0.7562, + "mean_token_accuracy": 0.7767717659473419, + "num_tokens": 106194593.0, + "step": 31210 + }, + { + "epoch": 0.31334055963707896, + "learning_rate": 0.00013733389537918023, + "loss": 0.731, + "mean_token_accuracy": 0.7789615154266357, + "num_tokens": 106228903.0, + "step": 31220 + }, + { + "epoch": 0.3134409249668794, + "learning_rate": 0.0001373138223132201, + "loss": 0.6995, + "mean_token_accuracy": 0.7882622420787812, + "num_tokens": 106262657.0, + "step": 31230 + }, + { + "epoch": 0.31354129029667993, + "learning_rate": 0.00013729374924726005, + "loss": 0.7779, + "mean_token_accuracy": 0.7682585716247559, + "num_tokens": 106296495.0, + "step": 31240 + }, + { + "epoch": 0.3136416556264804, + "learning_rate": 0.00013727367618129993, + "loss": 0.796, + "mean_token_accuracy": 0.7617917835712433, + "num_tokens": 106330196.0, + "step": 31250 + }, + { + "epoch": 0.31374202095628084, + "learning_rate": 0.00013725360311533984, + "loss": 0.7565, + "mean_token_accuracy": 0.7745411932468415, + "num_tokens": 106363984.0, + "step": 31260 + }, + { + "epoch": 0.31384238628608135, + "learning_rate": 0.00013723353004937975, + "loss": 0.754, + "mean_token_accuracy": 0.7728968620300293, + "num_tokens": 106398353.0, + "step": 31270 + }, + { + "epoch": 0.3139427516158818, + "learning_rate": 0.00013721345698341965, + "loss": 0.7627, + "mean_token_accuracy": 0.7766358733177186, + "num_tokens": 106432556.0, + "step": 31280 + }, + { + "epoch": 0.31404311694568227, + "learning_rate": 0.00013719338391745956, + "loss": 0.7577, + "mean_token_accuracy": 0.7688096821308136, + "num_tokens": 106466061.0, + "step": 31290 + }, + { + "epoch": 0.3141434822754828, + "learning_rate": 0.00013717331085149947, + "loss": 0.7628, + "mean_token_accuracy": 0.7754148781299591, + "num_tokens": 106500236.0, + "step": 31300 + }, + { + "epoch": 0.31424384760528323, + "learning_rate": 0.00013715323778553938, + "loss": 0.7528, + "mean_token_accuracy": 0.7724867820739746, + "num_tokens": 106533982.0, + "step": 31310 + }, + { + "epoch": 0.3143442129350837, + "learning_rate": 0.00013713316471957926, + "loss": 0.7772, + "mean_token_accuracy": 0.7755430579185486, + "num_tokens": 106567998.0, + "step": 31320 + }, + { + "epoch": 0.3144445782648842, + "learning_rate": 0.0001371130916536192, + "loss": 0.7558, + "mean_token_accuracy": 0.7747138500213623, + "num_tokens": 106602651.0, + "step": 31330 + }, + { + "epoch": 0.31454494359468466, + "learning_rate": 0.00013709301858765908, + "loss": 0.71, + "mean_token_accuracy": 0.7766462087631225, + "num_tokens": 106635982.0, + "step": 31340 + }, + { + "epoch": 0.3146453089244851, + "learning_rate": 0.00013707294552169899, + "loss": 0.7399, + "mean_token_accuracy": 0.7780038237571716, + "num_tokens": 106670128.0, + "step": 31350 + }, + { + "epoch": 0.3147456742542856, + "learning_rate": 0.0001370528724557389, + "loss": 0.7622, + "mean_token_accuracy": 0.7697994351387024, + "num_tokens": 106704363.0, + "step": 31360 + }, + { + "epoch": 0.3148460395840861, + "learning_rate": 0.0001370327993897788, + "loss": 0.7759, + "mean_token_accuracy": 0.7660178899765014, + "num_tokens": 106738907.0, + "step": 31370 + }, + { + "epoch": 0.31494640491388654, + "learning_rate": 0.00013701272632381868, + "loss": 0.7937, + "mean_token_accuracy": 0.763887357711792, + "num_tokens": 106773262.0, + "step": 31380 + }, + { + "epoch": 0.31504677024368705, + "learning_rate": 0.00013699265325785862, + "loss": 0.7767, + "mean_token_accuracy": 0.7671867370605469, + "num_tokens": 106807856.0, + "step": 31390 + }, + { + "epoch": 0.3151471355734875, + "learning_rate": 0.0001369725801918985, + "loss": 0.7399, + "mean_token_accuracy": 0.7766685962677002, + "num_tokens": 106842772.0, + "step": 31400 + }, + { + "epoch": 0.31524750090328796, + "learning_rate": 0.0001369525071259384, + "loss": 0.735, + "mean_token_accuracy": 0.7800912439823151, + "num_tokens": 106876777.0, + "step": 31410 + }, + { + "epoch": 0.31534786623308847, + "learning_rate": 0.00013693243405997832, + "loss": 0.7646, + "mean_token_accuracy": 0.7699158966541291, + "num_tokens": 106909812.0, + "step": 31420 + }, + { + "epoch": 0.3154482315628889, + "learning_rate": 0.00013691236099401823, + "loss": 0.7232, + "mean_token_accuracy": 0.7792066931724548, + "num_tokens": 106944204.0, + "step": 31430 + }, + { + "epoch": 0.3155485968926894, + "learning_rate": 0.00013689228792805814, + "loss": 0.7657, + "mean_token_accuracy": 0.7711667120456696, + "num_tokens": 106978215.0, + "step": 31440 + }, + { + "epoch": 0.31564896222248984, + "learning_rate": 0.00013687221486209804, + "loss": 0.7525, + "mean_token_accuracy": 0.7722912907600403, + "num_tokens": 107012101.0, + "step": 31450 + }, + { + "epoch": 0.31574932755229035, + "learning_rate": 0.00013685214179613795, + "loss": 0.7845, + "mean_token_accuracy": 0.7634316205978393, + "num_tokens": 107045614.0, + "step": 31460 + }, + { + "epoch": 0.3158496928820908, + "learning_rate": 0.00013683206873017786, + "loss": 0.7509, + "mean_token_accuracy": 0.7773948848247528, + "num_tokens": 107079266.0, + "step": 31470 + }, + { + "epoch": 0.31595005821189126, + "learning_rate": 0.00013681199566421777, + "loss": 0.7643, + "mean_token_accuracy": 0.7704627335071563, + "num_tokens": 107113132.0, + "step": 31480 + }, + { + "epoch": 0.31605042354169177, + "learning_rate": 0.00013679192259825765, + "loss": 0.7554, + "mean_token_accuracy": 0.7745836615562439, + "num_tokens": 107147541.0, + "step": 31490 + }, + { + "epoch": 0.3161507888714922, + "learning_rate": 0.00013677184953229759, + "loss": 0.7501, + "mean_token_accuracy": 0.7730957865715027, + "num_tokens": 107180909.0, + "step": 31500 + }, + { + "epoch": 0.3162511542012927, + "learning_rate": 0.00013675177646633747, + "loss": 0.7467, + "mean_token_accuracy": 0.7751357734203339, + "num_tokens": 107214309.0, + "step": 31510 + }, + { + "epoch": 0.3163515195310932, + "learning_rate": 0.00013673170340037738, + "loss": 0.7334, + "mean_token_accuracy": 0.7759930789470673, + "num_tokens": 107247628.0, + "step": 31520 + }, + { + "epoch": 0.31645188486089365, + "learning_rate": 0.00013671163033441728, + "loss": 0.7486, + "mean_token_accuracy": 0.7736383378505707, + "num_tokens": 107280991.0, + "step": 31530 + }, + { + "epoch": 0.3165522501906941, + "learning_rate": 0.0001366915572684572, + "loss": 0.76, + "mean_token_accuracy": 0.7731526851654053, + "num_tokens": 107314784.0, + "step": 31540 + }, + { + "epoch": 0.3166526155204946, + "learning_rate": 0.0001366714842024971, + "loss": 0.7684, + "mean_token_accuracy": 0.7669507205486298, + "num_tokens": 107348737.0, + "step": 31550 + }, + { + "epoch": 0.3167529808502951, + "learning_rate": 0.000136651411136537, + "loss": 0.7573, + "mean_token_accuracy": 0.7724651575088501, + "num_tokens": 107382728.0, + "step": 31560 + }, + { + "epoch": 0.31685334618009553, + "learning_rate": 0.00013663133807057692, + "loss": 0.7223, + "mean_token_accuracy": 0.7813074648380279, + "num_tokens": 107416169.0, + "step": 31570 + }, + { + "epoch": 0.31695371150989604, + "learning_rate": 0.0001366112650046168, + "loss": 0.7422, + "mean_token_accuracy": 0.7836302399635315, + "num_tokens": 107449718.0, + "step": 31580 + }, + { + "epoch": 0.3170540768396965, + "learning_rate": 0.00013659119193865673, + "loss": 0.7257, + "mean_token_accuracy": 0.7790060758590698, + "num_tokens": 107484770.0, + "step": 31590 + }, + { + "epoch": 0.31715444216949695, + "learning_rate": 0.00013657111887269662, + "loss": 0.8104, + "mean_token_accuracy": 0.7588859498500824, + "num_tokens": 107519390.0, + "step": 31600 + }, + { + "epoch": 0.31725480749929746, + "learning_rate": 0.00013655104580673652, + "loss": 0.7816, + "mean_token_accuracy": 0.7687376499176025, + "num_tokens": 107553086.0, + "step": 31610 + }, + { + "epoch": 0.3173551728290979, + "learning_rate": 0.00013653097274077643, + "loss": 0.7693, + "mean_token_accuracy": 0.77187077999115, + "num_tokens": 107587578.0, + "step": 31620 + }, + { + "epoch": 0.3174555381588984, + "learning_rate": 0.00013651089967481634, + "loss": 0.7184, + "mean_token_accuracy": 0.7835727810859681, + "num_tokens": 107620742.0, + "step": 31630 + }, + { + "epoch": 0.3175559034886989, + "learning_rate": 0.00013649082660885625, + "loss": 0.7569, + "mean_token_accuracy": 0.7751154661178589, + "num_tokens": 107655422.0, + "step": 31640 + }, + { + "epoch": 0.31765626881849934, + "learning_rate": 0.00013647075354289616, + "loss": 0.7476, + "mean_token_accuracy": 0.7770822584629059, + "num_tokens": 107689751.0, + "step": 31650 + }, + { + "epoch": 0.3177566341482998, + "learning_rate": 0.00013645068047693607, + "loss": 0.7391, + "mean_token_accuracy": 0.7775422394275665, + "num_tokens": 107723417.0, + "step": 31660 + }, + { + "epoch": 0.3178569994781003, + "learning_rate": 0.00013643060741097595, + "loss": 0.7269, + "mean_token_accuracy": 0.7786263823509216, + "num_tokens": 107757114.0, + "step": 31670 + }, + { + "epoch": 0.31795736480790077, + "learning_rate": 0.00013641053434501588, + "loss": 0.7582, + "mean_token_accuracy": 0.773527330160141, + "num_tokens": 107791142.0, + "step": 31680 + }, + { + "epoch": 0.3180577301377012, + "learning_rate": 0.00013639046127905576, + "loss": 0.8128, + "mean_token_accuracy": 0.7656544923782349, + "num_tokens": 107825259.0, + "step": 31690 + }, + { + "epoch": 0.31815809546750173, + "learning_rate": 0.00013637038821309567, + "loss": 0.7108, + "mean_token_accuracy": 0.7856820106506348, + "num_tokens": 107859872.0, + "step": 31700 + }, + { + "epoch": 0.3182584607973022, + "learning_rate": 0.00013635031514713558, + "loss": 0.7415, + "mean_token_accuracy": 0.7775092601776123, + "num_tokens": 107894388.0, + "step": 31710 + }, + { + "epoch": 0.31835882612710265, + "learning_rate": 0.0001363302420811755, + "loss": 0.7414, + "mean_token_accuracy": 0.7725362718105316, + "num_tokens": 107928361.0, + "step": 31720 + }, + { + "epoch": 0.3184591914569031, + "learning_rate": 0.00013631016901521537, + "loss": 0.7419, + "mean_token_accuracy": 0.7755842924118042, + "num_tokens": 107961945.0, + "step": 31730 + }, + { + "epoch": 0.3185595567867036, + "learning_rate": 0.0001362900959492553, + "loss": 0.764, + "mean_token_accuracy": 0.7704953134059906, + "num_tokens": 107995563.0, + "step": 31740 + }, + { + "epoch": 0.31865992211650407, + "learning_rate": 0.0001362700228832952, + "loss": 0.7374, + "mean_token_accuracy": 0.7792326033115387, + "num_tokens": 108030023.0, + "step": 31750 + }, + { + "epoch": 0.3187602874463045, + "learning_rate": 0.0001362499498173351, + "loss": 0.7667, + "mean_token_accuracy": 0.7738947212696076, + "num_tokens": 108064184.0, + "step": 31760 + }, + { + "epoch": 0.31886065277610504, + "learning_rate": 0.000136229876751375, + "loss": 0.7567, + "mean_token_accuracy": 0.7785474181175231, + "num_tokens": 108098008.0, + "step": 31770 + }, + { + "epoch": 0.3189610181059055, + "learning_rate": 0.00013620980368541491, + "loss": 0.7346, + "mean_token_accuracy": 0.7725403249263764, + "num_tokens": 108131284.0, + "step": 31780 + }, + { + "epoch": 0.31906138343570595, + "learning_rate": 0.00013618973061945482, + "loss": 0.7419, + "mean_token_accuracy": 0.777106761932373, + "num_tokens": 108165107.0, + "step": 31790 + }, + { + "epoch": 0.31916174876550646, + "learning_rate": 0.00013616965755349473, + "loss": 0.7396, + "mean_token_accuracy": 0.7769767999649048, + "num_tokens": 108199352.0, + "step": 31800 + }, + { + "epoch": 0.3192621140953069, + "learning_rate": 0.00013614958448753464, + "loss": 0.7566, + "mean_token_accuracy": 0.7712903320789337, + "num_tokens": 108234070.0, + "step": 31810 + }, + { + "epoch": 0.31936247942510737, + "learning_rate": 0.00013612951142157452, + "loss": 0.7499, + "mean_token_accuracy": 0.7742361009120942, + "num_tokens": 108267886.0, + "step": 31820 + }, + { + "epoch": 0.3194628447549079, + "learning_rate": 0.00013610943835561446, + "loss": 0.7438, + "mean_token_accuracy": 0.775706660747528, + "num_tokens": 108301250.0, + "step": 31830 + }, + { + "epoch": 0.31956321008470834, + "learning_rate": 0.00013608936528965434, + "loss": 0.7878, + "mean_token_accuracy": 0.7631179451942444, + "num_tokens": 108335568.0, + "step": 31840 + }, + { + "epoch": 0.3196635754145088, + "learning_rate": 0.00013606929222369425, + "loss": 0.741, + "mean_token_accuracy": 0.7747395813465119, + "num_tokens": 108369565.0, + "step": 31850 + }, + { + "epoch": 0.3197639407443093, + "learning_rate": 0.00013604921915773415, + "loss": 0.7515, + "mean_token_accuracy": 0.7772541761398315, + "num_tokens": 108403911.0, + "step": 31860 + }, + { + "epoch": 0.31986430607410976, + "learning_rate": 0.00013602914609177406, + "loss": 0.7281, + "mean_token_accuracy": 0.7788921952247619, + "num_tokens": 108438749.0, + "step": 31870 + }, + { + "epoch": 0.3199646714039102, + "learning_rate": 0.00013600907302581397, + "loss": 0.7665, + "mean_token_accuracy": 0.7673018515110016, + "num_tokens": 108472615.0, + "step": 31880 + }, + { + "epoch": 0.32006503673371073, + "learning_rate": 0.00013598899995985388, + "loss": 0.7649, + "mean_token_accuracy": 0.7717642366886139, + "num_tokens": 108506568.0, + "step": 31890 + }, + { + "epoch": 0.3201654020635112, + "learning_rate": 0.0001359689268938938, + "loss": 0.7806, + "mean_token_accuracy": 0.766598004102707, + "num_tokens": 108540136.0, + "step": 31900 + }, + { + "epoch": 0.32026576739331164, + "learning_rate": 0.00013594885382793367, + "loss": 0.8041, + "mean_token_accuracy": 0.7628247916698456, + "num_tokens": 108574895.0, + "step": 31910 + }, + { + "epoch": 0.32036613272311215, + "learning_rate": 0.0001359287807619736, + "loss": 0.7557, + "mean_token_accuracy": 0.770247095823288, + "num_tokens": 108608655.0, + "step": 31920 + }, + { + "epoch": 0.3204664980529126, + "learning_rate": 0.00013590870769601349, + "loss": 0.7336, + "mean_token_accuracy": 0.7751041054725647, + "num_tokens": 108643349.0, + "step": 31930 + }, + { + "epoch": 0.32056686338271306, + "learning_rate": 0.0001358886346300534, + "loss": 0.7708, + "mean_token_accuracy": 0.7705505788326263, + "num_tokens": 108677426.0, + "step": 31940 + }, + { + "epoch": 0.3206672287125136, + "learning_rate": 0.0001358685615640933, + "loss": 0.7629, + "mean_token_accuracy": 0.7727705180644989, + "num_tokens": 108712090.0, + "step": 31950 + }, + { + "epoch": 0.32076759404231403, + "learning_rate": 0.0001358484884981332, + "loss": 0.7613, + "mean_token_accuracy": 0.7704655826091766, + "num_tokens": 108746220.0, + "step": 31960 + }, + { + "epoch": 0.3208679593721145, + "learning_rate": 0.00013582841543217312, + "loss": 0.7518, + "mean_token_accuracy": 0.7753160715103149, + "num_tokens": 108780439.0, + "step": 31970 + }, + { + "epoch": 0.320968324701915, + "learning_rate": 0.00013580834236621303, + "loss": 0.7472, + "mean_token_accuracy": 0.7801798641681671, + "num_tokens": 108814220.0, + "step": 31980 + }, + { + "epoch": 0.32106869003171545, + "learning_rate": 0.00013578826930025294, + "loss": 0.7658, + "mean_token_accuracy": 0.7712485730648041, + "num_tokens": 108848599.0, + "step": 31990 + }, + { + "epoch": 0.3211690553615159, + "learning_rate": 0.00013576819623429282, + "loss": 0.7603, + "mean_token_accuracy": 0.7678033530712127, + "num_tokens": 108881767.0, + "step": 32000 + }, + { + "epoch": 0.32126942069131637, + "learning_rate": 0.00013574812316833275, + "loss": 0.7152, + "mean_token_accuracy": 0.78734210729599, + "num_tokens": 108916916.0, + "step": 32010 + }, + { + "epoch": 0.3213697860211169, + "learning_rate": 0.00013572805010237263, + "loss": 0.7649, + "mean_token_accuracy": 0.7759453594684601, + "num_tokens": 108950128.0, + "step": 32020 + }, + { + "epoch": 0.32147015135091733, + "learning_rate": 0.00013570797703641257, + "loss": 0.7364, + "mean_token_accuracy": 0.7787595689296722, + "num_tokens": 108984782.0, + "step": 32030 + }, + { + "epoch": 0.3215705166807178, + "learning_rate": 0.00013568790397045245, + "loss": 0.7478, + "mean_token_accuracy": 0.774041885137558, + "num_tokens": 109018053.0, + "step": 32040 + }, + { + "epoch": 0.3216708820105183, + "learning_rate": 0.00013566783090449236, + "loss": 0.8212, + "mean_token_accuracy": 0.7619028091430664, + "num_tokens": 109051791.0, + "step": 32050 + }, + { + "epoch": 0.32177124734031876, + "learning_rate": 0.00013564775783853227, + "loss": 0.7473, + "mean_token_accuracy": 0.7691491365432739, + "num_tokens": 109085863.0, + "step": 32060 + }, + { + "epoch": 0.3218716126701192, + "learning_rate": 0.00013562768477257218, + "loss": 0.788, + "mean_token_accuracy": 0.7673633575439454, + "num_tokens": 109119871.0, + "step": 32070 + }, + { + "epoch": 0.3219719779999197, + "learning_rate": 0.00013560761170661206, + "loss": 0.7477, + "mean_token_accuracy": 0.7754402875900268, + "num_tokens": 109152691.0, + "step": 32080 + }, + { + "epoch": 0.3220723433297202, + "learning_rate": 0.000135587538640652, + "loss": 0.76, + "mean_token_accuracy": 0.7736308097839355, + "num_tokens": 109186279.0, + "step": 32090 + }, + { + "epoch": 0.32217270865952063, + "learning_rate": 0.00013556746557469188, + "loss": 0.7702, + "mean_token_accuracy": 0.7687101304531098, + "num_tokens": 109221336.0, + "step": 32100 + }, + { + "epoch": 0.32227307398932115, + "learning_rate": 0.00013554739250873178, + "loss": 0.7682, + "mean_token_accuracy": 0.7724032521247863, + "num_tokens": 109256245.0, + "step": 32110 + }, + { + "epoch": 0.3223734393191216, + "learning_rate": 0.0001355273194427717, + "loss": 0.737, + "mean_token_accuracy": 0.7786790549755096, + "num_tokens": 109290679.0, + "step": 32120 + }, + { + "epoch": 0.32247380464892206, + "learning_rate": 0.0001355072463768116, + "loss": 0.7931, + "mean_token_accuracy": 0.7702713489532471, + "num_tokens": 109324445.0, + "step": 32130 + }, + { + "epoch": 0.32257416997872257, + "learning_rate": 0.0001354871733108515, + "loss": 0.7615, + "mean_token_accuracy": 0.773723566532135, + "num_tokens": 109358539.0, + "step": 32140 + }, + { + "epoch": 0.322674535308523, + "learning_rate": 0.00013546710024489142, + "loss": 0.7328, + "mean_token_accuracy": 0.7815119981765747, + "num_tokens": 109393450.0, + "step": 32150 + }, + { + "epoch": 0.3227749006383235, + "learning_rate": 0.00013544702717893133, + "loss": 0.7804, + "mean_token_accuracy": 0.7684081137180329, + "num_tokens": 109427666.0, + "step": 32160 + }, + { + "epoch": 0.322875265968124, + "learning_rate": 0.0001354269541129712, + "loss": 0.7633, + "mean_token_accuracy": 0.7712672531604767, + "num_tokens": 109461562.0, + "step": 32170 + }, + { + "epoch": 0.32297563129792445, + "learning_rate": 0.00013540688104701114, + "loss": 0.7438, + "mean_token_accuracy": 0.7765189170837402, + "num_tokens": 109495100.0, + "step": 32180 + }, + { + "epoch": 0.3230759966277249, + "learning_rate": 0.00013538680798105102, + "loss": 0.7528, + "mean_token_accuracy": 0.7719919204711914, + "num_tokens": 109528647.0, + "step": 32190 + }, + { + "epoch": 0.3231763619575254, + "learning_rate": 0.00013536673491509093, + "loss": 0.7375, + "mean_token_accuracy": 0.7776155114173889, + "num_tokens": 109562188.0, + "step": 32200 + }, + { + "epoch": 0.32327672728732587, + "learning_rate": 0.00013534666184913084, + "loss": 0.7821, + "mean_token_accuracy": 0.7668117403984069, + "num_tokens": 109596286.0, + "step": 32210 + }, + { + "epoch": 0.3233770926171263, + "learning_rate": 0.00013532658878317075, + "loss": 0.7488, + "mean_token_accuracy": 0.777635246515274, + "num_tokens": 109630329.0, + "step": 32220 + }, + { + "epoch": 0.32347745794692684, + "learning_rate": 0.00013530651571721066, + "loss": 0.7407, + "mean_token_accuracy": 0.7749003648757935, + "num_tokens": 109664612.0, + "step": 32230 + }, + { + "epoch": 0.3235778232767273, + "learning_rate": 0.00013528644265125057, + "loss": 0.7774, + "mean_token_accuracy": 0.7638455092906952, + "num_tokens": 109698578.0, + "step": 32240 + }, + { + "epoch": 0.32367818860652775, + "learning_rate": 0.00013526636958529047, + "loss": 0.7846, + "mean_token_accuracy": 0.7743920683860779, + "num_tokens": 109731731.0, + "step": 32250 + }, + { + "epoch": 0.32377855393632826, + "learning_rate": 0.00013524629651933036, + "loss": 0.7861, + "mean_token_accuracy": 0.7681153833866119, + "num_tokens": 109765201.0, + "step": 32260 + }, + { + "epoch": 0.3238789192661287, + "learning_rate": 0.0001352262234533703, + "loss": 0.7314, + "mean_token_accuracy": 0.7845546007156372, + "num_tokens": 109799147.0, + "step": 32270 + }, + { + "epoch": 0.3239792845959292, + "learning_rate": 0.00013520615038741017, + "loss": 0.7559, + "mean_token_accuracy": 0.7764472961425781, + "num_tokens": 109832615.0, + "step": 32280 + }, + { + "epoch": 0.32407964992572963, + "learning_rate": 0.00013518607732145008, + "loss": 0.7769, + "mean_token_accuracy": 0.77084321975708, + "num_tokens": 109867074.0, + "step": 32290 + }, + { + "epoch": 0.32418001525553014, + "learning_rate": 0.00013516600425549, + "loss": 0.752, + "mean_token_accuracy": 0.7727360308170319, + "num_tokens": 109900583.0, + "step": 32300 + }, + { + "epoch": 0.3242803805853306, + "learning_rate": 0.0001351459311895299, + "loss": 0.7216, + "mean_token_accuracy": 0.7850228488445282, + "num_tokens": 109934782.0, + "step": 32310 + }, + { + "epoch": 0.32438074591513105, + "learning_rate": 0.00013512585812356978, + "loss": 0.7754, + "mean_token_accuracy": 0.7770364701747894, + "num_tokens": 109968322.0, + "step": 32320 + }, + { + "epoch": 0.32448111124493156, + "learning_rate": 0.00013510578505760971, + "loss": 0.7411, + "mean_token_accuracy": 0.7774547398090362, + "num_tokens": 110002369.0, + "step": 32330 + }, + { + "epoch": 0.324581476574732, + "learning_rate": 0.00013508571199164962, + "loss": 0.7426, + "mean_token_accuracy": 0.7777173161506653, + "num_tokens": 110036212.0, + "step": 32340 + }, + { + "epoch": 0.3246818419045325, + "learning_rate": 0.0001350656389256895, + "loss": 0.748, + "mean_token_accuracy": 0.7730215549468994, + "num_tokens": 110070000.0, + "step": 32350 + }, + { + "epoch": 0.324782207234333, + "learning_rate": 0.00013504556585972944, + "loss": 0.7533, + "mean_token_accuracy": 0.7774468004703522, + "num_tokens": 110103539.0, + "step": 32360 + }, + { + "epoch": 0.32488257256413344, + "learning_rate": 0.00013502549279376932, + "loss": 0.7742, + "mean_token_accuracy": 0.7731855750083924, + "num_tokens": 110136345.0, + "step": 32370 + }, + { + "epoch": 0.3249829378939339, + "learning_rate": 0.00013500541972780923, + "loss": 0.7251, + "mean_token_accuracy": 0.7809814929962158, + "num_tokens": 110170090.0, + "step": 32380 + }, + { + "epoch": 0.3250833032237344, + "learning_rate": 0.00013498534666184914, + "loss": 0.7673, + "mean_token_accuracy": 0.7671895265579224, + "num_tokens": 110204187.0, + "step": 32390 + }, + { + "epoch": 0.32518366855353487, + "learning_rate": 0.00013496527359588905, + "loss": 0.779, + "mean_token_accuracy": 0.7657867550849915, + "num_tokens": 110237628.0, + "step": 32400 + }, + { + "epoch": 0.3252840338833353, + "learning_rate": 0.00013494520052992893, + "loss": 0.7715, + "mean_token_accuracy": 0.7649196982383728, + "num_tokens": 110271972.0, + "step": 32410 + }, + { + "epoch": 0.32538439921313583, + "learning_rate": 0.00013492512746396886, + "loss": 0.7628, + "mean_token_accuracy": 0.7747393310070038, + "num_tokens": 110305474.0, + "step": 32420 + }, + { + "epoch": 0.3254847645429363, + "learning_rate": 0.00013490505439800875, + "loss": 0.7726, + "mean_token_accuracy": 0.7721804261207581, + "num_tokens": 110338273.0, + "step": 32430 + }, + { + "epoch": 0.32558512987273674, + "learning_rate": 0.00013488498133204865, + "loss": 0.7774, + "mean_token_accuracy": 0.7693785786628723, + "num_tokens": 110371668.0, + "step": 32440 + }, + { + "epoch": 0.32568549520253726, + "learning_rate": 0.00013486490826608856, + "loss": 0.733, + "mean_token_accuracy": 0.7804516375064849, + "num_tokens": 110405971.0, + "step": 32450 + }, + { + "epoch": 0.3257858605323377, + "learning_rate": 0.00013484483520012847, + "loss": 0.7488, + "mean_token_accuracy": 0.7758582949638366, + "num_tokens": 110439381.0, + "step": 32460 + }, + { + "epoch": 0.32588622586213817, + "learning_rate": 0.00013482476213416838, + "loss": 0.7303, + "mean_token_accuracy": 0.7835233032703399, + "num_tokens": 110473526.0, + "step": 32470 + }, + { + "epoch": 0.3259865911919387, + "learning_rate": 0.0001348046890682083, + "loss": 0.7464, + "mean_token_accuracy": 0.7742891490459443, + "num_tokens": 110507850.0, + "step": 32480 + }, + { + "epoch": 0.32608695652173914, + "learning_rate": 0.0001347846160022482, + "loss": 0.7535, + "mean_token_accuracy": 0.7720338225364685, + "num_tokens": 110541759.0, + "step": 32490 + }, + { + "epoch": 0.3261873218515396, + "learning_rate": 0.00013476454293628808, + "loss": 0.755, + "mean_token_accuracy": 0.7763753592967987, + "num_tokens": 110576055.0, + "step": 32500 + }, + { + "epoch": 0.3262876871813401, + "learning_rate": 0.000134744469870328, + "loss": 0.7564, + "mean_token_accuracy": 0.7785202860832214, + "num_tokens": 110610513.0, + "step": 32510 + }, + { + "epoch": 0.32638805251114056, + "learning_rate": 0.0001347243968043679, + "loss": 0.7451, + "mean_token_accuracy": 0.779188472032547, + "num_tokens": 110644185.0, + "step": 32520 + }, + { + "epoch": 0.326488417840941, + "learning_rate": 0.0001347043237384078, + "loss": 0.761, + "mean_token_accuracy": 0.7707403719425201, + "num_tokens": 110678583.0, + "step": 32530 + }, + { + "epoch": 0.3265887831707415, + "learning_rate": 0.0001346842506724477, + "loss": 0.8044, + "mean_token_accuracy": 0.7612372517585755, + "num_tokens": 110712884.0, + "step": 32540 + }, + { + "epoch": 0.326689148500542, + "learning_rate": 0.00013466417760648762, + "loss": 0.7689, + "mean_token_accuracy": 0.7703858196735383, + "num_tokens": 110747062.0, + "step": 32550 + }, + { + "epoch": 0.32678951383034244, + "learning_rate": 0.00013464410454052753, + "loss": 0.7614, + "mean_token_accuracy": 0.7742425918579101, + "num_tokens": 110780826.0, + "step": 32560 + }, + { + "epoch": 0.3268898791601429, + "learning_rate": 0.00013462403147456744, + "loss": 0.7633, + "mean_token_accuracy": 0.7720452129840851, + "num_tokens": 110814562.0, + "step": 32570 + }, + { + "epoch": 0.3269902444899434, + "learning_rate": 0.00013460395840860734, + "loss": 0.7455, + "mean_token_accuracy": 0.7741398751735687, + "num_tokens": 110848154.0, + "step": 32580 + }, + { + "epoch": 0.32709060981974386, + "learning_rate": 0.00013458388534264725, + "loss": 0.7573, + "mean_token_accuracy": 0.7721172392368316, + "num_tokens": 110881459.0, + "step": 32590 + }, + { + "epoch": 0.3271909751495443, + "learning_rate": 0.00013456381227668716, + "loss": 0.7939, + "mean_token_accuracy": 0.7620940685272217, + "num_tokens": 110914397.0, + "step": 32600 + }, + { + "epoch": 0.32729134047934483, + "learning_rate": 0.00013454373921072704, + "loss": 0.7785, + "mean_token_accuracy": 0.7706295728683472, + "num_tokens": 110947918.0, + "step": 32610 + }, + { + "epoch": 0.3273917058091453, + "learning_rate": 0.00013452366614476698, + "loss": 0.7222, + "mean_token_accuracy": 0.781663328409195, + "num_tokens": 110981979.0, + "step": 32620 + }, + { + "epoch": 0.32749207113894574, + "learning_rate": 0.00013450359307880686, + "loss": 0.7669, + "mean_token_accuracy": 0.7725927770137787, + "num_tokens": 111015820.0, + "step": 32630 + }, + { + "epoch": 0.32759243646874625, + "learning_rate": 0.00013448352001284677, + "loss": 0.7562, + "mean_token_accuracy": 0.7748718917369842, + "num_tokens": 111049692.0, + "step": 32640 + }, + { + "epoch": 0.3276928017985467, + "learning_rate": 0.00013446344694688668, + "loss": 0.7309, + "mean_token_accuracy": 0.7789419114589691, + "num_tokens": 111083911.0, + "step": 32650 + }, + { + "epoch": 0.32779316712834716, + "learning_rate": 0.00013444337388092658, + "loss": 0.7848, + "mean_token_accuracy": 0.7680621981620789, + "num_tokens": 111117609.0, + "step": 32660 + }, + { + "epoch": 0.3278935324581477, + "learning_rate": 0.00013442330081496647, + "loss": 0.7443, + "mean_token_accuracy": 0.7761209666728973, + "num_tokens": 111151150.0, + "step": 32670 + }, + { + "epoch": 0.32799389778794813, + "learning_rate": 0.0001344032277490064, + "loss": 0.7367, + "mean_token_accuracy": 0.7787201941013336, + "num_tokens": 111185526.0, + "step": 32680 + }, + { + "epoch": 0.3280942631177486, + "learning_rate": 0.0001343831546830463, + "loss": 0.7413, + "mean_token_accuracy": 0.7789070963859558, + "num_tokens": 111219612.0, + "step": 32690 + }, + { + "epoch": 0.3281946284475491, + "learning_rate": 0.0001343630816170862, + "loss": 0.7764, + "mean_token_accuracy": 0.7700829148292542, + "num_tokens": 111253256.0, + "step": 32700 + }, + { + "epoch": 0.32829499377734955, + "learning_rate": 0.00013434300855112613, + "loss": 0.7816, + "mean_token_accuracy": 0.7685696482658386, + "num_tokens": 111287245.0, + "step": 32710 + }, + { + "epoch": 0.32839535910715, + "learning_rate": 0.000134322935485166, + "loss": 0.7604, + "mean_token_accuracy": 0.7750800907611847, + "num_tokens": 111321100.0, + "step": 32720 + }, + { + "epoch": 0.3284957244369505, + "learning_rate": 0.00013430286241920592, + "loss": 0.7915, + "mean_token_accuracy": 0.7680218696594239, + "num_tokens": 111355057.0, + "step": 32730 + }, + { + "epoch": 0.328596089766751, + "learning_rate": 0.00013428278935324583, + "loss": 0.7215, + "mean_token_accuracy": 0.7815347969532013, + "num_tokens": 111388575.0, + "step": 32740 + }, + { + "epoch": 0.32869645509655143, + "learning_rate": 0.00013426271628728573, + "loss": 0.7809, + "mean_token_accuracy": 0.76324343085289, + "num_tokens": 111422438.0, + "step": 32750 + }, + { + "epoch": 0.32879682042635194, + "learning_rate": 0.00013424264322132561, + "loss": 0.7351, + "mean_token_accuracy": 0.7771598517894744, + "num_tokens": 111456396.0, + "step": 32760 + }, + { + "epoch": 0.3288971857561524, + "learning_rate": 0.00013422257015536555, + "loss": 0.7734, + "mean_token_accuracy": 0.770964401960373, + "num_tokens": 111490311.0, + "step": 32770 + }, + { + "epoch": 0.32899755108595286, + "learning_rate": 0.00013420249708940543, + "loss": 0.7446, + "mean_token_accuracy": 0.7775906801223755, + "num_tokens": 111524145.0, + "step": 32780 + }, + { + "epoch": 0.32909791641575337, + "learning_rate": 0.00013418242402344534, + "loss": 0.7306, + "mean_token_accuracy": 0.7793404579162597, + "num_tokens": 111557884.0, + "step": 32790 + }, + { + "epoch": 0.3291982817455538, + "learning_rate": 0.00013416235095748525, + "loss": 0.7758, + "mean_token_accuracy": 0.7654808759689331, + "num_tokens": 111592317.0, + "step": 32800 + }, + { + "epoch": 0.3292986470753543, + "learning_rate": 0.00013414227789152516, + "loss": 0.7803, + "mean_token_accuracy": 0.7690751791000366, + "num_tokens": 111626167.0, + "step": 32810 + }, + { + "epoch": 0.3293990124051548, + "learning_rate": 0.00013412220482556507, + "loss": 0.7451, + "mean_token_accuracy": 0.7735684156417847, + "num_tokens": 111660400.0, + "step": 32820 + }, + { + "epoch": 0.32949937773495525, + "learning_rate": 0.00013410213175960497, + "loss": 0.7404, + "mean_token_accuracy": 0.7744576811790467, + "num_tokens": 111693706.0, + "step": 32830 + }, + { + "epoch": 0.3295997430647557, + "learning_rate": 0.00013408205869364488, + "loss": 0.7158, + "mean_token_accuracy": 0.7870796263217926, + "num_tokens": 111728784.0, + "step": 32840 + }, + { + "epoch": 0.32970010839455616, + "learning_rate": 0.00013406198562768476, + "loss": 0.7483, + "mean_token_accuracy": 0.7753908455371856, + "num_tokens": 111762190.0, + "step": 32850 + }, + { + "epoch": 0.32980047372435667, + "learning_rate": 0.0001340419125617247, + "loss": 0.7715, + "mean_token_accuracy": 0.7680457413196564, + "num_tokens": 111795924.0, + "step": 32860 + }, + { + "epoch": 0.3299008390541571, + "learning_rate": 0.00013402183949576458, + "loss": 0.7497, + "mean_token_accuracy": 0.780243182182312, + "num_tokens": 111830676.0, + "step": 32870 + }, + { + "epoch": 0.3300012043839576, + "learning_rate": 0.0001340017664298045, + "loss": 0.7237, + "mean_token_accuracy": 0.7785914659500122, + "num_tokens": 111865386.0, + "step": 32880 + }, + { + "epoch": 0.3301015697137581, + "learning_rate": 0.0001339816933638444, + "loss": 0.7486, + "mean_token_accuracy": 0.7758556783199311, + "num_tokens": 111900025.0, + "step": 32890 + }, + { + "epoch": 0.33020193504355855, + "learning_rate": 0.0001339616202978843, + "loss": 0.7167, + "mean_token_accuracy": 0.7822706520557403, + "num_tokens": 111934397.0, + "step": 32900 + }, + { + "epoch": 0.330302300373359, + "learning_rate": 0.00013394154723192421, + "loss": 0.7619, + "mean_token_accuracy": 0.7716590762138367, + "num_tokens": 111968689.0, + "step": 32910 + }, + { + "epoch": 0.3304026657031595, + "learning_rate": 0.00013392147416596412, + "loss": 0.7765, + "mean_token_accuracy": 0.7701333463191986, + "num_tokens": 112002218.0, + "step": 32920 + }, + { + "epoch": 0.33050303103295997, + "learning_rate": 0.00013390140110000403, + "loss": 0.7771, + "mean_token_accuracy": 0.7687518417835235, + "num_tokens": 112036797.0, + "step": 32930 + }, + { + "epoch": 0.3306033963627604, + "learning_rate": 0.0001338813280340439, + "loss": 0.713, + "mean_token_accuracy": 0.7801484882831573, + "num_tokens": 112070215.0, + "step": 32940 + }, + { + "epoch": 0.33070376169256094, + "learning_rate": 0.00013386125496808385, + "loss": 0.7612, + "mean_token_accuracy": 0.7749812602996826, + "num_tokens": 112103638.0, + "step": 32950 + }, + { + "epoch": 0.3308041270223614, + "learning_rate": 0.00013384118190212373, + "loss": 0.7673, + "mean_token_accuracy": 0.7733631312847138, + "num_tokens": 112138067.0, + "step": 32960 + }, + { + "epoch": 0.33090449235216185, + "learning_rate": 0.00013382110883616364, + "loss": 0.7533, + "mean_token_accuracy": 0.7756132185459137, + "num_tokens": 112172079.0, + "step": 32970 + }, + { + "epoch": 0.33100485768196236, + "learning_rate": 0.00013380103577020355, + "loss": 0.7388, + "mean_token_accuracy": 0.7763786613941193, + "num_tokens": 112206025.0, + "step": 32980 + }, + { + "epoch": 0.3311052230117628, + "learning_rate": 0.00013378096270424345, + "loss": 0.7757, + "mean_token_accuracy": 0.7680737316608429, + "num_tokens": 112240165.0, + "step": 32990 + }, + { + "epoch": 0.3312055883415633, + "learning_rate": 0.00013376088963828334, + "loss": 0.735, + "mean_token_accuracy": 0.7775642335414886, + "num_tokens": 112275631.0, + "step": 33000 + }, + { + "epoch": 0.3313059536713638, + "learning_rate": 0.00013374081657232327, + "loss": 0.7499, + "mean_token_accuracy": 0.7708619713783265, + "num_tokens": 112309657.0, + "step": 33010 + }, + { + "epoch": 0.33140631900116424, + "learning_rate": 0.00013372074350636315, + "loss": 0.7433, + "mean_token_accuracy": 0.7745214879512787, + "num_tokens": 112343525.0, + "step": 33020 + }, + { + "epoch": 0.3315066843309647, + "learning_rate": 0.00013370067044040306, + "loss": 0.7469, + "mean_token_accuracy": 0.7738293886184693, + "num_tokens": 112377528.0, + "step": 33030 + }, + { + "epoch": 0.3316070496607652, + "learning_rate": 0.000133680597374443, + "loss": 0.7807, + "mean_token_accuracy": 0.7650661706924439, + "num_tokens": 112411905.0, + "step": 33040 + }, + { + "epoch": 0.33170741499056566, + "learning_rate": 0.00013366052430848288, + "loss": 0.731, + "mean_token_accuracy": 0.786162942647934, + "num_tokens": 112445630.0, + "step": 33050 + }, + { + "epoch": 0.3318077803203661, + "learning_rate": 0.0001336404512425228, + "loss": 0.77, + "mean_token_accuracy": 0.772778207063675, + "num_tokens": 112479626.0, + "step": 33060 + }, + { + "epoch": 0.33190814565016663, + "learning_rate": 0.0001336203781765627, + "loss": 0.7362, + "mean_token_accuracy": 0.779965078830719, + "num_tokens": 112514031.0, + "step": 33070 + }, + { + "epoch": 0.3320085109799671, + "learning_rate": 0.0001336003051106026, + "loss": 0.7623, + "mean_token_accuracy": 0.7643588244915008, + "num_tokens": 112547695.0, + "step": 33080 + }, + { + "epoch": 0.33210887630976754, + "learning_rate": 0.00013358023204464248, + "loss": 0.7772, + "mean_token_accuracy": 0.76376793384552, + "num_tokens": 112581138.0, + "step": 33090 + }, + { + "epoch": 0.33220924163956805, + "learning_rate": 0.00013356015897868242, + "loss": 0.7519, + "mean_token_accuracy": 0.7737384855747222, + "num_tokens": 112614594.0, + "step": 33100 + }, + { + "epoch": 0.3323096069693685, + "learning_rate": 0.0001335400859127223, + "loss": 0.7219, + "mean_token_accuracy": 0.7840776026248932, + "num_tokens": 112649149.0, + "step": 33110 + }, + { + "epoch": 0.33240997229916897, + "learning_rate": 0.0001335200128467622, + "loss": 0.7044, + "mean_token_accuracy": 0.785427987575531, + "num_tokens": 112683810.0, + "step": 33120 + }, + { + "epoch": 0.3325103376289694, + "learning_rate": 0.00013349993978080212, + "loss": 0.7675, + "mean_token_accuracy": 0.7721398591995239, + "num_tokens": 112718643.0, + "step": 33130 + }, + { + "epoch": 0.33261070295876993, + "learning_rate": 0.00013347986671484203, + "loss": 0.7445, + "mean_token_accuracy": 0.7793696880340576, + "num_tokens": 112753716.0, + "step": 33140 + }, + { + "epoch": 0.3327110682885704, + "learning_rate": 0.00013345979364888194, + "loss": 0.738, + "mean_token_accuracy": 0.7804455637931824, + "num_tokens": 112787918.0, + "step": 33150 + }, + { + "epoch": 0.33281143361837084, + "learning_rate": 0.00013343972058292184, + "loss": 0.7676, + "mean_token_accuracy": 0.774154680967331, + "num_tokens": 112821656.0, + "step": 33160 + }, + { + "epoch": 0.33291179894817136, + "learning_rate": 0.00013341964751696175, + "loss": 0.7533, + "mean_token_accuracy": 0.7727014660835266, + "num_tokens": 112854785.0, + "step": 33170 + }, + { + "epoch": 0.3330121642779718, + "learning_rate": 0.00013339957445100166, + "loss": 0.786, + "mean_token_accuracy": 0.7679924726486206, + "num_tokens": 112888695.0, + "step": 33180 + }, + { + "epoch": 0.33311252960777227, + "learning_rate": 0.00013337950138504157, + "loss": 0.7842, + "mean_token_accuracy": 0.7727905869483948, + "num_tokens": 112922612.0, + "step": 33190 + }, + { + "epoch": 0.3332128949375728, + "learning_rate": 0.00013335942831908145, + "loss": 0.7756, + "mean_token_accuracy": 0.7724378049373627, + "num_tokens": 112956776.0, + "step": 33200 + }, + { + "epoch": 0.33331326026737323, + "learning_rate": 0.00013333935525312139, + "loss": 0.747, + "mean_token_accuracy": 0.7820969820022583, + "num_tokens": 112991034.0, + "step": 33210 + }, + { + "epoch": 0.3334136255971737, + "learning_rate": 0.00013331928218716127, + "loss": 0.8043, + "mean_token_accuracy": 0.7656574070453643, + "num_tokens": 113025181.0, + "step": 33220 + }, + { + "epoch": 0.3335139909269742, + "learning_rate": 0.00013329920912120118, + "loss": 0.7941, + "mean_token_accuracy": 0.7625795304775238, + "num_tokens": 113059321.0, + "step": 33230 + }, + { + "epoch": 0.33361435625677466, + "learning_rate": 0.00013327913605524108, + "loss": 0.7509, + "mean_token_accuracy": 0.7745759189128876, + "num_tokens": 113093678.0, + "step": 33240 + }, + { + "epoch": 0.3337147215865751, + "learning_rate": 0.000133259062989281, + "loss": 0.77, + "mean_token_accuracy": 0.7712205052375793, + "num_tokens": 113128563.0, + "step": 33250 + }, + { + "epoch": 0.3338150869163756, + "learning_rate": 0.0001332389899233209, + "loss": 0.7575, + "mean_token_accuracy": 0.7760208666324615, + "num_tokens": 113161900.0, + "step": 33260 + }, + { + "epoch": 0.3339154522461761, + "learning_rate": 0.0001332189168573608, + "loss": 0.7669, + "mean_token_accuracy": 0.7747590005397796, + "num_tokens": 113195796.0, + "step": 33270 + }, + { + "epoch": 0.33401581757597654, + "learning_rate": 0.00013319884379140072, + "loss": 0.7615, + "mean_token_accuracy": 0.7751935005187989, + "num_tokens": 113230217.0, + "step": 33280 + }, + { + "epoch": 0.33411618290577705, + "learning_rate": 0.0001331787707254406, + "loss": 0.7407, + "mean_token_accuracy": 0.7739264309406281, + "num_tokens": 113264363.0, + "step": 33290 + }, + { + "epoch": 0.3342165482355775, + "learning_rate": 0.00013315869765948053, + "loss": 0.7416, + "mean_token_accuracy": 0.777640187740326, + "num_tokens": 113297975.0, + "step": 33300 + }, + { + "epoch": 0.33431691356537796, + "learning_rate": 0.00013313862459352042, + "loss": 0.7687, + "mean_token_accuracy": 0.7725668013095855, + "num_tokens": 113331956.0, + "step": 33310 + }, + { + "epoch": 0.33441727889517847, + "learning_rate": 0.00013311855152756032, + "loss": 0.7507, + "mean_token_accuracy": 0.7736175775527954, + "num_tokens": 113365602.0, + "step": 33320 + }, + { + "epoch": 0.3345176442249789, + "learning_rate": 0.00013309847846160023, + "loss": 0.7624, + "mean_token_accuracy": 0.7726190626621247, + "num_tokens": 113400072.0, + "step": 33330 + }, + { + "epoch": 0.3346180095547794, + "learning_rate": 0.00013307840539564014, + "loss": 0.7673, + "mean_token_accuracy": 0.7765252709388732, + "num_tokens": 113434391.0, + "step": 33340 + }, + { + "epoch": 0.3347183748845799, + "learning_rate": 0.00013305833232968002, + "loss": 0.7335, + "mean_token_accuracy": 0.7800052285194397, + "num_tokens": 113468908.0, + "step": 33350 + }, + { + "epoch": 0.33481874021438035, + "learning_rate": 0.00013303825926371996, + "loss": 0.7814, + "mean_token_accuracy": 0.7701805233955383, + "num_tokens": 113502358.0, + "step": 33360 + }, + { + "epoch": 0.3349191055441808, + "learning_rate": 0.00013301818619775984, + "loss": 0.7517, + "mean_token_accuracy": 0.7761437237262726, + "num_tokens": 113536314.0, + "step": 33370 + }, + { + "epoch": 0.3350194708739813, + "learning_rate": 0.00013299811313179975, + "loss": 0.7681, + "mean_token_accuracy": 0.775888878107071, + "num_tokens": 113570309.0, + "step": 33380 + }, + { + "epoch": 0.3351198362037818, + "learning_rate": 0.00013297804006583968, + "loss": 0.7892, + "mean_token_accuracy": 0.765402227640152, + "num_tokens": 113604455.0, + "step": 33390 + }, + { + "epoch": 0.33522020153358223, + "learning_rate": 0.00013295796699987957, + "loss": 0.779, + "mean_token_accuracy": 0.7697222113609314, + "num_tokens": 113638269.0, + "step": 33400 + }, + { + "epoch": 0.33532056686338274, + "learning_rate": 0.00013293789393391947, + "loss": 0.7676, + "mean_token_accuracy": 0.7712249636650086, + "num_tokens": 113671611.0, + "step": 33410 + }, + { + "epoch": 0.3354209321931832, + "learning_rate": 0.00013291782086795938, + "loss": 0.7975, + "mean_token_accuracy": 0.7598975419998169, + "num_tokens": 113705370.0, + "step": 33420 + }, + { + "epoch": 0.33552129752298365, + "learning_rate": 0.0001328977478019993, + "loss": 0.7537, + "mean_token_accuracy": 0.7766621589660645, + "num_tokens": 113739413.0, + "step": 33430 + }, + { + "epoch": 0.3356216628527841, + "learning_rate": 0.00013287767473603917, + "loss": 0.7412, + "mean_token_accuracy": 0.7762495934963226, + "num_tokens": 113773122.0, + "step": 33440 + }, + { + "epoch": 0.3357220281825846, + "learning_rate": 0.0001328576016700791, + "loss": 0.7583, + "mean_token_accuracy": 0.7701814830303192, + "num_tokens": 113806750.0, + "step": 33450 + }, + { + "epoch": 0.3358223935123851, + "learning_rate": 0.000132837528604119, + "loss": 0.7169, + "mean_token_accuracy": 0.7808758616447449, + "num_tokens": 113840318.0, + "step": 33460 + }, + { + "epoch": 0.33592275884218553, + "learning_rate": 0.0001328174555381589, + "loss": 0.7436, + "mean_token_accuracy": 0.7756459295749665, + "num_tokens": 113874432.0, + "step": 33470 + }, + { + "epoch": 0.33602312417198604, + "learning_rate": 0.0001327973824721988, + "loss": 0.7119, + "mean_token_accuracy": 0.7874850273132324, + "num_tokens": 113908087.0, + "step": 33480 + }, + { + "epoch": 0.3361234895017865, + "learning_rate": 0.00013277730940623871, + "loss": 0.7261, + "mean_token_accuracy": 0.7868964076042175, + "num_tokens": 113942239.0, + "step": 33490 + }, + { + "epoch": 0.33622385483158695, + "learning_rate": 0.00013275723634027862, + "loss": 0.7738, + "mean_token_accuracy": 0.7751582086086273, + "num_tokens": 113977213.0, + "step": 33500 + }, + { + "epoch": 0.33632422016138747, + "learning_rate": 0.00013273716327431853, + "loss": 0.7595, + "mean_token_accuracy": 0.7670100629329681, + "num_tokens": 114011306.0, + "step": 33510 + }, + { + "epoch": 0.3364245854911879, + "learning_rate": 0.00013271709020835844, + "loss": 0.7309, + "mean_token_accuracy": 0.7738402605056762, + "num_tokens": 114044696.0, + "step": 33520 + }, + { + "epoch": 0.3365249508209884, + "learning_rate": 0.00013269701714239832, + "loss": 0.7194, + "mean_token_accuracy": 0.7780163168907166, + "num_tokens": 114079123.0, + "step": 33530 + }, + { + "epoch": 0.3366253161507889, + "learning_rate": 0.00013267694407643826, + "loss": 0.7331, + "mean_token_accuracy": 0.7774795651435852, + "num_tokens": 114112400.0, + "step": 33540 + }, + { + "epoch": 0.33672568148058935, + "learning_rate": 0.00013265687101047814, + "loss": 0.7677, + "mean_token_accuracy": 0.7680506944656372, + "num_tokens": 114146960.0, + "step": 33550 + }, + { + "epoch": 0.3368260468103898, + "learning_rate": 0.00013263679794451805, + "loss": 0.7855, + "mean_token_accuracy": 0.7739035665988923, + "num_tokens": 114181005.0, + "step": 33560 + }, + { + "epoch": 0.3369264121401903, + "learning_rate": 0.00013261672487855795, + "loss": 0.7608, + "mean_token_accuracy": 0.7679487466812134, + "num_tokens": 114215045.0, + "step": 33570 + }, + { + "epoch": 0.33702677746999077, + "learning_rate": 0.00013259665181259786, + "loss": 0.7793, + "mean_token_accuracy": 0.7649344563484192, + "num_tokens": 114249721.0, + "step": 33580 + }, + { + "epoch": 0.3371271427997912, + "learning_rate": 0.00013257657874663777, + "loss": 0.756, + "mean_token_accuracy": 0.7732738375663757, + "num_tokens": 114283046.0, + "step": 33590 + }, + { + "epoch": 0.33722750812959174, + "learning_rate": 0.00013255650568067768, + "loss": 0.7317, + "mean_token_accuracy": 0.7844031035900116, + "num_tokens": 114316849.0, + "step": 33600 + }, + { + "epoch": 0.3373278734593922, + "learning_rate": 0.0001325364326147176, + "loss": 0.7988, + "mean_token_accuracy": 0.7640057265758514, + "num_tokens": 114351571.0, + "step": 33610 + }, + { + "epoch": 0.33742823878919265, + "learning_rate": 0.00013251635954875747, + "loss": 0.7519, + "mean_token_accuracy": 0.7793439984321594, + "num_tokens": 114386001.0, + "step": 33620 + }, + { + "epoch": 0.33752860411899316, + "learning_rate": 0.0001324962864827974, + "loss": 0.7257, + "mean_token_accuracy": 0.7815295815467834, + "num_tokens": 114419334.0, + "step": 33630 + }, + { + "epoch": 0.3376289694487936, + "learning_rate": 0.00013247621341683729, + "loss": 0.7377, + "mean_token_accuracy": 0.7777803003787994, + "num_tokens": 114453671.0, + "step": 33640 + }, + { + "epoch": 0.33772933477859407, + "learning_rate": 0.0001324561403508772, + "loss": 0.7362, + "mean_token_accuracy": 0.7769293785095215, + "num_tokens": 114487910.0, + "step": 33650 + }, + { + "epoch": 0.3378297001083946, + "learning_rate": 0.0001324360672849171, + "loss": 0.773, + "mean_token_accuracy": 0.7708508253097535, + "num_tokens": 114521896.0, + "step": 33660 + }, + { + "epoch": 0.33793006543819504, + "learning_rate": 0.000132415994218957, + "loss": 0.7422, + "mean_token_accuracy": 0.7837636888027191, + "num_tokens": 114555562.0, + "step": 33670 + }, + { + "epoch": 0.3380304307679955, + "learning_rate": 0.0001323959211529969, + "loss": 0.7765, + "mean_token_accuracy": 0.7641663014888763, + "num_tokens": 114589536.0, + "step": 33680 + }, + { + "epoch": 0.338130796097796, + "learning_rate": 0.00013237584808703683, + "loss": 0.7351, + "mean_token_accuracy": 0.7833424389362336, + "num_tokens": 114624010.0, + "step": 33690 + }, + { + "epoch": 0.33823116142759646, + "learning_rate": 0.0001323557750210767, + "loss": 0.7415, + "mean_token_accuracy": 0.7737758994102478, + "num_tokens": 114659004.0, + "step": 33700 + }, + { + "epoch": 0.3383315267573969, + "learning_rate": 0.00013233570195511662, + "loss": 0.7369, + "mean_token_accuracy": 0.7746557354927063, + "num_tokens": 114693217.0, + "step": 33710 + }, + { + "epoch": 0.3384318920871974, + "learning_rate": 0.00013231562888915653, + "loss": 0.758, + "mean_token_accuracy": 0.7718977212905884, + "num_tokens": 114727453.0, + "step": 33720 + }, + { + "epoch": 0.3385322574169979, + "learning_rate": 0.00013229555582319644, + "loss": 0.7768, + "mean_token_accuracy": 0.7677544355392456, + "num_tokens": 114761416.0, + "step": 33730 + }, + { + "epoch": 0.33863262274679834, + "learning_rate": 0.00013227548275723637, + "loss": 0.7648, + "mean_token_accuracy": 0.7792239546775818, + "num_tokens": 114796186.0, + "step": 33740 + }, + { + "epoch": 0.3387329880765988, + "learning_rate": 0.00013225540969127625, + "loss": 0.7497, + "mean_token_accuracy": 0.777522736787796, + "num_tokens": 114830535.0, + "step": 33750 + }, + { + "epoch": 0.3388333534063993, + "learning_rate": 0.00013223533662531616, + "loss": 0.7905, + "mean_token_accuracy": 0.7705022990703583, + "num_tokens": 114864785.0, + "step": 33760 + }, + { + "epoch": 0.33893371873619976, + "learning_rate": 0.00013221526355935607, + "loss": 0.7456, + "mean_token_accuracy": 0.7735327541828155, + "num_tokens": 114899124.0, + "step": 33770 + }, + { + "epoch": 0.3390340840660002, + "learning_rate": 0.00013219519049339598, + "loss": 0.738, + "mean_token_accuracy": 0.7773309469223022, + "num_tokens": 114933255.0, + "step": 33780 + }, + { + "epoch": 0.33913444939580073, + "learning_rate": 0.00013217511742743586, + "loss": 0.7447, + "mean_token_accuracy": 0.7761066138744355, + "num_tokens": 114966444.0, + "step": 33790 + }, + { + "epoch": 0.3392348147256012, + "learning_rate": 0.0001321550443614758, + "loss": 0.7671, + "mean_token_accuracy": 0.7687490105628967, + "num_tokens": 115000794.0, + "step": 33800 + }, + { + "epoch": 0.33933518005540164, + "learning_rate": 0.00013213497129551568, + "loss": 0.8074, + "mean_token_accuracy": 0.7668362140655518, + "num_tokens": 115034685.0, + "step": 33810 + }, + { + "epoch": 0.33943554538520215, + "learning_rate": 0.00013211489822955558, + "loss": 0.7391, + "mean_token_accuracy": 0.776666647195816, + "num_tokens": 115068788.0, + "step": 33820 + }, + { + "epoch": 0.3395359107150026, + "learning_rate": 0.0001320948251635955, + "loss": 0.7724, + "mean_token_accuracy": 0.7716356873512268, + "num_tokens": 115103290.0, + "step": 33830 + }, + { + "epoch": 0.33963627604480306, + "learning_rate": 0.0001320747520976354, + "loss": 0.7464, + "mean_token_accuracy": 0.7730439364910126, + "num_tokens": 115137765.0, + "step": 33840 + }, + { + "epoch": 0.3397366413746036, + "learning_rate": 0.0001320546790316753, + "loss": 0.6979, + "mean_token_accuracy": 0.7836260735988617, + "num_tokens": 115172081.0, + "step": 33850 + }, + { + "epoch": 0.33983700670440403, + "learning_rate": 0.00013203460596571522, + "loss": 0.7441, + "mean_token_accuracy": 0.7787925243377686, + "num_tokens": 115206076.0, + "step": 33860 + }, + { + "epoch": 0.3399373720342045, + "learning_rate": 0.00013201453289975513, + "loss": 0.7535, + "mean_token_accuracy": 0.7702636957168579, + "num_tokens": 115240393.0, + "step": 33870 + }, + { + "epoch": 0.340037737364005, + "learning_rate": 0.000131994459833795, + "loss": 0.7475, + "mean_token_accuracy": 0.7734738945960998, + "num_tokens": 115274738.0, + "step": 33880 + }, + { + "epoch": 0.34013810269380546, + "learning_rate": 0.00013197438676783494, + "loss": 0.7848, + "mean_token_accuracy": 0.7629347026348114, + "num_tokens": 115309232.0, + "step": 33890 + }, + { + "epoch": 0.3402384680236059, + "learning_rate": 0.00013195431370187482, + "loss": 0.7588, + "mean_token_accuracy": 0.7716972589492798, + "num_tokens": 115343459.0, + "step": 33900 + }, + { + "epoch": 0.3403388333534064, + "learning_rate": 0.00013193424063591473, + "loss": 0.7236, + "mean_token_accuracy": 0.7831964731216431, + "num_tokens": 115376601.0, + "step": 33910 + }, + { + "epoch": 0.3404391986832069, + "learning_rate": 0.00013191416756995464, + "loss": 0.7618, + "mean_token_accuracy": 0.7727328360080719, + "num_tokens": 115411652.0, + "step": 33920 + }, + { + "epoch": 0.34053956401300733, + "learning_rate": 0.00013189409450399455, + "loss": 0.785, + "mean_token_accuracy": 0.7645107567310333, + "num_tokens": 115445195.0, + "step": 33930 + }, + { + "epoch": 0.34063992934280785, + "learning_rate": 0.00013187402143803446, + "loss": 0.7518, + "mean_token_accuracy": 0.776811945438385, + "num_tokens": 115480020.0, + "step": 33940 + }, + { + "epoch": 0.3407402946726083, + "learning_rate": 0.00013185394837207437, + "loss": 0.7629, + "mean_token_accuracy": 0.7730513215065002, + "num_tokens": 115513375.0, + "step": 33950 + }, + { + "epoch": 0.34084066000240876, + "learning_rate": 0.00013183387530611427, + "loss": 0.7596, + "mean_token_accuracy": 0.7708856523036957, + "num_tokens": 115547440.0, + "step": 33960 + }, + { + "epoch": 0.34094102533220927, + "learning_rate": 0.00013181380224015416, + "loss": 0.7721, + "mean_token_accuracy": 0.7715115666389465, + "num_tokens": 115581768.0, + "step": 33970 + }, + { + "epoch": 0.3410413906620097, + "learning_rate": 0.0001317937291741941, + "loss": 0.7532, + "mean_token_accuracy": 0.7767409980297089, + "num_tokens": 115615429.0, + "step": 33980 + }, + { + "epoch": 0.3411417559918102, + "learning_rate": 0.00013177365610823397, + "loss": 0.77, + "mean_token_accuracy": 0.7690534293651581, + "num_tokens": 115649748.0, + "step": 33990 + }, + { + "epoch": 0.34124212132161064, + "learning_rate": 0.00013175358304227388, + "loss": 0.7296, + "mean_token_accuracy": 0.7769282817840576, + "num_tokens": 115683651.0, + "step": 34000 + }, + { + "epoch": 0.34134248665141115, + "learning_rate": 0.0001317335099763138, + "loss": 0.7216, + "mean_token_accuracy": 0.7827814757823944, + "num_tokens": 115716730.0, + "step": 34010 + }, + { + "epoch": 0.3414428519812116, + "learning_rate": 0.0001317134369103537, + "loss": 0.7357, + "mean_token_accuracy": 0.7795480132102967, + "num_tokens": 115751124.0, + "step": 34020 + }, + { + "epoch": 0.34154321731101206, + "learning_rate": 0.00013169336384439358, + "loss": 0.7566, + "mean_token_accuracy": 0.7710654735565186, + "num_tokens": 115785214.0, + "step": 34030 + }, + { + "epoch": 0.34164358264081257, + "learning_rate": 0.00013167329077843352, + "loss": 0.7452, + "mean_token_accuracy": 0.7726763129234314, + "num_tokens": 115820126.0, + "step": 34040 + }, + { + "epoch": 0.341743947970613, + "learning_rate": 0.0001316532177124734, + "loss": 0.7341, + "mean_token_accuracy": 0.7802583396434783, + "num_tokens": 115853698.0, + "step": 34050 + }, + { + "epoch": 0.3418443133004135, + "learning_rate": 0.0001316331446465133, + "loss": 0.7339, + "mean_token_accuracy": 0.7817862033843994, + "num_tokens": 115888144.0, + "step": 34060 + }, + { + "epoch": 0.341944678630214, + "learning_rate": 0.0001316130715805532, + "loss": 0.766, + "mean_token_accuracy": 0.770089042186737, + "num_tokens": 115921786.0, + "step": 34070 + }, + { + "epoch": 0.34204504396001445, + "learning_rate": 0.00013159299851459312, + "loss": 0.7531, + "mean_token_accuracy": 0.7753535389900208, + "num_tokens": 115955388.0, + "step": 34080 + }, + { + "epoch": 0.3421454092898149, + "learning_rate": 0.00013157292544863303, + "loss": 0.7529, + "mean_token_accuracy": 0.7741257071495056, + "num_tokens": 115989914.0, + "step": 34090 + }, + { + "epoch": 0.3422457746196154, + "learning_rate": 0.00013155285238267294, + "loss": 0.7196, + "mean_token_accuracy": 0.7788474857807159, + "num_tokens": 116024304.0, + "step": 34100 + }, + { + "epoch": 0.3423461399494159, + "learning_rate": 0.00013153277931671285, + "loss": 0.7428, + "mean_token_accuracy": 0.7727693736553192, + "num_tokens": 116058515.0, + "step": 34110 + }, + { + "epoch": 0.34244650527921633, + "learning_rate": 0.00013151270625075273, + "loss": 0.7728, + "mean_token_accuracy": 0.770117312669754, + "num_tokens": 116092672.0, + "step": 34120 + }, + { + "epoch": 0.34254687060901684, + "learning_rate": 0.00013149263318479266, + "loss": 0.7581, + "mean_token_accuracy": 0.7690131008625031, + "num_tokens": 116125713.0, + "step": 34130 + }, + { + "epoch": 0.3426472359388173, + "learning_rate": 0.00013147256011883255, + "loss": 0.7164, + "mean_token_accuracy": 0.7797726035118103, + "num_tokens": 116159272.0, + "step": 34140 + }, + { + "epoch": 0.34274760126861775, + "learning_rate": 0.00013145248705287245, + "loss": 0.7331, + "mean_token_accuracy": 0.7755063772201538, + "num_tokens": 116193734.0, + "step": 34150 + }, + { + "epoch": 0.34284796659841826, + "learning_rate": 0.00013143241398691236, + "loss": 0.7498, + "mean_token_accuracy": 0.7762515246868134, + "num_tokens": 116227360.0, + "step": 34160 + }, + { + "epoch": 0.3429483319282187, + "learning_rate": 0.00013141234092095227, + "loss": 0.7702, + "mean_token_accuracy": 0.7699919462203979, + "num_tokens": 116261561.0, + "step": 34170 + }, + { + "epoch": 0.3430486972580192, + "learning_rate": 0.00013139226785499218, + "loss": 0.7704, + "mean_token_accuracy": 0.7696660220623016, + "num_tokens": 116295154.0, + "step": 34180 + }, + { + "epoch": 0.3431490625878197, + "learning_rate": 0.0001313721947890321, + "loss": 0.7273, + "mean_token_accuracy": 0.7759283125400543, + "num_tokens": 116329446.0, + "step": 34190 + }, + { + "epoch": 0.34324942791762014, + "learning_rate": 0.000131352121723072, + "loss": 0.7253, + "mean_token_accuracy": 0.780819696187973, + "num_tokens": 116362873.0, + "step": 34200 + }, + { + "epoch": 0.3433497932474206, + "learning_rate": 0.00013133204865711188, + "loss": 0.7716, + "mean_token_accuracy": 0.7736681044101715, + "num_tokens": 116397957.0, + "step": 34210 + }, + { + "epoch": 0.3434501585772211, + "learning_rate": 0.0001313119755911518, + "loss": 0.7398, + "mean_token_accuracy": 0.776227742433548, + "num_tokens": 116431767.0, + "step": 34220 + }, + { + "epoch": 0.34355052390702157, + "learning_rate": 0.0001312919025251917, + "loss": 0.7586, + "mean_token_accuracy": 0.7764150321483612, + "num_tokens": 116465353.0, + "step": 34230 + }, + { + "epoch": 0.343650889236822, + "learning_rate": 0.0001312718294592316, + "loss": 0.7457, + "mean_token_accuracy": 0.778573626279831, + "num_tokens": 116499430.0, + "step": 34240 + }, + { + "epoch": 0.34375125456662253, + "learning_rate": 0.0001312517563932715, + "loss": 0.7607, + "mean_token_accuracy": 0.7732001185417176, + "num_tokens": 116533055.0, + "step": 34250 + }, + { + "epoch": 0.343851619896423, + "learning_rate": 0.00013123168332731142, + "loss": 0.7104, + "mean_token_accuracy": 0.7862925827503204, + "num_tokens": 116566761.0, + "step": 34260 + }, + { + "epoch": 0.34395198522622344, + "learning_rate": 0.0001312116102613513, + "loss": 0.7493, + "mean_token_accuracy": 0.7757634878158569, + "num_tokens": 116601230.0, + "step": 34270 + }, + { + "epoch": 0.3440523505560239, + "learning_rate": 0.00013119153719539124, + "loss": 0.7143, + "mean_token_accuracy": 0.7833714783191681, + "num_tokens": 116635485.0, + "step": 34280 + }, + { + "epoch": 0.3441527158858244, + "learning_rate": 0.00013117146412943114, + "loss": 0.7714, + "mean_token_accuracy": 0.7680694222450256, + "num_tokens": 116669000.0, + "step": 34290 + }, + { + "epoch": 0.34425308121562487, + "learning_rate": 0.00013115139106347105, + "loss": 0.7681, + "mean_token_accuracy": 0.7697263181209564, + "num_tokens": 116702279.0, + "step": 34300 + }, + { + "epoch": 0.3443534465454253, + "learning_rate": 0.00013113131799751096, + "loss": 0.7651, + "mean_token_accuracy": 0.7704175889492035, + "num_tokens": 116737439.0, + "step": 34310 + }, + { + "epoch": 0.34445381187522583, + "learning_rate": 0.00013111124493155084, + "loss": 0.7408, + "mean_token_accuracy": 0.772112762928009, + "num_tokens": 116771416.0, + "step": 34320 + }, + { + "epoch": 0.3445541772050263, + "learning_rate": 0.00013109117186559078, + "loss": 0.7741, + "mean_token_accuracy": 0.7686093211174011, + "num_tokens": 116805417.0, + "step": 34330 + }, + { + "epoch": 0.34465454253482675, + "learning_rate": 0.00013107109879963066, + "loss": 0.7347, + "mean_token_accuracy": 0.7795671701431275, + "num_tokens": 116839763.0, + "step": 34340 + }, + { + "epoch": 0.34475490786462726, + "learning_rate": 0.00013105102573367057, + "loss": 0.7435, + "mean_token_accuracy": 0.7816221535205841, + "num_tokens": 116873743.0, + "step": 34350 + }, + { + "epoch": 0.3448552731944277, + "learning_rate": 0.00013103095266771048, + "loss": 0.7729, + "mean_token_accuracy": 0.7747231245040893, + "num_tokens": 116907959.0, + "step": 34360 + }, + { + "epoch": 0.34495563852422817, + "learning_rate": 0.00013101087960175039, + "loss": 0.776, + "mean_token_accuracy": 0.7699971199035645, + "num_tokens": 116943038.0, + "step": 34370 + }, + { + "epoch": 0.3450560038540287, + "learning_rate": 0.00013099080653579027, + "loss": 0.7639, + "mean_token_accuracy": 0.771040403842926, + "num_tokens": 116977229.0, + "step": 34380 + }, + { + "epoch": 0.34515636918382914, + "learning_rate": 0.0001309707334698302, + "loss": 0.7505, + "mean_token_accuracy": 0.776633882522583, + "num_tokens": 117010447.0, + "step": 34390 + }, + { + "epoch": 0.3452567345136296, + "learning_rate": 0.00013095066040387008, + "loss": 0.7568, + "mean_token_accuracy": 0.7718197226524353, + "num_tokens": 117044615.0, + "step": 34400 + }, + { + "epoch": 0.3453570998434301, + "learning_rate": 0.00013093058733791, + "loss": 0.7609, + "mean_token_accuracy": 0.7776704132556915, + "num_tokens": 117078330.0, + "step": 34410 + }, + { + "epoch": 0.34545746517323056, + "learning_rate": 0.0001309105142719499, + "loss": 0.7387, + "mean_token_accuracy": 0.7776882827281952, + "num_tokens": 117112490.0, + "step": 34420 + }, + { + "epoch": 0.345557830503031, + "learning_rate": 0.0001308904412059898, + "loss": 0.7586, + "mean_token_accuracy": 0.7724784135818481, + "num_tokens": 117146721.0, + "step": 34430 + }, + { + "epoch": 0.3456581958328315, + "learning_rate": 0.00013087036814002972, + "loss": 0.8169, + "mean_token_accuracy": 0.7559751987457275, + "num_tokens": 117180219.0, + "step": 34440 + }, + { + "epoch": 0.345758561162632, + "learning_rate": 0.00013085029507406963, + "loss": 0.7619, + "mean_token_accuracy": 0.7739854872226715, + "num_tokens": 117214541.0, + "step": 34450 + }, + { + "epoch": 0.34585892649243244, + "learning_rate": 0.00013083022200810953, + "loss": 0.751, + "mean_token_accuracy": 0.7724648296833039, + "num_tokens": 117248602.0, + "step": 34460 + }, + { + "epoch": 0.34595929182223295, + "learning_rate": 0.00013081014894214942, + "loss": 0.7364, + "mean_token_accuracy": 0.7811800599098205, + "num_tokens": 117282082.0, + "step": 34470 + }, + { + "epoch": 0.3460596571520334, + "learning_rate": 0.00013079007587618935, + "loss": 0.7703, + "mean_token_accuracy": 0.771990841627121, + "num_tokens": 117315963.0, + "step": 34480 + }, + { + "epoch": 0.34616002248183386, + "learning_rate": 0.00013077000281022923, + "loss": 0.7498, + "mean_token_accuracy": 0.7722388863563537, + "num_tokens": 117350226.0, + "step": 34490 + }, + { + "epoch": 0.3462603878116344, + "learning_rate": 0.00013074992974426914, + "loss": 0.7521, + "mean_token_accuracy": 0.7755684375762939, + "num_tokens": 117383725.0, + "step": 34500 + }, + { + "epoch": 0.34636075314143483, + "learning_rate": 0.00013072985667830905, + "loss": 0.7562, + "mean_token_accuracy": 0.7758636116981507, + "num_tokens": 117417001.0, + "step": 34510 + }, + { + "epoch": 0.3464611184712353, + "learning_rate": 0.00013070978361234896, + "loss": 0.7435, + "mean_token_accuracy": 0.7790121793746948, + "num_tokens": 117451132.0, + "step": 34520 + }, + { + "epoch": 0.3465614838010358, + "learning_rate": 0.00013068971054638887, + "loss": 0.7731, + "mean_token_accuracy": 0.7720594286918641, + "num_tokens": 117485231.0, + "step": 34530 + }, + { + "epoch": 0.34666184913083625, + "learning_rate": 0.00013066963748042877, + "loss": 0.7634, + "mean_token_accuracy": 0.7742433428764344, + "num_tokens": 117519021.0, + "step": 34540 + }, + { + "epoch": 0.3467622144606367, + "learning_rate": 0.00013064956441446868, + "loss": 0.7545, + "mean_token_accuracy": 0.7752372026443481, + "num_tokens": 117553157.0, + "step": 34550 + }, + { + "epoch": 0.34686257979043716, + "learning_rate": 0.00013062949134850856, + "loss": 0.7887, + "mean_token_accuracy": 0.7634439051151276, + "num_tokens": 117586881.0, + "step": 34560 + }, + { + "epoch": 0.3469629451202377, + "learning_rate": 0.0001306094182825485, + "loss": 0.7672, + "mean_token_accuracy": 0.771806401014328, + "num_tokens": 117621407.0, + "step": 34570 + }, + { + "epoch": 0.34706331045003813, + "learning_rate": 0.00013058934521658838, + "loss": 0.7535, + "mean_token_accuracy": 0.7751614928245545, + "num_tokens": 117655538.0, + "step": 34580 + }, + { + "epoch": 0.3471636757798386, + "learning_rate": 0.0001305692721506283, + "loss": 0.7037, + "mean_token_accuracy": 0.7887448370456696, + "num_tokens": 117689169.0, + "step": 34590 + }, + { + "epoch": 0.3472640411096391, + "learning_rate": 0.0001305491990846682, + "loss": 0.7226, + "mean_token_accuracy": 0.7777604997158051, + "num_tokens": 117723065.0, + "step": 34600 + }, + { + "epoch": 0.34736440643943955, + "learning_rate": 0.0001305291260187081, + "loss": 0.7218, + "mean_token_accuracy": 0.7842798173427582, + "num_tokens": 117757752.0, + "step": 34610 + }, + { + "epoch": 0.34746477176924, + "learning_rate": 0.000130509052952748, + "loss": 0.7401, + "mean_token_accuracy": 0.7753164947032929, + "num_tokens": 117791530.0, + "step": 34620 + }, + { + "epoch": 0.3475651370990405, + "learning_rate": 0.00013048897988678792, + "loss": 0.7484, + "mean_token_accuracy": 0.7727838516235351, + "num_tokens": 117825861.0, + "step": 34630 + }, + { + "epoch": 0.347665502428841, + "learning_rate": 0.00013046890682082783, + "loss": 0.7769, + "mean_token_accuracy": 0.7652743220329284, + "num_tokens": 117859863.0, + "step": 34640 + }, + { + "epoch": 0.34776586775864143, + "learning_rate": 0.0001304488337548677, + "loss": 0.7521, + "mean_token_accuracy": 0.778465723991394, + "num_tokens": 117893913.0, + "step": 34650 + }, + { + "epoch": 0.34786623308844195, + "learning_rate": 0.00013042876068890765, + "loss": 0.7707, + "mean_token_accuracy": 0.7738387942314148, + "num_tokens": 117927990.0, + "step": 34660 + }, + { + "epoch": 0.3479665984182424, + "learning_rate": 0.00013040868762294753, + "loss": 0.7527, + "mean_token_accuracy": 0.7747078657150268, + "num_tokens": 117962835.0, + "step": 34670 + }, + { + "epoch": 0.34806696374804286, + "learning_rate": 0.00013038861455698744, + "loss": 0.7576, + "mean_token_accuracy": 0.7754677116870881, + "num_tokens": 117996774.0, + "step": 34680 + }, + { + "epoch": 0.34816732907784337, + "learning_rate": 0.00013036854149102735, + "loss": 0.7348, + "mean_token_accuracy": 0.7804238975048066, + "num_tokens": 118031436.0, + "step": 34690 + }, + { + "epoch": 0.3482676944076438, + "learning_rate": 0.00013034846842506726, + "loss": 0.7565, + "mean_token_accuracy": 0.7717331767082214, + "num_tokens": 118065332.0, + "step": 34700 + }, + { + "epoch": 0.3483680597374443, + "learning_rate": 0.00013032839535910714, + "loss": 0.7345, + "mean_token_accuracy": 0.7782244682312012, + "num_tokens": 118099396.0, + "step": 34710 + }, + { + "epoch": 0.3484684250672448, + "learning_rate": 0.00013030832229314707, + "loss": 0.7393, + "mean_token_accuracy": 0.7732568264007569, + "num_tokens": 118133559.0, + "step": 34720 + }, + { + "epoch": 0.34856879039704525, + "learning_rate": 0.00013028824922718695, + "loss": 0.7557, + "mean_token_accuracy": 0.7746400594711303, + "num_tokens": 118167606.0, + "step": 34730 + }, + { + "epoch": 0.3486691557268457, + "learning_rate": 0.00013026817616122686, + "loss": 0.7452, + "mean_token_accuracy": 0.7743682622909546, + "num_tokens": 118201977.0, + "step": 34740 + }, + { + "epoch": 0.3487695210566462, + "learning_rate": 0.00013024810309526677, + "loss": 0.7286, + "mean_token_accuracy": 0.7818284869194031, + "num_tokens": 118236029.0, + "step": 34750 + }, + { + "epoch": 0.34886988638644667, + "learning_rate": 0.00013022803002930668, + "loss": 0.7231, + "mean_token_accuracy": 0.7850748658180237, + "num_tokens": 118269975.0, + "step": 34760 + }, + { + "epoch": 0.3489702517162471, + "learning_rate": 0.0001302079569633466, + "loss": 0.7516, + "mean_token_accuracy": 0.7747095584869385, + "num_tokens": 118304176.0, + "step": 34770 + }, + { + "epoch": 0.34907061704604764, + "learning_rate": 0.0001301878838973865, + "loss": 0.7529, + "mean_token_accuracy": 0.7725032269954681, + "num_tokens": 118338089.0, + "step": 34780 + }, + { + "epoch": 0.3491709823758481, + "learning_rate": 0.0001301678108314264, + "loss": 0.7505, + "mean_token_accuracy": 0.7774797141551971, + "num_tokens": 118371871.0, + "step": 34790 + }, + { + "epoch": 0.34927134770564855, + "learning_rate": 0.00013014773776546629, + "loss": 0.7407, + "mean_token_accuracy": 0.7733864784240723, + "num_tokens": 118406554.0, + "step": 34800 + }, + { + "epoch": 0.34937171303544906, + "learning_rate": 0.00013012766469950622, + "loss": 0.7157, + "mean_token_accuracy": 0.7768620789051056, + "num_tokens": 118440454.0, + "step": 34810 + }, + { + "epoch": 0.3494720783652495, + "learning_rate": 0.0001301075916335461, + "loss": 0.7451, + "mean_token_accuracy": 0.7789655983448028, + "num_tokens": 118473740.0, + "step": 34820 + }, + { + "epoch": 0.34957244369505, + "learning_rate": 0.000130087518567586, + "loss": 0.7277, + "mean_token_accuracy": 0.7804815113544464, + "num_tokens": 118507591.0, + "step": 34830 + }, + { + "epoch": 0.34967280902485043, + "learning_rate": 0.00013006744550162592, + "loss": 0.7067, + "mean_token_accuracy": 0.7835338473320007, + "num_tokens": 118542423.0, + "step": 34840 + }, + { + "epoch": 0.34977317435465094, + "learning_rate": 0.00013004737243566583, + "loss": 0.7683, + "mean_token_accuracy": 0.7751769661903382, + "num_tokens": 118576057.0, + "step": 34850 + }, + { + "epoch": 0.3498735396844514, + "learning_rate": 0.00013002729936970574, + "loss": 0.7503, + "mean_token_accuracy": 0.7780750274658204, + "num_tokens": 118610283.0, + "step": 34860 + }, + { + "epoch": 0.34997390501425185, + "learning_rate": 0.00013000722630374564, + "loss": 0.7419, + "mean_token_accuracy": 0.7775280714035034, + "num_tokens": 118645136.0, + "step": 34870 + }, + { + "epoch": 0.35007427034405236, + "learning_rate": 0.00012998715323778555, + "loss": 0.7446, + "mean_token_accuracy": 0.7766178011894226, + "num_tokens": 118679708.0, + "step": 34880 + }, + { + "epoch": 0.3501746356738528, + "learning_rate": 0.00012996708017182546, + "loss": 0.745, + "mean_token_accuracy": 0.7750972747802735, + "num_tokens": 118713556.0, + "step": 34890 + }, + { + "epoch": 0.3502750010036533, + "learning_rate": 0.00012994700710586537, + "loss": 0.7508, + "mean_token_accuracy": 0.7772462069988251, + "num_tokens": 118747915.0, + "step": 34900 + }, + { + "epoch": 0.3503753663334538, + "learning_rate": 0.00012992693403990525, + "loss": 0.7364, + "mean_token_accuracy": 0.7773713529109955, + "num_tokens": 118780943.0, + "step": 34910 + }, + { + "epoch": 0.35047573166325424, + "learning_rate": 0.0001299068609739452, + "loss": 0.7935, + "mean_token_accuracy": 0.7650506019592285, + "num_tokens": 118815612.0, + "step": 34920 + }, + { + "epoch": 0.3505760969930547, + "learning_rate": 0.00012988678790798507, + "loss": 0.7442, + "mean_token_accuracy": 0.7729040741920471, + "num_tokens": 118849356.0, + "step": 34930 + }, + { + "epoch": 0.3506764623228552, + "learning_rate": 0.00012986671484202498, + "loss": 0.7363, + "mean_token_accuracy": 0.7809243083000184, + "num_tokens": 118883002.0, + "step": 34940 + }, + { + "epoch": 0.35077682765265567, + "learning_rate": 0.00012984664177606488, + "loss": 0.7398, + "mean_token_accuracy": 0.7733363807201385, + "num_tokens": 118916859.0, + "step": 34950 + }, + { + "epoch": 0.3508771929824561, + "learning_rate": 0.0001298265687101048, + "loss": 0.7857, + "mean_token_accuracy": 0.7694664359092712, + "num_tokens": 118949953.0, + "step": 34960 + }, + { + "epoch": 0.35097755831225663, + "learning_rate": 0.00012980649564414467, + "loss": 0.7595, + "mean_token_accuracy": 0.7718825221061707, + "num_tokens": 118983543.0, + "step": 34970 + }, + { + "epoch": 0.3510779236420571, + "learning_rate": 0.0001297864225781846, + "loss": 0.7233, + "mean_token_accuracy": 0.7823235094547272, + "num_tokens": 119017302.0, + "step": 34980 + }, + { + "epoch": 0.35117828897185754, + "learning_rate": 0.00012976634951222452, + "loss": 0.7734, + "mean_token_accuracy": 0.766890674829483, + "num_tokens": 119051990.0, + "step": 34990 + }, + { + "epoch": 0.35127865430165806, + "learning_rate": 0.0001297462764462644, + "loss": 0.7555, + "mean_token_accuracy": 0.7784459352493286, + "num_tokens": 119086337.0, + "step": 35000 + }, + { + "epoch": 0.3513790196314585, + "learning_rate": 0.00012972620338030434, + "loss": 0.7317, + "mean_token_accuracy": 0.7820458710193634, + "num_tokens": 119120358.0, + "step": 35010 + }, + { + "epoch": 0.35147938496125897, + "learning_rate": 0.00012970613031434422, + "loss": 0.7464, + "mean_token_accuracy": 0.7753281235694885, + "num_tokens": 119154366.0, + "step": 35020 + }, + { + "epoch": 0.3515797502910595, + "learning_rate": 0.00012968605724838413, + "loss": 0.7549, + "mean_token_accuracy": 0.7730974972248077, + "num_tokens": 119189498.0, + "step": 35030 + }, + { + "epoch": 0.35168011562085993, + "learning_rate": 0.00012966598418242403, + "loss": 0.7693, + "mean_token_accuracy": 0.7727134704589844, + "num_tokens": 119223230.0, + "step": 35040 + }, + { + "epoch": 0.3517804809506604, + "learning_rate": 0.00012964591111646394, + "loss": 0.7698, + "mean_token_accuracy": 0.7701881527900696, + "num_tokens": 119256910.0, + "step": 35050 + }, + { + "epoch": 0.3518808462804609, + "learning_rate": 0.00012962583805050382, + "loss": 0.7486, + "mean_token_accuracy": 0.7781509280204773, + "num_tokens": 119290293.0, + "step": 35060 + }, + { + "epoch": 0.35198121161026136, + "learning_rate": 0.00012960576498454376, + "loss": 0.7561, + "mean_token_accuracy": 0.772142744064331, + "num_tokens": 119323527.0, + "step": 35070 + }, + { + "epoch": 0.3520815769400618, + "learning_rate": 0.00012958569191858364, + "loss": 0.7348, + "mean_token_accuracy": 0.776472669839859, + "num_tokens": 119357956.0, + "step": 35080 + }, + { + "epoch": 0.3521819422698623, + "learning_rate": 0.00012956561885262355, + "loss": 0.7893, + "mean_token_accuracy": 0.7657097697257995, + "num_tokens": 119391878.0, + "step": 35090 + }, + { + "epoch": 0.3522823075996628, + "learning_rate": 0.00012954554578666346, + "loss": 0.7827, + "mean_token_accuracy": 0.7680422246456147, + "num_tokens": 119425021.0, + "step": 35100 + }, + { + "epoch": 0.35238267292946324, + "learning_rate": 0.00012952547272070337, + "loss": 0.7347, + "mean_token_accuracy": 0.7755476057529449, + "num_tokens": 119458978.0, + "step": 35110 + }, + { + "epoch": 0.3524830382592637, + "learning_rate": 0.00012950539965474327, + "loss": 0.7541, + "mean_token_accuracy": 0.7770498335361481, + "num_tokens": 119492774.0, + "step": 35120 + }, + { + "epoch": 0.3525834035890642, + "learning_rate": 0.00012948532658878318, + "loss": 0.7626, + "mean_token_accuracy": 0.7735799431800843, + "num_tokens": 119526989.0, + "step": 35130 + }, + { + "epoch": 0.35268376891886466, + "learning_rate": 0.0001294652535228231, + "loss": 0.7584, + "mean_token_accuracy": 0.7750583529472351, + "num_tokens": 119560782.0, + "step": 35140 + }, + { + "epoch": 0.3527841342486651, + "learning_rate": 0.00012944518045686297, + "loss": 0.7641, + "mean_token_accuracy": 0.7715739667415619, + "num_tokens": 119594978.0, + "step": 35150 + }, + { + "epoch": 0.3528844995784656, + "learning_rate": 0.0001294251073909029, + "loss": 0.7301, + "mean_token_accuracy": 0.7819527506828308, + "num_tokens": 119629725.0, + "step": 35160 + }, + { + "epoch": 0.3529848649082661, + "learning_rate": 0.0001294050343249428, + "loss": 0.7613, + "mean_token_accuracy": 0.7737753927707672, + "num_tokens": 119662809.0, + "step": 35170 + }, + { + "epoch": 0.35308523023806654, + "learning_rate": 0.0001293849612589827, + "loss": 0.7381, + "mean_token_accuracy": 0.7770018994808197, + "num_tokens": 119696635.0, + "step": 35180 + }, + { + "epoch": 0.35318559556786705, + "learning_rate": 0.0001293648881930226, + "loss": 0.755, + "mean_token_accuracy": 0.7756446003913879, + "num_tokens": 119730825.0, + "step": 35190 + }, + { + "epoch": 0.3532859608976675, + "learning_rate": 0.00012934481512706251, + "loss": 0.7447, + "mean_token_accuracy": 0.7755038917064667, + "num_tokens": 119765070.0, + "step": 35200 + }, + { + "epoch": 0.35338632622746796, + "learning_rate": 0.00012932474206110242, + "loss": 0.7723, + "mean_token_accuracy": 0.7713152647018433, + "num_tokens": 119799584.0, + "step": 35210 + }, + { + "epoch": 0.3534866915572685, + "learning_rate": 0.00012930466899514233, + "loss": 0.7663, + "mean_token_accuracy": 0.7718316853046417, + "num_tokens": 119833470.0, + "step": 35220 + }, + { + "epoch": 0.35358705688706893, + "learning_rate": 0.00012928459592918224, + "loss": 0.814, + "mean_token_accuracy": 0.7650098145008087, + "num_tokens": 119867558.0, + "step": 35230 + }, + { + "epoch": 0.3536874222168694, + "learning_rate": 0.00012926452286322212, + "loss": 0.7499, + "mean_token_accuracy": 0.7746418297290802, + "num_tokens": 119900867.0, + "step": 35240 + }, + { + "epoch": 0.3537877875466699, + "learning_rate": 0.00012924444979726206, + "loss": 0.7478, + "mean_token_accuracy": 0.7810865759849548, + "num_tokens": 119935275.0, + "step": 35250 + }, + { + "epoch": 0.35388815287647035, + "learning_rate": 0.00012922437673130194, + "loss": 0.7718, + "mean_token_accuracy": 0.7729858040809632, + "num_tokens": 119969548.0, + "step": 35260 + }, + { + "epoch": 0.3539885182062708, + "learning_rate": 0.00012920430366534185, + "loss": 0.7677, + "mean_token_accuracy": 0.7698695123195648, + "num_tokens": 120003401.0, + "step": 35270 + }, + { + "epoch": 0.3540888835360713, + "learning_rate": 0.00012918423059938175, + "loss": 0.7609, + "mean_token_accuracy": 0.7710729897022247, + "num_tokens": 120038126.0, + "step": 35280 + }, + { + "epoch": 0.3541892488658718, + "learning_rate": 0.00012916415753342166, + "loss": 0.74, + "mean_token_accuracy": 0.7778858602046966, + "num_tokens": 120072359.0, + "step": 35290 + }, + { + "epoch": 0.35428961419567223, + "learning_rate": 0.00012914408446746154, + "loss": 0.7641, + "mean_token_accuracy": 0.7736245393753052, + "num_tokens": 120106331.0, + "step": 35300 + }, + { + "epoch": 0.35438997952547274, + "learning_rate": 0.00012912401140150148, + "loss": 0.7479, + "mean_token_accuracy": 0.7788862705230712, + "num_tokens": 120140422.0, + "step": 35310 + }, + { + "epoch": 0.3544903448552732, + "learning_rate": 0.00012910393833554136, + "loss": 0.7651, + "mean_token_accuracy": 0.7646833181381225, + "num_tokens": 120173897.0, + "step": 35320 + }, + { + "epoch": 0.35459071018507365, + "learning_rate": 0.00012908386526958127, + "loss": 0.7614, + "mean_token_accuracy": 0.7729146480560303, + "num_tokens": 120207831.0, + "step": 35330 + }, + { + "epoch": 0.35469107551487417, + "learning_rate": 0.0001290637922036212, + "loss": 0.7664, + "mean_token_accuracy": 0.7723476946353912, + "num_tokens": 120241925.0, + "step": 35340 + }, + { + "epoch": 0.3547914408446746, + "learning_rate": 0.0001290437191376611, + "loss": 0.7642, + "mean_token_accuracy": 0.772037923336029, + "num_tokens": 120277005.0, + "step": 35350 + }, + { + "epoch": 0.3548918061744751, + "learning_rate": 0.000129023646071701, + "loss": 0.7597, + "mean_token_accuracy": 0.7775270521640778, + "num_tokens": 120310403.0, + "step": 35360 + }, + { + "epoch": 0.3549921715042756, + "learning_rate": 0.0001290035730057409, + "loss": 0.7591, + "mean_token_accuracy": 0.7727593421936035, + "num_tokens": 120344465.0, + "step": 35370 + }, + { + "epoch": 0.35509253683407604, + "learning_rate": 0.0001289834999397808, + "loss": 0.7851, + "mean_token_accuracy": 0.767771178483963, + "num_tokens": 120377939.0, + "step": 35380 + }, + { + "epoch": 0.3551929021638765, + "learning_rate": 0.0001289634268738207, + "loss": 0.7451, + "mean_token_accuracy": 0.7773448050022125, + "num_tokens": 120411248.0, + "step": 35390 + }, + { + "epoch": 0.355293267493677, + "learning_rate": 0.00012894335380786063, + "loss": 0.7235, + "mean_token_accuracy": 0.7817453920841217, + "num_tokens": 120443872.0, + "step": 35400 + }, + { + "epoch": 0.35539363282347747, + "learning_rate": 0.0001289232807419005, + "loss": 0.7481, + "mean_token_accuracy": 0.7752549231052399, + "num_tokens": 120477526.0, + "step": 35410 + }, + { + "epoch": 0.3554939981532779, + "learning_rate": 0.00012890320767594042, + "loss": 0.7439, + "mean_token_accuracy": 0.7809197425842285, + "num_tokens": 120511817.0, + "step": 35420 + }, + { + "epoch": 0.3555943634830784, + "learning_rate": 0.00012888313460998033, + "loss": 0.743, + "mean_token_accuracy": 0.7750954687595367, + "num_tokens": 120545772.0, + "step": 35430 + }, + { + "epoch": 0.3556947288128789, + "learning_rate": 0.00012886306154402024, + "loss": 0.7735, + "mean_token_accuracy": 0.769282442331314, + "num_tokens": 120579574.0, + "step": 35440 + }, + { + "epoch": 0.35579509414267935, + "learning_rate": 0.00012884298847806014, + "loss": 0.7494, + "mean_token_accuracy": 0.7742872178554535, + "num_tokens": 120613386.0, + "step": 35450 + }, + { + "epoch": 0.3558954594724798, + "learning_rate": 0.00012882291541210005, + "loss": 0.7359, + "mean_token_accuracy": 0.7799999475479126, + "num_tokens": 120647508.0, + "step": 35460 + }, + { + "epoch": 0.3559958248022803, + "learning_rate": 0.00012880284234613996, + "loss": 0.7635, + "mean_token_accuracy": 0.7773070394992828, + "num_tokens": 120680975.0, + "step": 35470 + }, + { + "epoch": 0.35609619013208077, + "learning_rate": 0.00012878276928017987, + "loss": 0.7352, + "mean_token_accuracy": 0.7768107950687408, + "num_tokens": 120714574.0, + "step": 35480 + }, + { + "epoch": 0.3561965554618812, + "learning_rate": 0.00012876269621421978, + "loss": 0.7722, + "mean_token_accuracy": 0.7694811820983887, + "num_tokens": 120748991.0, + "step": 35490 + }, + { + "epoch": 0.35629692079168174, + "learning_rate": 0.00012874262314825966, + "loss": 0.7676, + "mean_token_accuracy": 0.7733526527881622, + "num_tokens": 120782737.0, + "step": 35500 + }, + { + "epoch": 0.3563972861214822, + "learning_rate": 0.0001287225500822996, + "loss": 0.7621, + "mean_token_accuracy": 0.7753716170787811, + "num_tokens": 120817244.0, + "step": 35510 + }, + { + "epoch": 0.35649765145128265, + "learning_rate": 0.00012870247701633948, + "loss": 0.7179, + "mean_token_accuracy": 0.7856552004814148, + "num_tokens": 120850616.0, + "step": 35520 + }, + { + "epoch": 0.35659801678108316, + "learning_rate": 0.00012868240395037938, + "loss": 0.7295, + "mean_token_accuracy": 0.7802593469619751, + "num_tokens": 120884428.0, + "step": 35530 + }, + { + "epoch": 0.3566983821108836, + "learning_rate": 0.0001286623308844193, + "loss": 0.7472, + "mean_token_accuracy": 0.7753828525543213, + "num_tokens": 120918222.0, + "step": 35540 + }, + { + "epoch": 0.35679874744068407, + "learning_rate": 0.0001286422578184592, + "loss": 0.763, + "mean_token_accuracy": 0.7744974434375763, + "num_tokens": 120952602.0, + "step": 35550 + }, + { + "epoch": 0.3568991127704846, + "learning_rate": 0.0001286221847524991, + "loss": 0.7488, + "mean_token_accuracy": 0.7765093147754669, + "num_tokens": 120985794.0, + "step": 35560 + }, + { + "epoch": 0.35699947810028504, + "learning_rate": 0.00012860211168653902, + "loss": 0.7375, + "mean_token_accuracy": 0.7780269742012024, + "num_tokens": 121020158.0, + "step": 35570 + }, + { + "epoch": 0.3570998434300855, + "learning_rate": 0.00012858203862057893, + "loss": 0.7628, + "mean_token_accuracy": 0.770986270904541, + "num_tokens": 121054426.0, + "step": 35580 + }, + { + "epoch": 0.357200208759886, + "learning_rate": 0.0001285619655546188, + "loss": 0.7816, + "mean_token_accuracy": 0.7665948092937469, + "num_tokens": 121087924.0, + "step": 35590 + }, + { + "epoch": 0.35730057408968646, + "learning_rate": 0.00012854189248865874, + "loss": 0.782, + "mean_token_accuracy": 0.7741276800632477, + "num_tokens": 121121311.0, + "step": 35600 + }, + { + "epoch": 0.3574009394194869, + "learning_rate": 0.00012852181942269862, + "loss": 0.7546, + "mean_token_accuracy": 0.7732280850410461, + "num_tokens": 121155020.0, + "step": 35610 + }, + { + "epoch": 0.35750130474928743, + "learning_rate": 0.00012850174635673853, + "loss": 0.7487, + "mean_token_accuracy": 0.7780355155467987, + "num_tokens": 121189723.0, + "step": 35620 + }, + { + "epoch": 0.3576016700790879, + "learning_rate": 0.00012848167329077844, + "loss": 0.7381, + "mean_token_accuracy": 0.774751079082489, + "num_tokens": 121223810.0, + "step": 35630 + }, + { + "epoch": 0.35770203540888834, + "learning_rate": 0.00012846160022481835, + "loss": 0.7667, + "mean_token_accuracy": 0.7648861527442932, + "num_tokens": 121258285.0, + "step": 35640 + }, + { + "epoch": 0.35780240073868885, + "learning_rate": 0.00012844152715885823, + "loss": 0.7414, + "mean_token_accuracy": 0.782308691740036, + "num_tokens": 121292731.0, + "step": 35650 + }, + { + "epoch": 0.3579027660684893, + "learning_rate": 0.00012842145409289817, + "loss": 0.7618, + "mean_token_accuracy": 0.7717048048973083, + "num_tokens": 121326456.0, + "step": 35660 + }, + { + "epoch": 0.35800313139828976, + "learning_rate": 0.00012840138102693805, + "loss": 0.7591, + "mean_token_accuracy": 0.771227502822876, + "num_tokens": 121361074.0, + "step": 35670 + }, + { + "epoch": 0.3581034967280903, + "learning_rate": 0.00012838130796097796, + "loss": 0.7428, + "mean_token_accuracy": 0.7824000954627991, + "num_tokens": 121394728.0, + "step": 35680 + }, + { + "epoch": 0.35820386205789073, + "learning_rate": 0.0001283612348950179, + "loss": 0.7315, + "mean_token_accuracy": 0.7799839854240418, + "num_tokens": 121429478.0, + "step": 35690 + }, + { + "epoch": 0.3583042273876912, + "learning_rate": 0.00012834116182905777, + "loss": 0.7511, + "mean_token_accuracy": 0.7744730293750763, + "num_tokens": 121462687.0, + "step": 35700 + }, + { + "epoch": 0.35840459271749164, + "learning_rate": 0.00012832108876309768, + "loss": 0.7324, + "mean_token_accuracy": 0.783033686876297, + "num_tokens": 121496030.0, + "step": 35710 + }, + { + "epoch": 0.35850495804729215, + "learning_rate": 0.0001283010156971376, + "loss": 0.8035, + "mean_token_accuracy": 0.7618011116981507, + "num_tokens": 121530474.0, + "step": 35720 + }, + { + "epoch": 0.3586053233770926, + "learning_rate": 0.0001282809426311775, + "loss": 0.7541, + "mean_token_accuracy": 0.7772661507129669, + "num_tokens": 121564440.0, + "step": 35730 + }, + { + "epoch": 0.35870568870689307, + "learning_rate": 0.00012826086956521738, + "loss": 0.737, + "mean_token_accuracy": 0.7823009550571441, + "num_tokens": 121597786.0, + "step": 35740 + }, + { + "epoch": 0.3588060540366936, + "learning_rate": 0.00012824079649925732, + "loss": 0.7905, + "mean_token_accuracy": 0.7676131546497345, + "num_tokens": 121632887.0, + "step": 35750 + }, + { + "epoch": 0.35890641936649403, + "learning_rate": 0.0001282207234332972, + "loss": 0.75, + "mean_token_accuracy": 0.7723377823829651, + "num_tokens": 121667257.0, + "step": 35760 + }, + { + "epoch": 0.3590067846962945, + "learning_rate": 0.0001282006503673371, + "loss": 0.7635, + "mean_token_accuracy": 0.7732644557952881, + "num_tokens": 121701581.0, + "step": 35770 + }, + { + "epoch": 0.359107150026095, + "learning_rate": 0.00012818057730137701, + "loss": 0.7566, + "mean_token_accuracy": 0.7727309167385101, + "num_tokens": 121735125.0, + "step": 35780 + }, + { + "epoch": 0.35920751535589546, + "learning_rate": 0.00012816050423541692, + "loss": 0.7271, + "mean_token_accuracy": 0.7802690982818603, + "num_tokens": 121768958.0, + "step": 35790 + }, + { + "epoch": 0.3593078806856959, + "learning_rate": 0.00012814043116945683, + "loss": 0.7563, + "mean_token_accuracy": 0.7734170138835907, + "num_tokens": 121802223.0, + "step": 35800 + }, + { + "epoch": 0.3594082460154964, + "learning_rate": 0.00012812035810349674, + "loss": 0.7542, + "mean_token_accuracy": 0.7750784277915954, + "num_tokens": 121836128.0, + "step": 35810 + }, + { + "epoch": 0.3595086113452969, + "learning_rate": 0.00012810028503753665, + "loss": 0.7525, + "mean_token_accuracy": 0.7743003606796265, + "num_tokens": 121870033.0, + "step": 35820 + }, + { + "epoch": 0.35960897667509734, + "learning_rate": 0.00012808021197157653, + "loss": 0.7568, + "mean_token_accuracy": 0.775709331035614, + "num_tokens": 121904555.0, + "step": 35830 + }, + { + "epoch": 0.35970934200489785, + "learning_rate": 0.00012806013890561646, + "loss": 0.7643, + "mean_token_accuracy": 0.7707355499267579, + "num_tokens": 121938328.0, + "step": 35840 + }, + { + "epoch": 0.3598097073346983, + "learning_rate": 0.00012804006583965635, + "loss": 0.7381, + "mean_token_accuracy": 0.7774211645126343, + "num_tokens": 121973012.0, + "step": 35850 + }, + { + "epoch": 0.35991007266449876, + "learning_rate": 0.00012801999277369625, + "loss": 0.7592, + "mean_token_accuracy": 0.7730853080749511, + "num_tokens": 122007119.0, + "step": 35860 + }, + { + "epoch": 0.36001043799429927, + "learning_rate": 0.00012799991970773616, + "loss": 0.7423, + "mean_token_accuracy": 0.7800334930419922, + "num_tokens": 122040525.0, + "step": 35870 + }, + { + "epoch": 0.3601108033240997, + "learning_rate": 0.00012797984664177607, + "loss": 0.747, + "mean_token_accuracy": 0.7766052901744842, + "num_tokens": 122075351.0, + "step": 35880 + }, + { + "epoch": 0.3602111686539002, + "learning_rate": 0.00012795977357581598, + "loss": 0.7497, + "mean_token_accuracy": 0.7744327545166015, + "num_tokens": 122109400.0, + "step": 35890 + }, + { + "epoch": 0.3603115339837007, + "learning_rate": 0.0001279397005098559, + "loss": 0.7569, + "mean_token_accuracy": 0.773150897026062, + "num_tokens": 122143863.0, + "step": 35900 + }, + { + "epoch": 0.36041189931350115, + "learning_rate": 0.0001279196274438958, + "loss": 0.7214, + "mean_token_accuracy": 0.7819910287857056, + "num_tokens": 122176909.0, + "step": 35910 + }, + { + "epoch": 0.3605122646433016, + "learning_rate": 0.00012789955437793568, + "loss": 0.721, + "mean_token_accuracy": 0.7813787996768952, + "num_tokens": 122210184.0, + "step": 35920 + }, + { + "epoch": 0.3606126299731021, + "learning_rate": 0.0001278794813119756, + "loss": 0.7653, + "mean_token_accuracy": 0.7672504305839538, + "num_tokens": 122244535.0, + "step": 35930 + }, + { + "epoch": 0.3607129953029026, + "learning_rate": 0.0001278594082460155, + "loss": 0.7697, + "mean_token_accuracy": 0.7666830718517303, + "num_tokens": 122278573.0, + "step": 35940 + }, + { + "epoch": 0.36081336063270303, + "learning_rate": 0.0001278393351800554, + "loss": 0.7392, + "mean_token_accuracy": 0.7782879769802094, + "num_tokens": 122312826.0, + "step": 35950 + }, + { + "epoch": 0.36091372596250354, + "learning_rate": 0.0001278192621140953, + "loss": 0.7702, + "mean_token_accuracy": 0.7697879791259765, + "num_tokens": 122347337.0, + "step": 35960 + }, + { + "epoch": 0.361014091292304, + "learning_rate": 0.00012779918904813522, + "loss": 0.7556, + "mean_token_accuracy": 0.7757453262805939, + "num_tokens": 122380709.0, + "step": 35970 + }, + { + "epoch": 0.36111445662210445, + "learning_rate": 0.0001277791159821751, + "loss": 0.7042, + "mean_token_accuracy": 0.7824141263961792, + "num_tokens": 122415641.0, + "step": 35980 + }, + { + "epoch": 0.3612148219519049, + "learning_rate": 0.00012775904291621504, + "loss": 0.7718, + "mean_token_accuracy": 0.7685666620731354, + "num_tokens": 122449788.0, + "step": 35990 + }, + { + "epoch": 0.3613151872817054, + "learning_rate": 0.00012773896985025492, + "loss": 0.7704, + "mean_token_accuracy": 0.7693254113197326, + "num_tokens": 122484571.0, + "step": 36000 + }, + { + "epoch": 0.3614155526115059, + "learning_rate": 0.00012771889678429485, + "loss": 0.7638, + "mean_token_accuracy": 0.7732280671596528, + "num_tokens": 122518313.0, + "step": 36010 + }, + { + "epoch": 0.36151591794130633, + "learning_rate": 0.00012769882371833473, + "loss": 0.7635, + "mean_token_accuracy": 0.7754628539085389, + "num_tokens": 122552576.0, + "step": 36020 + }, + { + "epoch": 0.36161628327110684, + "learning_rate": 0.00012767875065237464, + "loss": 0.7739, + "mean_token_accuracy": 0.7710064649581909, + "num_tokens": 122586626.0, + "step": 36030 + }, + { + "epoch": 0.3617166486009073, + "learning_rate": 0.00012765867758641458, + "loss": 0.7791, + "mean_token_accuracy": 0.7669225811958313, + "num_tokens": 122620849.0, + "step": 36040 + }, + { + "epoch": 0.36181701393070775, + "learning_rate": 0.00012763860452045446, + "loss": 0.78, + "mean_token_accuracy": 0.7726854979991913, + "num_tokens": 122654206.0, + "step": 36050 + }, + { + "epoch": 0.36191737926050827, + "learning_rate": 0.00012761853145449437, + "loss": 0.7336, + "mean_token_accuracy": 0.7790078163146973, + "num_tokens": 122688152.0, + "step": 36060 + }, + { + "epoch": 0.3620177445903087, + "learning_rate": 0.00012759845838853428, + "loss": 0.7666, + "mean_token_accuracy": 0.7728044927120209, + "num_tokens": 122721656.0, + "step": 36070 + }, + { + "epoch": 0.3621181099201092, + "learning_rate": 0.00012757838532257419, + "loss": 0.7433, + "mean_token_accuracy": 0.7780297935009003, + "num_tokens": 122755914.0, + "step": 36080 + }, + { + "epoch": 0.3622184752499097, + "learning_rate": 0.00012755831225661407, + "loss": 0.7392, + "mean_token_accuracy": 0.7752133071422577, + "num_tokens": 122790201.0, + "step": 36090 + }, + { + "epoch": 0.36231884057971014, + "learning_rate": 0.000127538239190654, + "loss": 0.7132, + "mean_token_accuracy": 0.7838562309741974, + "num_tokens": 122824911.0, + "step": 36100 + }, + { + "epoch": 0.3624192059095106, + "learning_rate": 0.00012751816612469388, + "loss": 0.7333, + "mean_token_accuracy": 0.7770668208599091, + "num_tokens": 122858503.0, + "step": 36110 + }, + { + "epoch": 0.3625195712393111, + "learning_rate": 0.0001274980930587338, + "loss": 0.7346, + "mean_token_accuracy": 0.7744692265987396, + "num_tokens": 122892736.0, + "step": 36120 + }, + { + "epoch": 0.36261993656911157, + "learning_rate": 0.0001274780199927737, + "loss": 0.786, + "mean_token_accuracy": 0.7676080942153931, + "num_tokens": 122926498.0, + "step": 36130 + }, + { + "epoch": 0.362720301898912, + "learning_rate": 0.0001274579469268136, + "loss": 0.7725, + "mean_token_accuracy": 0.7723757565021515, + "num_tokens": 122960969.0, + "step": 36140 + }, + { + "epoch": 0.36282066722871253, + "learning_rate": 0.00012743787386085352, + "loss": 0.7768, + "mean_token_accuracy": 0.7706885755062103, + "num_tokens": 122994995.0, + "step": 36150 + }, + { + "epoch": 0.362921032558513, + "learning_rate": 0.00012741780079489343, + "loss": 0.775, + "mean_token_accuracy": 0.7717813134193421, + "num_tokens": 123028786.0, + "step": 36160 + }, + { + "epoch": 0.36302139788831345, + "learning_rate": 0.00012739772772893333, + "loss": 0.74, + "mean_token_accuracy": 0.7784698903560638, + "num_tokens": 123063918.0, + "step": 36170 + }, + { + "epoch": 0.36312176321811396, + "learning_rate": 0.00012737765466297322, + "loss": 0.7527, + "mean_token_accuracy": 0.7742575347423554, + "num_tokens": 123097707.0, + "step": 36180 + }, + { + "epoch": 0.3632221285479144, + "learning_rate": 0.00012735758159701315, + "loss": 0.7498, + "mean_token_accuracy": 0.7733630478382111, + "num_tokens": 123132416.0, + "step": 36190 + }, + { + "epoch": 0.36332249387771487, + "learning_rate": 0.00012733750853105303, + "loss": 0.7559, + "mean_token_accuracy": 0.7720991015434265, + "num_tokens": 123165899.0, + "step": 36200 + }, + { + "epoch": 0.3634228592075154, + "learning_rate": 0.00012731743546509294, + "loss": 0.7876, + "mean_token_accuracy": 0.7656482338905335, + "num_tokens": 123199786.0, + "step": 36210 + }, + { + "epoch": 0.36352322453731584, + "learning_rate": 0.00012729736239913285, + "loss": 0.7835, + "mean_token_accuracy": 0.7608466207981109, + "num_tokens": 123233311.0, + "step": 36220 + }, + { + "epoch": 0.3636235898671163, + "learning_rate": 0.00012727728933317276, + "loss": 0.7825, + "mean_token_accuracy": 0.7665168404579162, + "num_tokens": 123267317.0, + "step": 36230 + }, + { + "epoch": 0.3637239551969168, + "learning_rate": 0.00012725721626721267, + "loss": 0.7422, + "mean_token_accuracy": 0.775238174200058, + "num_tokens": 123301977.0, + "step": 36240 + }, + { + "epoch": 0.36382432052671726, + "learning_rate": 0.00012723714320125257, + "loss": 0.7442, + "mean_token_accuracy": 0.7765831291675568, + "num_tokens": 123335894.0, + "step": 36250 + }, + { + "epoch": 0.3639246858565177, + "learning_rate": 0.00012721707013529248, + "loss": 0.7848, + "mean_token_accuracy": 0.7693867802619934, + "num_tokens": 123369608.0, + "step": 36260 + }, + { + "epoch": 0.36402505118631817, + "learning_rate": 0.00012719699706933236, + "loss": 0.7299, + "mean_token_accuracy": 0.7803408145904541, + "num_tokens": 123404677.0, + "step": 36270 + }, + { + "epoch": 0.3641254165161187, + "learning_rate": 0.0001271769240033723, + "loss": 0.7166, + "mean_token_accuracy": 0.786678260564804, + "num_tokens": 123439082.0, + "step": 36280 + }, + { + "epoch": 0.36422578184591914, + "learning_rate": 0.00012715685093741218, + "loss": 0.7497, + "mean_token_accuracy": 0.7783904135227203, + "num_tokens": 123473545.0, + "step": 36290 + }, + { + "epoch": 0.3643261471757196, + "learning_rate": 0.0001271367778714521, + "loss": 0.7603, + "mean_token_accuracy": 0.773338520526886, + "num_tokens": 123507677.0, + "step": 36300 + }, + { + "epoch": 0.3644265125055201, + "learning_rate": 0.000127116704805492, + "loss": 0.7527, + "mean_token_accuracy": 0.7701963305473327, + "num_tokens": 123541560.0, + "step": 36310 + }, + { + "epoch": 0.36452687783532056, + "learning_rate": 0.0001270966317395319, + "loss": 0.7538, + "mean_token_accuracy": 0.7746260046958924, + "num_tokens": 123574876.0, + "step": 36320 + }, + { + "epoch": 0.364627243165121, + "learning_rate": 0.0001270765586735718, + "loss": 0.7334, + "mean_token_accuracy": 0.7801806092262268, + "num_tokens": 123608802.0, + "step": 36330 + }, + { + "epoch": 0.36472760849492153, + "learning_rate": 0.00012705648560761172, + "loss": 0.7684, + "mean_token_accuracy": 0.7709551453590393, + "num_tokens": 123641850.0, + "step": 36340 + }, + { + "epoch": 0.364827973824722, + "learning_rate": 0.0001270364125416516, + "loss": 0.7155, + "mean_token_accuracy": 0.785818237066269, + "num_tokens": 123676054.0, + "step": 36350 + }, + { + "epoch": 0.36492833915452244, + "learning_rate": 0.0001270163394756915, + "loss": 0.7449, + "mean_token_accuracy": 0.7793585658073425, + "num_tokens": 123710310.0, + "step": 36360 + }, + { + "epoch": 0.36502870448432295, + "learning_rate": 0.00012699626640973142, + "loss": 0.7147, + "mean_token_accuracy": 0.7818877160549164, + "num_tokens": 123744525.0, + "step": 36370 + }, + { + "epoch": 0.3651290698141234, + "learning_rate": 0.00012697619334377133, + "loss": 0.7472, + "mean_token_accuracy": 0.7787317574024201, + "num_tokens": 123779054.0, + "step": 36380 + }, + { + "epoch": 0.36522943514392386, + "learning_rate": 0.00012695612027781124, + "loss": 0.7748, + "mean_token_accuracy": 0.7739263355731965, + "num_tokens": 123813024.0, + "step": 36390 + }, + { + "epoch": 0.3653298004737244, + "learning_rate": 0.00012693604721185115, + "loss": 0.7489, + "mean_token_accuracy": 0.7733473181724548, + "num_tokens": 123846524.0, + "step": 36400 + }, + { + "epoch": 0.36543016580352483, + "learning_rate": 0.00012691597414589106, + "loss": 0.7646, + "mean_token_accuracy": 0.7685162484645843, + "num_tokens": 123879497.0, + "step": 36410 + }, + { + "epoch": 0.3655305311333253, + "learning_rate": 0.00012689590107993094, + "loss": 0.7519, + "mean_token_accuracy": 0.775278776884079, + "num_tokens": 123913015.0, + "step": 36420 + }, + { + "epoch": 0.3656308964631258, + "learning_rate": 0.00012687582801397087, + "loss": 0.7495, + "mean_token_accuracy": 0.7701024949550629, + "num_tokens": 123946886.0, + "step": 36430 + }, + { + "epoch": 0.36573126179292625, + "learning_rate": 0.00012685575494801075, + "loss": 0.7326, + "mean_token_accuracy": 0.7799596846103668, + "num_tokens": 123981595.0, + "step": 36440 + }, + { + "epoch": 0.3658316271227267, + "learning_rate": 0.00012683568188205066, + "loss": 0.7393, + "mean_token_accuracy": 0.7762674391269684, + "num_tokens": 124015129.0, + "step": 36450 + }, + { + "epoch": 0.3659319924525272, + "learning_rate": 0.00012681560881609057, + "loss": 0.7475, + "mean_token_accuracy": 0.776815903186798, + "num_tokens": 124049488.0, + "step": 36460 + }, + { + "epoch": 0.3660323577823277, + "learning_rate": 0.00012679553575013048, + "loss": 0.731, + "mean_token_accuracy": 0.7786135077476501, + "num_tokens": 124084321.0, + "step": 36470 + }, + { + "epoch": 0.36613272311212813, + "learning_rate": 0.0001267754626841704, + "loss": 0.7527, + "mean_token_accuracy": 0.7756665587425232, + "num_tokens": 124118416.0, + "step": 36480 + }, + { + "epoch": 0.36623308844192864, + "learning_rate": 0.0001267553896182103, + "loss": 0.7595, + "mean_token_accuracy": 0.7719801664352417, + "num_tokens": 124152553.0, + "step": 36490 + }, + { + "epoch": 0.3663334537717291, + "learning_rate": 0.0001267353165522502, + "loss": 0.7468, + "mean_token_accuracy": 0.7742100894451142, + "num_tokens": 124186663.0, + "step": 36500 + }, + { + "epoch": 0.36643381910152956, + "learning_rate": 0.00012671524348629009, + "loss": 0.7253, + "mean_token_accuracy": 0.7852876901626586, + "num_tokens": 124220256.0, + "step": 36510 + }, + { + "epoch": 0.36653418443133007, + "learning_rate": 0.00012669517042033002, + "loss": 0.7769, + "mean_token_accuracy": 0.7759455144405365, + "num_tokens": 124253958.0, + "step": 36520 + }, + { + "epoch": 0.3666345497611305, + "learning_rate": 0.0001266750973543699, + "loss": 0.7643, + "mean_token_accuracy": 0.7705866992473602, + "num_tokens": 124288559.0, + "step": 36530 + }, + { + "epoch": 0.366734915090931, + "learning_rate": 0.0001266550242884098, + "loss": 0.7348, + "mean_token_accuracy": 0.7789439380168914, + "num_tokens": 124322607.0, + "step": 36540 + }, + { + "epoch": 0.36683528042073144, + "learning_rate": 0.00012663495122244972, + "loss": 0.7399, + "mean_token_accuracy": 0.7821188330650329, + "num_tokens": 124356366.0, + "step": 36550 + }, + { + "epoch": 0.36693564575053195, + "learning_rate": 0.00012661487815648963, + "loss": 0.7654, + "mean_token_accuracy": 0.7741107821464539, + "num_tokens": 124390334.0, + "step": 36560 + }, + { + "epoch": 0.3670360110803324, + "learning_rate": 0.00012659480509052954, + "loss": 0.779, + "mean_token_accuracy": 0.7723045289516449, + "num_tokens": 124423962.0, + "step": 36570 + }, + { + "epoch": 0.36713637641013286, + "learning_rate": 0.00012657473202456944, + "loss": 0.7574, + "mean_token_accuracy": 0.7718424618244171, + "num_tokens": 124458136.0, + "step": 36580 + }, + { + "epoch": 0.36723674173993337, + "learning_rate": 0.00012655465895860935, + "loss": 0.7597, + "mean_token_accuracy": 0.7768797993659973, + "num_tokens": 124492658.0, + "step": 36590 + }, + { + "epoch": 0.3673371070697338, + "learning_rate": 0.00012653458589264926, + "loss": 0.7618, + "mean_token_accuracy": 0.7682752072811126, + "num_tokens": 124526025.0, + "step": 36600 + }, + { + "epoch": 0.3674374723995343, + "learning_rate": 0.00012651451282668917, + "loss": 0.7153, + "mean_token_accuracy": 0.7839506208896637, + "num_tokens": 124559705.0, + "step": 36610 + }, + { + "epoch": 0.3675378377293348, + "learning_rate": 0.00012649443976072905, + "loss": 0.7798, + "mean_token_accuracy": 0.7706827342510223, + "num_tokens": 124593705.0, + "step": 36620 + }, + { + "epoch": 0.36763820305913525, + "learning_rate": 0.000126474366694769, + "loss": 0.79, + "mean_token_accuracy": 0.7627219080924987, + "num_tokens": 124627356.0, + "step": 36630 + }, + { + "epoch": 0.3677385683889357, + "learning_rate": 0.00012645429362880887, + "loss": 0.7672, + "mean_token_accuracy": 0.7729246199131012, + "num_tokens": 124661844.0, + "step": 36640 + }, + { + "epoch": 0.3678389337187362, + "learning_rate": 0.00012643422056284878, + "loss": 0.742, + "mean_token_accuracy": 0.7788021087646484, + "num_tokens": 124695749.0, + "step": 36650 + }, + { + "epoch": 0.36793929904853667, + "learning_rate": 0.00012641414749688869, + "loss": 0.786, + "mean_token_accuracy": 0.7673965930938721, + "num_tokens": 124730002.0, + "step": 36660 + }, + { + "epoch": 0.36803966437833713, + "learning_rate": 0.0001263940744309286, + "loss": 0.7331, + "mean_token_accuracy": 0.7784696877002716, + "num_tokens": 124764025.0, + "step": 36670 + }, + { + "epoch": 0.36814002970813764, + "learning_rate": 0.00012637400136496847, + "loss": 0.772, + "mean_token_accuracy": 0.7756337761878968, + "num_tokens": 124797840.0, + "step": 36680 + }, + { + "epoch": 0.3682403950379381, + "learning_rate": 0.0001263539282990084, + "loss": 0.7283, + "mean_token_accuracy": 0.7852561414241791, + "num_tokens": 124831965.0, + "step": 36690 + }, + { + "epoch": 0.36834076036773855, + "learning_rate": 0.0001263338552330483, + "loss": 0.7324, + "mean_token_accuracy": 0.7768737018108368, + "num_tokens": 124865812.0, + "step": 36700 + }, + { + "epoch": 0.36844112569753906, + "learning_rate": 0.0001263137821670882, + "loss": 0.741, + "mean_token_accuracy": 0.7810425579547882, + "num_tokens": 124899291.0, + "step": 36710 + }, + { + "epoch": 0.3685414910273395, + "learning_rate": 0.0001262937091011281, + "loss": 0.7568, + "mean_token_accuracy": 0.7733590781688691, + "num_tokens": 124933442.0, + "step": 36720 + }, + { + "epoch": 0.36864185635714, + "learning_rate": 0.00012627363603516802, + "loss": 0.7473, + "mean_token_accuracy": 0.7781011044979096, + "num_tokens": 124966912.0, + "step": 36730 + }, + { + "epoch": 0.3687422216869405, + "learning_rate": 0.00012625356296920793, + "loss": 0.7422, + "mean_token_accuracy": 0.7781444549560547, + "num_tokens": 125000514.0, + "step": 36740 + }, + { + "epoch": 0.36884258701674094, + "learning_rate": 0.00012623348990324783, + "loss": 0.7532, + "mean_token_accuracy": 0.7719095110893249, + "num_tokens": 125034191.0, + "step": 36750 + }, + { + "epoch": 0.3689429523465414, + "learning_rate": 0.00012621341683728774, + "loss": 0.7706, + "mean_token_accuracy": 0.769522351026535, + "num_tokens": 125068318.0, + "step": 36760 + }, + { + "epoch": 0.3690433176763419, + "learning_rate": 0.00012619334377132762, + "loss": 0.7397, + "mean_token_accuracy": 0.7740334391593933, + "num_tokens": 125102526.0, + "step": 36770 + }, + { + "epoch": 0.36914368300614236, + "learning_rate": 0.00012617327070536756, + "loss": 0.7409, + "mean_token_accuracy": 0.7786827027797699, + "num_tokens": 125137056.0, + "step": 36780 + }, + { + "epoch": 0.3692440483359428, + "learning_rate": 0.00012615319763940744, + "loss": 0.7508, + "mean_token_accuracy": 0.7754316866397858, + "num_tokens": 125172222.0, + "step": 36790 + }, + { + "epoch": 0.36934441366574333, + "learning_rate": 0.00012613312457344735, + "loss": 0.7331, + "mean_token_accuracy": 0.7798702359199524, + "num_tokens": 125206714.0, + "step": 36800 + }, + { + "epoch": 0.3694447789955438, + "learning_rate": 0.00012611305150748726, + "loss": 0.753, + "mean_token_accuracy": 0.7793877422809601, + "num_tokens": 125240778.0, + "step": 36810 + }, + { + "epoch": 0.36954514432534424, + "learning_rate": 0.00012609297844152717, + "loss": 0.7496, + "mean_token_accuracy": 0.7778722882270813, + "num_tokens": 125274674.0, + "step": 36820 + }, + { + "epoch": 0.3696455096551447, + "learning_rate": 0.00012607290537556707, + "loss": 0.7401, + "mean_token_accuracy": 0.7754093527793884, + "num_tokens": 125308296.0, + "step": 36830 + }, + { + "epoch": 0.3697458749849452, + "learning_rate": 0.00012605283230960698, + "loss": 0.7658, + "mean_token_accuracy": 0.7728193759918213, + "num_tokens": 125342130.0, + "step": 36840 + }, + { + "epoch": 0.36984624031474567, + "learning_rate": 0.0001260327592436469, + "loss": 0.7711, + "mean_token_accuracy": 0.7682547867298126, + "num_tokens": 125375303.0, + "step": 36850 + }, + { + "epoch": 0.3699466056445461, + "learning_rate": 0.00012601268617768677, + "loss": 0.7434, + "mean_token_accuracy": 0.7757311046123505, + "num_tokens": 125408713.0, + "step": 36860 + }, + { + "epoch": 0.37004697097434663, + "learning_rate": 0.0001259926131117267, + "loss": 0.75, + "mean_token_accuracy": 0.7736545741558075, + "num_tokens": 125442807.0, + "step": 36870 + }, + { + "epoch": 0.3701473363041471, + "learning_rate": 0.0001259725400457666, + "loss": 0.7238, + "mean_token_accuracy": 0.7788444459438324, + "num_tokens": 125476682.0, + "step": 36880 + }, + { + "epoch": 0.37024770163394755, + "learning_rate": 0.0001259524669798065, + "loss": 0.7333, + "mean_token_accuracy": 0.7783869564533233, + "num_tokens": 125510944.0, + "step": 36890 + }, + { + "epoch": 0.37034806696374806, + "learning_rate": 0.0001259323939138464, + "loss": 0.7818, + "mean_token_accuracy": 0.7712550461292267, + "num_tokens": 125544681.0, + "step": 36900 + }, + { + "epoch": 0.3704484322935485, + "learning_rate": 0.00012591232084788631, + "loss": 0.7148, + "mean_token_accuracy": 0.7841877639293671, + "num_tokens": 125579749.0, + "step": 36910 + }, + { + "epoch": 0.37054879762334897, + "learning_rate": 0.0001258922477819262, + "loss": 0.7792, + "mean_token_accuracy": 0.773759263753891, + "num_tokens": 125613366.0, + "step": 36920 + }, + { + "epoch": 0.3706491629531495, + "learning_rate": 0.00012587217471596613, + "loss": 0.7691, + "mean_token_accuracy": 0.7693368136882782, + "num_tokens": 125647466.0, + "step": 36930 + }, + { + "epoch": 0.37074952828294994, + "learning_rate": 0.00012585210165000604, + "loss": 0.7572, + "mean_token_accuracy": 0.7806031584739686, + "num_tokens": 125682089.0, + "step": 36940 + }, + { + "epoch": 0.3708498936127504, + "learning_rate": 0.00012583202858404592, + "loss": 0.7364, + "mean_token_accuracy": 0.7828087329864502, + "num_tokens": 125715999.0, + "step": 36950 + }, + { + "epoch": 0.3709502589425509, + "learning_rate": 0.00012581195551808586, + "loss": 0.7653, + "mean_token_accuracy": 0.7720663547515869, + "num_tokens": 125750224.0, + "step": 36960 + }, + { + "epoch": 0.37105062427235136, + "learning_rate": 0.00012579188245212574, + "loss": 0.7514, + "mean_token_accuracy": 0.7769839286804199, + "num_tokens": 125784255.0, + "step": 36970 + }, + { + "epoch": 0.3711509896021518, + "learning_rate": 0.00012577180938616565, + "loss": 0.7622, + "mean_token_accuracy": 0.7722682952880859, + "num_tokens": 125818557.0, + "step": 36980 + }, + { + "epoch": 0.3712513549319523, + "learning_rate": 0.00012575173632020556, + "loss": 0.7481, + "mean_token_accuracy": 0.7747491598129272, + "num_tokens": 125852593.0, + "step": 36990 + }, + { + "epoch": 0.3713517202617528, + "learning_rate": 0.00012573166325424546, + "loss": 0.7312, + "mean_token_accuracy": 0.7797623395919799, + "num_tokens": 125886279.0, + "step": 37000 + }, + { + "epoch": 0.37145208559155324, + "learning_rate": 0.00012571159018828534, + "loss": 0.7521, + "mean_token_accuracy": 0.775166916847229, + "num_tokens": 125920013.0, + "step": 37010 + }, + { + "epoch": 0.37155245092135375, + "learning_rate": 0.00012569151712232528, + "loss": 0.7385, + "mean_token_accuracy": 0.7798730194568634, + "num_tokens": 125954378.0, + "step": 37020 + }, + { + "epoch": 0.3716528162511542, + "learning_rate": 0.00012567144405636516, + "loss": 0.7952, + "mean_token_accuracy": 0.7619469940662384, + "num_tokens": 125988314.0, + "step": 37030 + }, + { + "epoch": 0.37175318158095466, + "learning_rate": 0.00012565137099040507, + "loss": 0.7297, + "mean_token_accuracy": 0.7822118043899536, + "num_tokens": 126021084.0, + "step": 37040 + }, + { + "epoch": 0.3718535469107552, + "learning_rate": 0.00012563129792444498, + "loss": 0.7615, + "mean_token_accuracy": 0.7743511915206909, + "num_tokens": 126054971.0, + "step": 37050 + }, + { + "epoch": 0.37195391224055563, + "learning_rate": 0.0001256112248584849, + "loss": 0.7542, + "mean_token_accuracy": 0.7733421862125397, + "num_tokens": 126089252.0, + "step": 37060 + }, + { + "epoch": 0.3720542775703561, + "learning_rate": 0.0001255911517925248, + "loss": 0.739, + "mean_token_accuracy": 0.7727400422096252, + "num_tokens": 126123276.0, + "step": 37070 + }, + { + "epoch": 0.3721546429001566, + "learning_rate": 0.0001255710787265647, + "loss": 0.7305, + "mean_token_accuracy": 0.773516982793808, + "num_tokens": 126157140.0, + "step": 37080 + }, + { + "epoch": 0.37225500822995705, + "learning_rate": 0.0001255510056606046, + "loss": 0.7482, + "mean_token_accuracy": 0.7750555634498596, + "num_tokens": 126190891.0, + "step": 37090 + }, + { + "epoch": 0.3723553735597575, + "learning_rate": 0.0001255309325946445, + "loss": 0.779, + "mean_token_accuracy": 0.7678870260715485, + "num_tokens": 126224600.0, + "step": 37100 + }, + { + "epoch": 0.37245573888955796, + "learning_rate": 0.00012551085952868443, + "loss": 0.7706, + "mean_token_accuracy": 0.7689167320728302, + "num_tokens": 126259173.0, + "step": 37110 + }, + { + "epoch": 0.3725561042193585, + "learning_rate": 0.0001254907864627243, + "loss": 0.7361, + "mean_token_accuracy": 0.7755484044551849, + "num_tokens": 126293443.0, + "step": 37120 + }, + { + "epoch": 0.37265646954915893, + "learning_rate": 0.00012547071339676422, + "loss": 0.7743, + "mean_token_accuracy": 0.7669099032878876, + "num_tokens": 126326676.0, + "step": 37130 + }, + { + "epoch": 0.3727568348789594, + "learning_rate": 0.00012545064033080413, + "loss": 0.7481, + "mean_token_accuracy": 0.7756665706634521, + "num_tokens": 126360511.0, + "step": 37140 + }, + { + "epoch": 0.3728572002087599, + "learning_rate": 0.00012543056726484404, + "loss": 0.7877, + "mean_token_accuracy": 0.7703516781330109, + "num_tokens": 126394643.0, + "step": 37150 + }, + { + "epoch": 0.37295756553856035, + "learning_rate": 0.00012541049419888394, + "loss": 0.7954, + "mean_token_accuracy": 0.7689454019069671, + "num_tokens": 126429303.0, + "step": 37160 + }, + { + "epoch": 0.3730579308683608, + "learning_rate": 0.00012539042113292385, + "loss": 0.7471, + "mean_token_accuracy": 0.7690429866313935, + "num_tokens": 126462979.0, + "step": 37170 + }, + { + "epoch": 0.3731582961981613, + "learning_rate": 0.00012537034806696376, + "loss": 0.7615, + "mean_token_accuracy": 0.7736899137496949, + "num_tokens": 126497695.0, + "step": 37180 + }, + { + "epoch": 0.3732586615279618, + "learning_rate": 0.00012535027500100367, + "loss": 0.7522, + "mean_token_accuracy": 0.7704955279827118, + "num_tokens": 126531858.0, + "step": 37190 + }, + { + "epoch": 0.37335902685776223, + "learning_rate": 0.00012533020193504358, + "loss": 0.7859, + "mean_token_accuracy": 0.765929788351059, + "num_tokens": 126565500.0, + "step": 37200 + }, + { + "epoch": 0.37345939218756274, + "learning_rate": 0.00012531012886908346, + "loss": 0.7629, + "mean_token_accuracy": 0.7764375567436218, + "num_tokens": 126598901.0, + "step": 37210 + }, + { + "epoch": 0.3735597575173632, + "learning_rate": 0.0001252900558031234, + "loss": 0.7729, + "mean_token_accuracy": 0.7729214072227478, + "num_tokens": 126632624.0, + "step": 37220 + }, + { + "epoch": 0.37366012284716366, + "learning_rate": 0.00012526998273716328, + "loss": 0.7678, + "mean_token_accuracy": 0.7708661913871765, + "num_tokens": 126666181.0, + "step": 37230 + }, + { + "epoch": 0.37376048817696417, + "learning_rate": 0.00012524990967120318, + "loss": 0.7438, + "mean_token_accuracy": 0.7777769088745117, + "num_tokens": 126700232.0, + "step": 37240 + }, + { + "epoch": 0.3738608535067646, + "learning_rate": 0.0001252298366052431, + "loss": 0.7397, + "mean_token_accuracy": 0.7761428117752075, + "num_tokens": 126734328.0, + "step": 37250 + }, + { + "epoch": 0.3739612188365651, + "learning_rate": 0.000125209763539283, + "loss": 0.7419, + "mean_token_accuracy": 0.7773242831230164, + "num_tokens": 126767999.0, + "step": 37260 + }, + { + "epoch": 0.3740615841663656, + "learning_rate": 0.00012518969047332288, + "loss": 0.785, + "mean_token_accuracy": 0.7692415654659271, + "num_tokens": 126801550.0, + "step": 37270 + }, + { + "epoch": 0.37416194949616605, + "learning_rate": 0.00012516961740736282, + "loss": 0.7339, + "mean_token_accuracy": 0.7795442044734955, + "num_tokens": 126835838.0, + "step": 37280 + }, + { + "epoch": 0.3742623148259665, + "learning_rate": 0.00012514954434140273, + "loss": 0.7749, + "mean_token_accuracy": 0.7730243325233459, + "num_tokens": 126869550.0, + "step": 37290 + }, + { + "epoch": 0.374362680155767, + "learning_rate": 0.0001251294712754426, + "loss": 0.7701, + "mean_token_accuracy": 0.773316603899002, + "num_tokens": 126903801.0, + "step": 37300 + }, + { + "epoch": 0.37446304548556747, + "learning_rate": 0.00012510939820948254, + "loss": 0.7607, + "mean_token_accuracy": 0.7711721777915954, + "num_tokens": 126937835.0, + "step": 37310 + }, + { + "epoch": 0.3745634108153679, + "learning_rate": 0.00012508932514352242, + "loss": 0.7546, + "mean_token_accuracy": 0.7751730561256409, + "num_tokens": 126972570.0, + "step": 37320 + }, + { + "epoch": 0.37466377614516844, + "learning_rate": 0.00012506925207756233, + "loss": 0.7466, + "mean_token_accuracy": 0.7792658150196076, + "num_tokens": 127005529.0, + "step": 37330 + }, + { + "epoch": 0.3747641414749689, + "learning_rate": 0.00012504917901160224, + "loss": 0.7662, + "mean_token_accuracy": 0.7746534407138824, + "num_tokens": 127039792.0, + "step": 37340 + }, + { + "epoch": 0.37486450680476935, + "learning_rate": 0.00012502910594564215, + "loss": 0.7619, + "mean_token_accuracy": 0.769725251197815, + "num_tokens": 127074021.0, + "step": 37350 + }, + { + "epoch": 0.37496487213456986, + "learning_rate": 0.00012500903287968203, + "loss": 0.7462, + "mean_token_accuracy": 0.7742079257965088, + "num_tokens": 127107609.0, + "step": 37360 + }, + { + "epoch": 0.3750652374643703, + "learning_rate": 0.00012498895981372197, + "loss": 0.7579, + "mean_token_accuracy": 0.774655556678772, + "num_tokens": 127141443.0, + "step": 37370 + }, + { + "epoch": 0.37516560279417077, + "learning_rate": 0.00012496888674776185, + "loss": 0.7144, + "mean_token_accuracy": 0.7826993942260743, + "num_tokens": 127175539.0, + "step": 37380 + }, + { + "epoch": 0.3752659681239713, + "learning_rate": 0.00012494881368180176, + "loss": 0.771, + "mean_token_accuracy": 0.7703517079353333, + "num_tokens": 127209830.0, + "step": 37390 + }, + { + "epoch": 0.37536633345377174, + "learning_rate": 0.00012492874061584167, + "loss": 0.7498, + "mean_token_accuracy": 0.7781586468219757, + "num_tokens": 127244945.0, + "step": 37400 + }, + { + "epoch": 0.3754666987835722, + "learning_rate": 0.00012490866754988157, + "loss": 0.7556, + "mean_token_accuracy": 0.7736250162124634, + "num_tokens": 127278901.0, + "step": 37410 + }, + { + "epoch": 0.37556706411337265, + "learning_rate": 0.00012488859448392148, + "loss": 0.76, + "mean_token_accuracy": 0.7787852048873901, + "num_tokens": 127313577.0, + "step": 37420 + }, + { + "epoch": 0.37566742944317316, + "learning_rate": 0.0001248685214179614, + "loss": 0.7328, + "mean_token_accuracy": 0.7778769314289093, + "num_tokens": 127346907.0, + "step": 37430 + }, + { + "epoch": 0.3757677947729736, + "learning_rate": 0.0001248484483520013, + "loss": 0.7852, + "mean_token_accuracy": 0.7669208109378814, + "num_tokens": 127381209.0, + "step": 37440 + }, + { + "epoch": 0.3758681601027741, + "learning_rate": 0.00012482837528604118, + "loss": 0.7606, + "mean_token_accuracy": 0.7742077112197876, + "num_tokens": 127415900.0, + "step": 37450 + }, + { + "epoch": 0.3759685254325746, + "learning_rate": 0.00012480830222008112, + "loss": 0.7384, + "mean_token_accuracy": 0.7786307811737061, + "num_tokens": 127449805.0, + "step": 37460 + }, + { + "epoch": 0.37606889076237504, + "learning_rate": 0.000124788229154121, + "loss": 0.7547, + "mean_token_accuracy": 0.7758641123771668, + "num_tokens": 127484249.0, + "step": 37470 + }, + { + "epoch": 0.3761692560921755, + "learning_rate": 0.0001247681560881609, + "loss": 0.7584, + "mean_token_accuracy": 0.7752665996551513, + "num_tokens": 127518912.0, + "step": 37480 + }, + { + "epoch": 0.376269621421976, + "learning_rate": 0.00012474808302220081, + "loss": 0.7446, + "mean_token_accuracy": 0.7730976998806, + "num_tokens": 127553336.0, + "step": 37490 + }, + { + "epoch": 0.37636998675177646, + "learning_rate": 0.00012472800995624072, + "loss": 0.7123, + "mean_token_accuracy": 0.779695737361908, + "num_tokens": 127587317.0, + "step": 37500 + }, + { + "epoch": 0.3764703520815769, + "learning_rate": 0.00012470793689028063, + "loss": 0.7472, + "mean_token_accuracy": 0.7722173571586609, + "num_tokens": 127620720.0, + "step": 37510 + }, + { + "epoch": 0.37657071741137743, + "learning_rate": 0.00012468786382432054, + "loss": 0.7075, + "mean_token_accuracy": 0.783935296535492, + "num_tokens": 127655610.0, + "step": 37520 + }, + { + "epoch": 0.3766710827411779, + "learning_rate": 0.00012466779075836045, + "loss": 0.7742, + "mean_token_accuracy": 0.7720625638961792, + "num_tokens": 127689079.0, + "step": 37530 + }, + { + "epoch": 0.37677144807097834, + "learning_rate": 0.00012464771769240033, + "loss": 0.7648, + "mean_token_accuracy": 0.7687886416912079, + "num_tokens": 127723638.0, + "step": 37540 + }, + { + "epoch": 0.37687181340077885, + "learning_rate": 0.00012462764462644026, + "loss": 0.7929, + "mean_token_accuracy": 0.766310304403305, + "num_tokens": 127757394.0, + "step": 37550 + }, + { + "epoch": 0.3769721787305793, + "learning_rate": 0.00012460757156048015, + "loss": 0.7529, + "mean_token_accuracy": 0.7758144676685333, + "num_tokens": 127791887.0, + "step": 37560 + }, + { + "epoch": 0.37707254406037977, + "learning_rate": 0.00012458749849452005, + "loss": 0.7444, + "mean_token_accuracy": 0.7755796909332275, + "num_tokens": 127827347.0, + "step": 37570 + }, + { + "epoch": 0.3771729093901803, + "learning_rate": 0.00012456742542855996, + "loss": 0.7616, + "mean_token_accuracy": 0.7779051125049591, + "num_tokens": 127861561.0, + "step": 37580 + }, + { + "epoch": 0.37727327471998073, + "learning_rate": 0.00012454735236259987, + "loss": 0.7472, + "mean_token_accuracy": 0.7814350962638855, + "num_tokens": 127895629.0, + "step": 37590 + }, + { + "epoch": 0.3773736400497812, + "learning_rate": 0.00012452727929663975, + "loss": 0.7546, + "mean_token_accuracy": 0.7693463325500488, + "num_tokens": 127930957.0, + "step": 37600 + }, + { + "epoch": 0.3774740053795817, + "learning_rate": 0.0001245072062306797, + "loss": 0.74, + "mean_token_accuracy": 0.7794726371765137, + "num_tokens": 127964539.0, + "step": 37610 + }, + { + "epoch": 0.37757437070938216, + "learning_rate": 0.00012448713316471957, + "loss": 0.7354, + "mean_token_accuracy": 0.7787318110466004, + "num_tokens": 127997862.0, + "step": 37620 + }, + { + "epoch": 0.3776747360391826, + "learning_rate": 0.00012446706009875948, + "loss": 0.7348, + "mean_token_accuracy": 0.7819286227226258, + "num_tokens": 128031151.0, + "step": 37630 + }, + { + "epoch": 0.3777751013689831, + "learning_rate": 0.00012444698703279941, + "loss": 0.7738, + "mean_token_accuracy": 0.7697048485279083, + "num_tokens": 128065071.0, + "step": 37640 + }, + { + "epoch": 0.3778754666987836, + "learning_rate": 0.0001244269139668393, + "loss": 0.7486, + "mean_token_accuracy": 0.7777126967906952, + "num_tokens": 128098837.0, + "step": 37650 + }, + { + "epoch": 0.37797583202858404, + "learning_rate": 0.0001244068409008792, + "loss": 0.7779, + "mean_token_accuracy": 0.7643070816993713, + "num_tokens": 128132289.0, + "step": 37660 + }, + { + "epoch": 0.37807619735838455, + "learning_rate": 0.0001243867678349191, + "loss": 0.7416, + "mean_token_accuracy": 0.7768400371074676, + "num_tokens": 128166670.0, + "step": 37670 + }, + { + "epoch": 0.378176562688185, + "learning_rate": 0.00012436669476895902, + "loss": 0.7536, + "mean_token_accuracy": 0.7739063024520874, + "num_tokens": 128200677.0, + "step": 37680 + }, + { + "epoch": 0.37827692801798546, + "learning_rate": 0.0001243466217029989, + "loss": 0.7402, + "mean_token_accuracy": 0.772838932275772, + "num_tokens": 128234446.0, + "step": 37690 + }, + { + "epoch": 0.3783772933477859, + "learning_rate": 0.00012432654863703884, + "loss": 0.7492, + "mean_token_accuracy": 0.7724959373474121, + "num_tokens": 128268474.0, + "step": 37700 + }, + { + "epoch": 0.3784776586775864, + "learning_rate": 0.00012430647557107872, + "loss": 0.7496, + "mean_token_accuracy": 0.7706626117229461, + "num_tokens": 128302859.0, + "step": 37710 + }, + { + "epoch": 0.3785780240073869, + "learning_rate": 0.00012428640250511865, + "loss": 0.7588, + "mean_token_accuracy": 0.771821403503418, + "num_tokens": 128336585.0, + "step": 37720 + }, + { + "epoch": 0.37867838933718734, + "learning_rate": 0.00012426632943915854, + "loss": 0.7493, + "mean_token_accuracy": 0.7749598860740662, + "num_tokens": 128370302.0, + "step": 37730 + }, + { + "epoch": 0.37877875466698785, + "learning_rate": 0.00012424625637319844, + "loss": 0.733, + "mean_token_accuracy": 0.781812310218811, + "num_tokens": 128404138.0, + "step": 37740 + }, + { + "epoch": 0.3788791199967883, + "learning_rate": 0.00012422618330723835, + "loss": 0.7596, + "mean_token_accuracy": 0.7723971903324127, + "num_tokens": 128437981.0, + "step": 37750 + }, + { + "epoch": 0.37897948532658876, + "learning_rate": 0.00012420611024127826, + "loss": 0.779, + "mean_token_accuracy": 0.7666724562644959, + "num_tokens": 128472955.0, + "step": 37760 + }, + { + "epoch": 0.3790798506563893, + "learning_rate": 0.00012418603717531817, + "loss": 0.7549, + "mean_token_accuracy": 0.7720897555351257, + "num_tokens": 128506598.0, + "step": 37770 + }, + { + "epoch": 0.37918021598618973, + "learning_rate": 0.00012416596410935808, + "loss": 0.7518, + "mean_token_accuracy": 0.7744605660438537, + "num_tokens": 128540548.0, + "step": 37780 + }, + { + "epoch": 0.3792805813159902, + "learning_rate": 0.00012414589104339799, + "loss": 0.7451, + "mean_token_accuracy": 0.7729527950286865, + "num_tokens": 128574041.0, + "step": 37790 + }, + { + "epoch": 0.3793809466457907, + "learning_rate": 0.00012412581797743787, + "loss": 0.764, + "mean_token_accuracy": 0.7709854006767273, + "num_tokens": 128607976.0, + "step": 37800 + }, + { + "epoch": 0.37948131197559115, + "learning_rate": 0.0001241057449114778, + "loss": 0.7566, + "mean_token_accuracy": 0.775441586971283, + "num_tokens": 128641925.0, + "step": 37810 + }, + { + "epoch": 0.3795816773053916, + "learning_rate": 0.00012408567184551768, + "loss": 0.7684, + "mean_token_accuracy": 0.7733296632766724, + "num_tokens": 128675818.0, + "step": 37820 + }, + { + "epoch": 0.3796820426351921, + "learning_rate": 0.0001240655987795576, + "loss": 0.7503, + "mean_token_accuracy": 0.7772371828556061, + "num_tokens": 128710322.0, + "step": 37830 + }, + { + "epoch": 0.3797824079649926, + "learning_rate": 0.0001240455257135975, + "loss": 0.7498, + "mean_token_accuracy": 0.7743576824665069, + "num_tokens": 128743458.0, + "step": 37840 + }, + { + "epoch": 0.37988277329479303, + "learning_rate": 0.0001240254526476374, + "loss": 0.7628, + "mean_token_accuracy": 0.7745215237140656, + "num_tokens": 128776880.0, + "step": 37850 + }, + { + "epoch": 0.37998313862459354, + "learning_rate": 0.00012400537958167732, + "loss": 0.758, + "mean_token_accuracy": 0.7736277103424072, + "num_tokens": 128810765.0, + "step": 37860 + }, + { + "epoch": 0.380083503954394, + "learning_rate": 0.00012398530651571723, + "loss": 0.7683, + "mean_token_accuracy": 0.7720694422721863, + "num_tokens": 128843795.0, + "step": 37870 + }, + { + "epoch": 0.38018386928419445, + "learning_rate": 0.00012396523344975713, + "loss": 0.7548, + "mean_token_accuracy": 0.7744679272174835, + "num_tokens": 128878547.0, + "step": 37880 + }, + { + "epoch": 0.38028423461399496, + "learning_rate": 0.00012394516038379702, + "loss": 0.7611, + "mean_token_accuracy": 0.772064471244812, + "num_tokens": 128912492.0, + "step": 37890 + }, + { + "epoch": 0.3803845999437954, + "learning_rate": 0.00012392508731783695, + "loss": 0.7212, + "mean_token_accuracy": 0.7858875036239624, + "num_tokens": 128946006.0, + "step": 37900 + }, + { + "epoch": 0.3804849652735959, + "learning_rate": 0.00012390501425187683, + "loss": 0.7402, + "mean_token_accuracy": 0.7749140918254852, + "num_tokens": 128980245.0, + "step": 37910 + }, + { + "epoch": 0.3805853306033964, + "learning_rate": 0.00012388494118591674, + "loss": 0.7779, + "mean_token_accuracy": 0.7678647816181183, + "num_tokens": 129013458.0, + "step": 37920 + }, + { + "epoch": 0.38068569593319684, + "learning_rate": 0.00012386486811995665, + "loss": 0.7517, + "mean_token_accuracy": 0.7781884849071503, + "num_tokens": 129047531.0, + "step": 37930 + }, + { + "epoch": 0.3807860612629973, + "learning_rate": 0.00012384479505399656, + "loss": 0.7385, + "mean_token_accuracy": 0.7778566002845764, + "num_tokens": 129081531.0, + "step": 37940 + }, + { + "epoch": 0.3808864265927978, + "learning_rate": 0.00012382472198803644, + "loss": 0.767, + "mean_token_accuracy": 0.7704708695411682, + "num_tokens": 129115716.0, + "step": 37950 + }, + { + "epoch": 0.38098679192259827, + "learning_rate": 0.00012380464892207638, + "loss": 0.7781, + "mean_token_accuracy": 0.7695282697677612, + "num_tokens": 129150803.0, + "step": 37960 + }, + { + "epoch": 0.3810871572523987, + "learning_rate": 0.00012378457585611626, + "loss": 0.7717, + "mean_token_accuracy": 0.7646220207214356, + "num_tokens": 129184192.0, + "step": 37970 + }, + { + "epoch": 0.3811875225821992, + "learning_rate": 0.00012376450279015616, + "loss": 0.7709, + "mean_token_accuracy": 0.7719972848892211, + "num_tokens": 129217864.0, + "step": 37980 + }, + { + "epoch": 0.3812878879119997, + "learning_rate": 0.0001237444297241961, + "loss": 0.7496, + "mean_token_accuracy": 0.7696025133132934, + "num_tokens": 129251618.0, + "step": 37990 + }, + { + "epoch": 0.38138825324180015, + "learning_rate": 0.00012372435665823598, + "loss": 0.7725, + "mean_token_accuracy": 0.7679459154605865, + "num_tokens": 129285137.0, + "step": 38000 + }, + { + "epoch": 0.3814886185716006, + "learning_rate": 0.0001237042835922759, + "loss": 0.7738, + "mean_token_accuracy": 0.7686336696147918, + "num_tokens": 129318834.0, + "step": 38010 + }, + { + "epoch": 0.3815889839014011, + "learning_rate": 0.0001236842105263158, + "loss": 0.7478, + "mean_token_accuracy": 0.7723007798194885, + "num_tokens": 129353198.0, + "step": 38020 + }, + { + "epoch": 0.38168934923120157, + "learning_rate": 0.0001236641374603557, + "loss": 0.7817, + "mean_token_accuracy": 0.7713904976844788, + "num_tokens": 129387340.0, + "step": 38030 + }, + { + "epoch": 0.381789714561002, + "learning_rate": 0.0001236440643943956, + "loss": 0.7343, + "mean_token_accuracy": 0.7806975066661834, + "num_tokens": 129421396.0, + "step": 38040 + }, + { + "epoch": 0.38189007989080254, + "learning_rate": 0.00012362399132843552, + "loss": 0.7543, + "mean_token_accuracy": 0.7753277361392975, + "num_tokens": 129454695.0, + "step": 38050 + }, + { + "epoch": 0.381990445220603, + "learning_rate": 0.0001236039182624754, + "loss": 0.7086, + "mean_token_accuracy": 0.787426209449768, + "num_tokens": 129487747.0, + "step": 38060 + }, + { + "epoch": 0.38209081055040345, + "learning_rate": 0.00012358384519651531, + "loss": 0.7587, + "mean_token_accuracy": 0.7715207815170289, + "num_tokens": 129521523.0, + "step": 38070 + }, + { + "epoch": 0.38219117588020396, + "learning_rate": 0.00012356377213055522, + "loss": 0.7447, + "mean_token_accuracy": 0.7790843069553375, + "num_tokens": 129555619.0, + "step": 38080 + }, + { + "epoch": 0.3822915412100044, + "learning_rate": 0.00012354369906459513, + "loss": 0.7683, + "mean_token_accuracy": 0.770205271244049, + "num_tokens": 129590842.0, + "step": 38090 + }, + { + "epoch": 0.38239190653980487, + "learning_rate": 0.00012352362599863504, + "loss": 0.7362, + "mean_token_accuracy": 0.7805061757564544, + "num_tokens": 129625176.0, + "step": 38100 + }, + { + "epoch": 0.3824922718696054, + "learning_rate": 0.00012350355293267495, + "loss": 0.7554, + "mean_token_accuracy": 0.77535160779953, + "num_tokens": 129660292.0, + "step": 38110 + }, + { + "epoch": 0.38259263719940584, + "learning_rate": 0.00012348347986671486, + "loss": 0.7569, + "mean_token_accuracy": 0.7780167102813721, + "num_tokens": 129693764.0, + "step": 38120 + }, + { + "epoch": 0.3826930025292063, + "learning_rate": 0.00012346340680075474, + "loss": 0.7535, + "mean_token_accuracy": 0.7745382368564606, + "num_tokens": 129728851.0, + "step": 38130 + }, + { + "epoch": 0.3827933678590068, + "learning_rate": 0.00012344333373479467, + "loss": 0.7453, + "mean_token_accuracy": 0.7712686598300934, + "num_tokens": 129762943.0, + "step": 38140 + }, + { + "epoch": 0.38289373318880726, + "learning_rate": 0.00012342326066883455, + "loss": 0.7849, + "mean_token_accuracy": 0.7647489547729492, + "num_tokens": 129797045.0, + "step": 38150 + }, + { + "epoch": 0.3829940985186077, + "learning_rate": 0.00012340318760287446, + "loss": 0.7676, + "mean_token_accuracy": 0.7758142232894898, + "num_tokens": 129831329.0, + "step": 38160 + }, + { + "epoch": 0.38309446384840823, + "learning_rate": 0.00012338311453691437, + "loss": 0.771, + "mean_token_accuracy": 0.7669499278068542, + "num_tokens": 129865473.0, + "step": 38170 + }, + { + "epoch": 0.3831948291782087, + "learning_rate": 0.00012336304147095428, + "loss": 0.7539, + "mean_token_accuracy": 0.776168817281723, + "num_tokens": 129899116.0, + "step": 38180 + }, + { + "epoch": 0.38329519450800914, + "learning_rate": 0.0001233429684049942, + "loss": 0.7457, + "mean_token_accuracy": 0.776677405834198, + "num_tokens": 129932521.0, + "step": 38190 + }, + { + "epoch": 0.38339555983780965, + "learning_rate": 0.0001233228953390341, + "loss": 0.6868, + "mean_token_accuracy": 0.7909096240997314, + "num_tokens": 129967257.0, + "step": 38200 + }, + { + "epoch": 0.3834959251676101, + "learning_rate": 0.000123302822273074, + "loss": 0.7614, + "mean_token_accuracy": 0.7738026797771453, + "num_tokens": 130000891.0, + "step": 38210 + }, + { + "epoch": 0.38359629049741056, + "learning_rate": 0.00012328274920711389, + "loss": 0.7661, + "mean_token_accuracy": 0.774511742591858, + "num_tokens": 130035102.0, + "step": 38220 + }, + { + "epoch": 0.3836966558272111, + "learning_rate": 0.00012326267614115382, + "loss": 0.7562, + "mean_token_accuracy": 0.7748418092727661, + "num_tokens": 130068809.0, + "step": 38230 + }, + { + "epoch": 0.38379702115701153, + "learning_rate": 0.0001232426030751937, + "loss": 0.749, + "mean_token_accuracy": 0.7768145143985749, + "num_tokens": 130102140.0, + "step": 38240 + }, + { + "epoch": 0.383897386486812, + "learning_rate": 0.0001232225300092336, + "loss": 0.7685, + "mean_token_accuracy": 0.7733086585998535, + "num_tokens": 130136159.0, + "step": 38250 + }, + { + "epoch": 0.38399775181661244, + "learning_rate": 0.00012320245694327352, + "loss": 0.7713, + "mean_token_accuracy": 0.7655957579612732, + "num_tokens": 130171165.0, + "step": 38260 + }, + { + "epoch": 0.38409811714641295, + "learning_rate": 0.00012318238387731343, + "loss": 0.7384, + "mean_token_accuracy": 0.7753102958202363, + "num_tokens": 130204632.0, + "step": 38270 + }, + { + "epoch": 0.3841984824762134, + "learning_rate": 0.00012316231081135334, + "loss": 0.7387, + "mean_token_accuracy": 0.7776745617389679, + "num_tokens": 130238758.0, + "step": 38280 + }, + { + "epoch": 0.38429884780601387, + "learning_rate": 0.00012314223774539325, + "loss": 0.7489, + "mean_token_accuracy": 0.7758101284503937, + "num_tokens": 130272703.0, + "step": 38290 + }, + { + "epoch": 0.3843992131358144, + "learning_rate": 0.00012312216467943313, + "loss": 0.7628, + "mean_token_accuracy": 0.7725667238235474, + "num_tokens": 130305097.0, + "step": 38300 + }, + { + "epoch": 0.38449957846561483, + "learning_rate": 0.00012310209161347306, + "loss": 0.748, + "mean_token_accuracy": 0.774202698469162, + "num_tokens": 130338847.0, + "step": 38310 + }, + { + "epoch": 0.3845999437954153, + "learning_rate": 0.00012308201854751294, + "loss": 0.7947, + "mean_token_accuracy": 0.7686450958251954, + "num_tokens": 130372560.0, + "step": 38320 + }, + { + "epoch": 0.3847003091252158, + "learning_rate": 0.00012306194548155285, + "loss": 0.7729, + "mean_token_accuracy": 0.7694132089614868, + "num_tokens": 130406376.0, + "step": 38330 + }, + { + "epoch": 0.38480067445501626, + "learning_rate": 0.0001230418724155928, + "loss": 0.7407, + "mean_token_accuracy": 0.7745043933391571, + "num_tokens": 130440324.0, + "step": 38340 + }, + { + "epoch": 0.3849010397848167, + "learning_rate": 0.00012302179934963267, + "loss": 0.7386, + "mean_token_accuracy": 0.7757987082004547, + "num_tokens": 130474536.0, + "step": 38350 + }, + { + "epoch": 0.3850014051146172, + "learning_rate": 0.00012300172628367258, + "loss": 0.7236, + "mean_token_accuracy": 0.7806441009044647, + "num_tokens": 130508465.0, + "step": 38360 + }, + { + "epoch": 0.3851017704444177, + "learning_rate": 0.00012298165321771249, + "loss": 0.7572, + "mean_token_accuracy": 0.7715339839458466, + "num_tokens": 130542995.0, + "step": 38370 + }, + { + "epoch": 0.38520213577421814, + "learning_rate": 0.0001229615801517524, + "loss": 0.7555, + "mean_token_accuracy": 0.7743283450603485, + "num_tokens": 130577429.0, + "step": 38380 + }, + { + "epoch": 0.38530250110401865, + "learning_rate": 0.00012294150708579228, + "loss": 0.7389, + "mean_token_accuracy": 0.7832254827022552, + "num_tokens": 130611545.0, + "step": 38390 + }, + { + "epoch": 0.3854028664338191, + "learning_rate": 0.0001229214340198322, + "loss": 0.7191, + "mean_token_accuracy": 0.7876890063285827, + "num_tokens": 130646019.0, + "step": 38400 + }, + { + "epoch": 0.38550323176361956, + "learning_rate": 0.0001229013609538721, + "loss": 0.7649, + "mean_token_accuracy": 0.7704071640968323, + "num_tokens": 130680793.0, + "step": 38410 + }, + { + "epoch": 0.38560359709342007, + "learning_rate": 0.000122881287887912, + "loss": 0.7601, + "mean_token_accuracy": 0.7702291071414947, + "num_tokens": 130713834.0, + "step": 38420 + }, + { + "epoch": 0.3857039624232205, + "learning_rate": 0.0001228612148219519, + "loss": 0.7368, + "mean_token_accuracy": 0.7808869123458863, + "num_tokens": 130747439.0, + "step": 38430 + }, + { + "epoch": 0.385804327753021, + "learning_rate": 0.00012284114175599182, + "loss": 0.7588, + "mean_token_accuracy": 0.775489890575409, + "num_tokens": 130780557.0, + "step": 38440 + }, + { + "epoch": 0.3859046930828215, + "learning_rate": 0.00012282106869003173, + "loss": 0.7447, + "mean_token_accuracy": 0.7734454572200775, + "num_tokens": 130814569.0, + "step": 38450 + }, + { + "epoch": 0.38600505841262195, + "learning_rate": 0.00012280099562407163, + "loss": 0.7276, + "mean_token_accuracy": 0.7792356193065644, + "num_tokens": 130848026.0, + "step": 38460 + }, + { + "epoch": 0.3861054237424224, + "learning_rate": 0.00012278092255811154, + "loss": 0.7464, + "mean_token_accuracy": 0.778665965795517, + "num_tokens": 130882409.0, + "step": 38470 + }, + { + "epoch": 0.3862057890722229, + "learning_rate": 0.00012276084949215142, + "loss": 0.7307, + "mean_token_accuracy": 0.781080013513565, + "num_tokens": 130916451.0, + "step": 38480 + }, + { + "epoch": 0.38630615440202337, + "learning_rate": 0.00012274077642619136, + "loss": 0.776, + "mean_token_accuracy": 0.7673209249973297, + "num_tokens": 130950498.0, + "step": 38490 + }, + { + "epoch": 0.3864065197318238, + "learning_rate": 0.00012272070336023124, + "loss": 0.7404, + "mean_token_accuracy": 0.7765831172466278, + "num_tokens": 130984362.0, + "step": 38500 + }, + { + "epoch": 0.38650688506162434, + "learning_rate": 0.00012270063029427115, + "loss": 0.7406, + "mean_token_accuracy": 0.7788306057453156, + "num_tokens": 131019472.0, + "step": 38510 + }, + { + "epoch": 0.3866072503914248, + "learning_rate": 0.00012268055722831106, + "loss": 0.7669, + "mean_token_accuracy": 0.7686613500118256, + "num_tokens": 131053639.0, + "step": 38520 + }, + { + "epoch": 0.38670761572122525, + "learning_rate": 0.00012266048416235097, + "loss": 0.789, + "mean_token_accuracy": 0.769978278875351, + "num_tokens": 131087555.0, + "step": 38530 + }, + { + "epoch": 0.3868079810510257, + "learning_rate": 0.00012264041109639087, + "loss": 0.7668, + "mean_token_accuracy": 0.7697659850120544, + "num_tokens": 131121449.0, + "step": 38540 + }, + { + "epoch": 0.3869083463808262, + "learning_rate": 0.00012262033803043078, + "loss": 0.7858, + "mean_token_accuracy": 0.7668357491493225, + "num_tokens": 131155915.0, + "step": 38550 + }, + { + "epoch": 0.3870087117106267, + "learning_rate": 0.0001226002649644707, + "loss": 0.7612, + "mean_token_accuracy": 0.7744127333164215, + "num_tokens": 131189730.0, + "step": 38560 + }, + { + "epoch": 0.38710907704042713, + "learning_rate": 0.00012258019189851057, + "loss": 0.7414, + "mean_token_accuracy": 0.775093162059784, + "num_tokens": 131223537.0, + "step": 38570 + }, + { + "epoch": 0.38720944237022764, + "learning_rate": 0.0001225601188325505, + "loss": 0.7579, + "mean_token_accuracy": 0.7749661922454834, + "num_tokens": 131257383.0, + "step": 38580 + }, + { + "epoch": 0.3873098077000281, + "learning_rate": 0.0001225400457665904, + "loss": 0.7249, + "mean_token_accuracy": 0.7785895526409149, + "num_tokens": 131291828.0, + "step": 38590 + }, + { + "epoch": 0.38741017302982855, + "learning_rate": 0.0001225199727006303, + "loss": 0.7819, + "mean_token_accuracy": 0.7721785426139831, + "num_tokens": 131325991.0, + "step": 38600 + }, + { + "epoch": 0.38751053835962906, + "learning_rate": 0.0001224998996346702, + "loss": 0.7303, + "mean_token_accuracy": 0.7802187919616699, + "num_tokens": 131359877.0, + "step": 38610 + }, + { + "epoch": 0.3876109036894295, + "learning_rate": 0.00012247982656871011, + "loss": 0.7423, + "mean_token_accuracy": 0.7740880131721497, + "num_tokens": 131393686.0, + "step": 38620 + }, + { + "epoch": 0.38771126901923, + "learning_rate": 0.00012245975350275, + "loss": 0.7778, + "mean_token_accuracy": 0.7720871508121491, + "num_tokens": 131427396.0, + "step": 38630 + }, + { + "epoch": 0.3878116343490305, + "learning_rate": 0.00012243968043678993, + "loss": 0.7583, + "mean_token_accuracy": 0.7709931194782257, + "num_tokens": 131462104.0, + "step": 38640 + }, + { + "epoch": 0.38791199967883094, + "learning_rate": 0.0001224196073708298, + "loss": 0.7991, + "mean_token_accuracy": 0.7669247448444366, + "num_tokens": 131495929.0, + "step": 38650 + }, + { + "epoch": 0.3880123650086314, + "learning_rate": 0.00012239953430486972, + "loss": 0.7608, + "mean_token_accuracy": 0.7727199912071228, + "num_tokens": 131530577.0, + "step": 38660 + }, + { + "epoch": 0.3881127303384319, + "learning_rate": 0.00012237946123890963, + "loss": 0.7783, + "mean_token_accuracy": 0.7702851474285126, + "num_tokens": 131564373.0, + "step": 38670 + }, + { + "epoch": 0.38821309566823237, + "learning_rate": 0.00012235938817294954, + "loss": 0.7544, + "mean_token_accuracy": 0.777365791797638, + "num_tokens": 131598366.0, + "step": 38680 + }, + { + "epoch": 0.3883134609980328, + "learning_rate": 0.00012233931510698945, + "loss": 0.691, + "mean_token_accuracy": 0.7855935454368591, + "num_tokens": 131632672.0, + "step": 38690 + }, + { + "epoch": 0.38841382632783333, + "learning_rate": 0.00012231924204102936, + "loss": 0.7812, + "mean_token_accuracy": 0.767137199640274, + "num_tokens": 131666443.0, + "step": 38700 + }, + { + "epoch": 0.3885141916576338, + "learning_rate": 0.00012229916897506926, + "loss": 0.7284, + "mean_token_accuracy": 0.7804687798023224, + "num_tokens": 131700246.0, + "step": 38710 + }, + { + "epoch": 0.38861455698743425, + "learning_rate": 0.00012227909590910915, + "loss": 0.755, + "mean_token_accuracy": 0.7715389132499695, + "num_tokens": 131734412.0, + "step": 38720 + }, + { + "epoch": 0.38871492231723476, + "learning_rate": 0.00012225902284314908, + "loss": 0.7426, + "mean_token_accuracy": 0.7703909456729889, + "num_tokens": 131768375.0, + "step": 38730 + }, + { + "epoch": 0.3888152876470352, + "learning_rate": 0.00012223894977718896, + "loss": 0.729, + "mean_token_accuracy": 0.7757822453975678, + "num_tokens": 131802755.0, + "step": 38740 + }, + { + "epoch": 0.38891565297683567, + "learning_rate": 0.00012221887671122887, + "loss": 0.7558, + "mean_token_accuracy": 0.7776188731193543, + "num_tokens": 131836704.0, + "step": 38750 + }, + { + "epoch": 0.3890160183066362, + "learning_rate": 0.00012219880364526878, + "loss": 0.7869, + "mean_token_accuracy": 0.7667187333106995, + "num_tokens": 131869974.0, + "step": 38760 + }, + { + "epoch": 0.38911638363643664, + "learning_rate": 0.0001221787305793087, + "loss": 0.7579, + "mean_token_accuracy": 0.7685837090015412, + "num_tokens": 131904038.0, + "step": 38770 + }, + { + "epoch": 0.3892167489662371, + "learning_rate": 0.0001221586575133486, + "loss": 0.7767, + "mean_token_accuracy": 0.7679896771907806, + "num_tokens": 131937738.0, + "step": 38780 + }, + { + "epoch": 0.3893171142960376, + "learning_rate": 0.0001221385844473885, + "loss": 0.7818, + "mean_token_accuracy": 0.7681105613708497, + "num_tokens": 131971935.0, + "step": 38790 + }, + { + "epoch": 0.38941747962583806, + "learning_rate": 0.0001221185113814284, + "loss": 0.7328, + "mean_token_accuracy": 0.7784608542919159, + "num_tokens": 132006571.0, + "step": 38800 + }, + { + "epoch": 0.3895178449556385, + "learning_rate": 0.0001220984383154683, + "loss": 0.7608, + "mean_token_accuracy": 0.7722057044506073, + "num_tokens": 132040572.0, + "step": 38810 + }, + { + "epoch": 0.38961821028543897, + "learning_rate": 0.00012207836524950823, + "loss": 0.7398, + "mean_token_accuracy": 0.7809996604919434, + "num_tokens": 132074680.0, + "step": 38820 + }, + { + "epoch": 0.3897185756152395, + "learning_rate": 0.00012205829218354811, + "loss": 0.7421, + "mean_token_accuracy": 0.7776970565319061, + "num_tokens": 132108596.0, + "step": 38830 + }, + { + "epoch": 0.38981894094503994, + "learning_rate": 0.00012203821911758802, + "loss": 0.7506, + "mean_token_accuracy": 0.7727792620658874, + "num_tokens": 132142672.0, + "step": 38840 + }, + { + "epoch": 0.3899193062748404, + "learning_rate": 0.00012201814605162794, + "loss": 0.7424, + "mean_token_accuracy": 0.7815340638160706, + "num_tokens": 132176880.0, + "step": 38850 + }, + { + "epoch": 0.3900196716046409, + "learning_rate": 0.00012199807298566784, + "loss": 0.7745, + "mean_token_accuracy": 0.7714296519756317, + "num_tokens": 132210013.0, + "step": 38860 + }, + { + "epoch": 0.39012003693444136, + "learning_rate": 0.00012197799991970776, + "loss": 0.7401, + "mean_token_accuracy": 0.7776513814926147, + "num_tokens": 132244647.0, + "step": 38870 + }, + { + "epoch": 0.3902204022642418, + "learning_rate": 0.00012195792685374765, + "loss": 0.7731, + "mean_token_accuracy": 0.7630275428295136, + "num_tokens": 132279247.0, + "step": 38880 + }, + { + "epoch": 0.39032076759404233, + "learning_rate": 0.00012193785378778755, + "loss": 0.7405, + "mean_token_accuracy": 0.7797455608844757, + "num_tokens": 132314044.0, + "step": 38890 + }, + { + "epoch": 0.3904211329238428, + "learning_rate": 0.00012191778072182747, + "loss": 0.7663, + "mean_token_accuracy": 0.765515285730362, + "num_tokens": 132347953.0, + "step": 38900 + }, + { + "epoch": 0.39052149825364324, + "learning_rate": 0.00012189770765586736, + "loss": 0.7662, + "mean_token_accuracy": 0.7708156883716584, + "num_tokens": 132382564.0, + "step": 38910 + }, + { + "epoch": 0.39062186358344375, + "learning_rate": 0.00012187763458990726, + "loss": 0.7704, + "mean_token_accuracy": 0.7723477423191071, + "num_tokens": 132416001.0, + "step": 38920 + }, + { + "epoch": 0.3907222289132442, + "learning_rate": 0.00012185756152394718, + "loss": 0.7667, + "mean_token_accuracy": 0.7714898586273193, + "num_tokens": 132450365.0, + "step": 38930 + }, + { + "epoch": 0.39082259424304466, + "learning_rate": 0.00012183748845798708, + "loss": 0.7166, + "mean_token_accuracy": 0.7790085256099701, + "num_tokens": 132484146.0, + "step": 38940 + }, + { + "epoch": 0.3909229595728452, + "learning_rate": 0.00012181741539202698, + "loss": 0.7511, + "mean_token_accuracy": 0.7746637761592865, + "num_tokens": 132518411.0, + "step": 38950 + }, + { + "epoch": 0.39102332490264563, + "learning_rate": 0.0001217973423260669, + "loss": 0.7379, + "mean_token_accuracy": 0.7813819944858551, + "num_tokens": 132552330.0, + "step": 38960 + }, + { + "epoch": 0.3911236902324461, + "learning_rate": 0.0001217772692601068, + "loss": 0.746, + "mean_token_accuracy": 0.7709066867828369, + "num_tokens": 132586964.0, + "step": 38970 + }, + { + "epoch": 0.3912240555622466, + "learning_rate": 0.0001217571961941467, + "loss": 0.7537, + "mean_token_accuracy": 0.7693379759788513, + "num_tokens": 132620807.0, + "step": 38980 + }, + { + "epoch": 0.39132442089204705, + "learning_rate": 0.00012173712312818662, + "loss": 0.7643, + "mean_token_accuracy": 0.7710390269756318, + "num_tokens": 132655281.0, + "step": 38990 + }, + { + "epoch": 0.3914247862218475, + "learning_rate": 0.00012171705006222651, + "loss": 0.7218, + "mean_token_accuracy": 0.7797894060611725, + "num_tokens": 132689630.0, + "step": 39000 + }, + { + "epoch": 0.391525151551648, + "learning_rate": 0.00012169697699626641, + "loss": 0.7749, + "mean_token_accuracy": 0.7722760915756226, + "num_tokens": 132724265.0, + "step": 39010 + }, + { + "epoch": 0.3916255168814485, + "learning_rate": 0.00012167690393030633, + "loss": 0.7282, + "mean_token_accuracy": 0.7828829348087311, + "num_tokens": 132758592.0, + "step": 39020 + }, + { + "epoch": 0.39172588221124893, + "learning_rate": 0.00012165683086434623, + "loss": 0.7601, + "mean_token_accuracy": 0.7701749205589294, + "num_tokens": 132791836.0, + "step": 39030 + }, + { + "epoch": 0.39182624754104944, + "learning_rate": 0.00012163675779838612, + "loss": 0.7761, + "mean_token_accuracy": 0.7680363118648529, + "num_tokens": 132825788.0, + "step": 39040 + }, + { + "epoch": 0.3919266128708499, + "learning_rate": 0.00012161668473242604, + "loss": 0.7336, + "mean_token_accuracy": 0.7725139141082764, + "num_tokens": 132860034.0, + "step": 39050 + }, + { + "epoch": 0.39202697820065036, + "learning_rate": 0.00012159661166646594, + "loss": 0.7484, + "mean_token_accuracy": 0.7744539499282836, + "num_tokens": 132893613.0, + "step": 39060 + }, + { + "epoch": 0.39212734353045087, + "learning_rate": 0.00012157653860050585, + "loss": 0.7464, + "mean_token_accuracy": 0.7795374810695648, + "num_tokens": 132927565.0, + "step": 39070 + }, + { + "epoch": 0.3922277088602513, + "learning_rate": 0.00012155646553454575, + "loss": 0.752, + "mean_token_accuracy": 0.7768670856952667, + "num_tokens": 132962180.0, + "step": 39080 + }, + { + "epoch": 0.3923280741900518, + "learning_rate": 0.00012153639246858566, + "loss": 0.7512, + "mean_token_accuracy": 0.7783297538757324, + "num_tokens": 132996930.0, + "step": 39090 + }, + { + "epoch": 0.39242843951985223, + "learning_rate": 0.00012151631940262556, + "loss": 0.7484, + "mean_token_accuracy": 0.7781550347805023, + "num_tokens": 133031217.0, + "step": 39100 + }, + { + "epoch": 0.39252880484965275, + "learning_rate": 0.00012149624633666548, + "loss": 0.7325, + "mean_token_accuracy": 0.7798486769199371, + "num_tokens": 133065608.0, + "step": 39110 + }, + { + "epoch": 0.3926291701794532, + "learning_rate": 0.00012147617327070537, + "loss": 0.7756, + "mean_token_accuracy": 0.7634629428386688, + "num_tokens": 133099837.0, + "step": 39120 + }, + { + "epoch": 0.39272953550925366, + "learning_rate": 0.00012145610020474527, + "loss": 0.7603, + "mean_token_accuracy": 0.7756829202175141, + "num_tokens": 133132890.0, + "step": 39130 + }, + { + "epoch": 0.39282990083905417, + "learning_rate": 0.00012143602713878519, + "loss": 0.7536, + "mean_token_accuracy": 0.7724991142749786, + "num_tokens": 133166951.0, + "step": 39140 + }, + { + "epoch": 0.3929302661688546, + "learning_rate": 0.00012141595407282509, + "loss": 0.7772, + "mean_token_accuracy": 0.7673039019107819, + "num_tokens": 133200373.0, + "step": 39150 + }, + { + "epoch": 0.3930306314986551, + "learning_rate": 0.00012139588100686498, + "loss": 0.7418, + "mean_token_accuracy": 0.7788579583168029, + "num_tokens": 133234595.0, + "step": 39160 + }, + { + "epoch": 0.3931309968284556, + "learning_rate": 0.0001213758079409049, + "loss": 0.7541, + "mean_token_accuracy": 0.7733618021011353, + "num_tokens": 133268711.0, + "step": 39170 + }, + { + "epoch": 0.39323136215825605, + "learning_rate": 0.0001213557348749448, + "loss": 0.7494, + "mean_token_accuracy": 0.7766754031181335, + "num_tokens": 133302600.0, + "step": 39180 + }, + { + "epoch": 0.3933317274880565, + "learning_rate": 0.0001213356618089847, + "loss": 0.7122, + "mean_token_accuracy": 0.7791902840137481, + "num_tokens": 133336578.0, + "step": 39190 + }, + { + "epoch": 0.393432092817857, + "learning_rate": 0.00012131558874302463, + "loss": 0.7321, + "mean_token_accuracy": 0.780260443687439, + "num_tokens": 133371034.0, + "step": 39200 + }, + { + "epoch": 0.39353245814765747, + "learning_rate": 0.00012129551567706452, + "loss": 0.7377, + "mean_token_accuracy": 0.7821172118186951, + "num_tokens": 133405477.0, + "step": 39210 + }, + { + "epoch": 0.3936328234774579, + "learning_rate": 0.00012127544261110442, + "loss": 0.7296, + "mean_token_accuracy": 0.7814566135406494, + "num_tokens": 133438630.0, + "step": 39220 + }, + { + "epoch": 0.39373318880725844, + "learning_rate": 0.00012125536954514434, + "loss": 0.7748, + "mean_token_accuracy": 0.7685065865516663, + "num_tokens": 133472765.0, + "step": 39230 + }, + { + "epoch": 0.3938335541370589, + "learning_rate": 0.00012123529647918423, + "loss": 0.7582, + "mean_token_accuracy": 0.7735672891139984, + "num_tokens": 133507592.0, + "step": 39240 + }, + { + "epoch": 0.39393391946685935, + "learning_rate": 0.00012121522341322413, + "loss": 0.7449, + "mean_token_accuracy": 0.7802322506904602, + "num_tokens": 133541214.0, + "step": 39250 + }, + { + "epoch": 0.39403428479665986, + "learning_rate": 0.00012119515034726405, + "loss": 0.7601, + "mean_token_accuracy": 0.7737901687622071, + "num_tokens": 133575816.0, + "step": 39260 + }, + { + "epoch": 0.3941346501264603, + "learning_rate": 0.00012117507728130395, + "loss": 0.7735, + "mean_token_accuracy": 0.7727476596832276, + "num_tokens": 133608864.0, + "step": 39270 + }, + { + "epoch": 0.3942350154562608, + "learning_rate": 0.00012115500421534384, + "loss": 0.7278, + "mean_token_accuracy": 0.7765253186225891, + "num_tokens": 133642999.0, + "step": 39280 + }, + { + "epoch": 0.3943353807860613, + "learning_rate": 0.00012113493114938376, + "loss": 0.7584, + "mean_token_accuracy": 0.7723966479301453, + "num_tokens": 133677280.0, + "step": 39290 + }, + { + "epoch": 0.39443574611586174, + "learning_rate": 0.00012111485808342367, + "loss": 0.7446, + "mean_token_accuracy": 0.7744259595870971, + "num_tokens": 133711493.0, + "step": 39300 + }, + { + "epoch": 0.3945361114456622, + "learning_rate": 0.00012109478501746357, + "loss": 0.7543, + "mean_token_accuracy": 0.7753329038619995, + "num_tokens": 133745072.0, + "step": 39310 + }, + { + "epoch": 0.3946364767754627, + "learning_rate": 0.00012107471195150349, + "loss": 0.7849, + "mean_token_accuracy": 0.7633687257766724, + "num_tokens": 133779839.0, + "step": 39320 + }, + { + "epoch": 0.39473684210526316, + "learning_rate": 0.00012105463888554338, + "loss": 0.7682, + "mean_token_accuracy": 0.7730082750320435, + "num_tokens": 133813760.0, + "step": 39330 + }, + { + "epoch": 0.3948372074350636, + "learning_rate": 0.00012103456581958328, + "loss": 0.7456, + "mean_token_accuracy": 0.7697203040122986, + "num_tokens": 133848294.0, + "step": 39340 + }, + { + "epoch": 0.39493757276486413, + "learning_rate": 0.0001210144927536232, + "loss": 0.7596, + "mean_token_accuracy": 0.7708020269870758, + "num_tokens": 133881934.0, + "step": 39350 + }, + { + "epoch": 0.3950379380946646, + "learning_rate": 0.0001209944196876631, + "loss": 0.7521, + "mean_token_accuracy": 0.7752474427223206, + "num_tokens": 133915804.0, + "step": 39360 + }, + { + "epoch": 0.39513830342446504, + "learning_rate": 0.00012097434662170299, + "loss": 0.7526, + "mean_token_accuracy": 0.7766995847225189, + "num_tokens": 133950193.0, + "step": 39370 + }, + { + "epoch": 0.39523866875426555, + "learning_rate": 0.00012095427355574291, + "loss": 0.7838, + "mean_token_accuracy": 0.7682909846305848, + "num_tokens": 133984092.0, + "step": 39380 + }, + { + "epoch": 0.395339034084066, + "learning_rate": 0.00012093420048978281, + "loss": 0.7449, + "mean_token_accuracy": 0.780186551809311, + "num_tokens": 134018007.0, + "step": 39390 + }, + { + "epoch": 0.39543939941386647, + "learning_rate": 0.00012091412742382272, + "loss": 0.7583, + "mean_token_accuracy": 0.7751919984817505, + "num_tokens": 134052068.0, + "step": 39400 + }, + { + "epoch": 0.3955397647436669, + "learning_rate": 0.00012089405435786262, + "loss": 0.7894, + "mean_token_accuracy": 0.7675959348678589, + "num_tokens": 134086871.0, + "step": 39410 + }, + { + "epoch": 0.39564013007346743, + "learning_rate": 0.00012087398129190253, + "loss": 0.7402, + "mean_token_accuracy": 0.7770104825496673, + "num_tokens": 134121099.0, + "step": 39420 + }, + { + "epoch": 0.3957404954032679, + "learning_rate": 0.00012085390822594244, + "loss": 0.7466, + "mean_token_accuracy": 0.7756132900714874, + "num_tokens": 134154883.0, + "step": 39430 + }, + { + "epoch": 0.39584086073306834, + "learning_rate": 0.00012083383515998235, + "loss": 0.7214, + "mean_token_accuracy": 0.7835146069526673, + "num_tokens": 134188767.0, + "step": 39440 + }, + { + "epoch": 0.39594122606286886, + "learning_rate": 0.00012081376209402224, + "loss": 0.7795, + "mean_token_accuracy": 0.7679894447326661, + "num_tokens": 134222891.0, + "step": 39450 + }, + { + "epoch": 0.3960415913926693, + "learning_rate": 0.00012079368902806217, + "loss": 0.7329, + "mean_token_accuracy": 0.7798572301864624, + "num_tokens": 134257281.0, + "step": 39460 + }, + { + "epoch": 0.39614195672246977, + "learning_rate": 0.00012077361596210206, + "loss": 0.7267, + "mean_token_accuracy": 0.7835379421710968, + "num_tokens": 134291092.0, + "step": 39470 + }, + { + "epoch": 0.3962423220522703, + "learning_rate": 0.00012075354289614196, + "loss": 0.7802, + "mean_token_accuracy": 0.7687345266342163, + "num_tokens": 134325484.0, + "step": 39480 + }, + { + "epoch": 0.39634268738207074, + "learning_rate": 0.00012073346983018188, + "loss": 0.7569, + "mean_token_accuracy": 0.7736931264400482, + "num_tokens": 134360034.0, + "step": 39490 + }, + { + "epoch": 0.3964430527118712, + "learning_rate": 0.00012071339676422177, + "loss": 0.7585, + "mean_token_accuracy": 0.7733866035938263, + "num_tokens": 134393906.0, + "step": 39500 + }, + { + "epoch": 0.3965434180416717, + "learning_rate": 0.00012069332369826167, + "loss": 0.7836, + "mean_token_accuracy": 0.7700192868709564, + "num_tokens": 134428403.0, + "step": 39510 + }, + { + "epoch": 0.39664378337147216, + "learning_rate": 0.00012067325063230159, + "loss": 0.7374, + "mean_token_accuracy": 0.7759145796298981, + "num_tokens": 134462462.0, + "step": 39520 + }, + { + "epoch": 0.3967441487012726, + "learning_rate": 0.00012065317756634148, + "loss": 0.7713, + "mean_token_accuracy": 0.7735425055027008, + "num_tokens": 134496437.0, + "step": 39530 + }, + { + "epoch": 0.3968445140310731, + "learning_rate": 0.00012063310450038139, + "loss": 0.7377, + "mean_token_accuracy": 0.7802790820598602, + "num_tokens": 134530426.0, + "step": 39540 + }, + { + "epoch": 0.3969448793608736, + "learning_rate": 0.00012061303143442131, + "loss": 0.744, + "mean_token_accuracy": 0.7735237538814544, + "num_tokens": 134564435.0, + "step": 39550 + }, + { + "epoch": 0.39704524469067404, + "learning_rate": 0.00012059295836846121, + "loss": 0.7358, + "mean_token_accuracy": 0.7738739252090454, + "num_tokens": 134598618.0, + "step": 39560 + }, + { + "epoch": 0.39714561002047455, + "learning_rate": 0.0001205728853025011, + "loss": 0.7634, + "mean_token_accuracy": 0.7694804608821869, + "num_tokens": 134632116.0, + "step": 39570 + }, + { + "epoch": 0.397245975350275, + "learning_rate": 0.00012055281223654103, + "loss": 0.7379, + "mean_token_accuracy": 0.7793560028076172, + "num_tokens": 134666154.0, + "step": 39580 + }, + { + "epoch": 0.39734634068007546, + "learning_rate": 0.00012053273917058092, + "loss": 0.7504, + "mean_token_accuracy": 0.7775729656219482, + "num_tokens": 134701294.0, + "step": 39590 + }, + { + "epoch": 0.39744670600987597, + "learning_rate": 0.00012051266610462082, + "loss": 0.7706, + "mean_token_accuracy": 0.7736427843570709, + "num_tokens": 134735055.0, + "step": 39600 + }, + { + "epoch": 0.3975470713396764, + "learning_rate": 0.00012049259303866074, + "loss": 0.7713, + "mean_token_accuracy": 0.7698934495449066, + "num_tokens": 134768993.0, + "step": 39610 + }, + { + "epoch": 0.3976474366694769, + "learning_rate": 0.00012047251997270063, + "loss": 0.7671, + "mean_token_accuracy": 0.7665896236896514, + "num_tokens": 134802020.0, + "step": 39620 + }, + { + "epoch": 0.3977478019992774, + "learning_rate": 0.00012045244690674053, + "loss": 0.7667, + "mean_token_accuracy": 0.7705266535282135, + "num_tokens": 134835584.0, + "step": 39630 + }, + { + "epoch": 0.39784816732907785, + "learning_rate": 0.00012043237384078045, + "loss": 0.7747, + "mean_token_accuracy": 0.7658677756786346, + "num_tokens": 134869863.0, + "step": 39640 + }, + { + "epoch": 0.3979485326588783, + "learning_rate": 0.00012041230077482036, + "loss": 0.7431, + "mean_token_accuracy": 0.7791848838329315, + "num_tokens": 134904118.0, + "step": 39650 + }, + { + "epoch": 0.3980488979886788, + "learning_rate": 0.00012039222770886025, + "loss": 0.7636, + "mean_token_accuracy": 0.7708900988101959, + "num_tokens": 134938038.0, + "step": 39660 + }, + { + "epoch": 0.3981492633184793, + "learning_rate": 0.00012037215464290018, + "loss": 0.7603, + "mean_token_accuracy": 0.7700263500213623, + "num_tokens": 134972463.0, + "step": 39670 + }, + { + "epoch": 0.39824962864827973, + "learning_rate": 0.00012035208157694007, + "loss": 0.7457, + "mean_token_accuracy": 0.7756147027015686, + "num_tokens": 135005835.0, + "step": 39680 + }, + { + "epoch": 0.3983499939780802, + "learning_rate": 0.00012033200851097997, + "loss": 0.7457, + "mean_token_accuracy": 0.7762618720531463, + "num_tokens": 135040050.0, + "step": 39690 + }, + { + "epoch": 0.3984503593078807, + "learning_rate": 0.00012031193544501989, + "loss": 0.7786, + "mean_token_accuracy": 0.7641853630542755, + "num_tokens": 135073690.0, + "step": 39700 + }, + { + "epoch": 0.39855072463768115, + "learning_rate": 0.00012029186237905978, + "loss": 0.7627, + "mean_token_accuracy": 0.7746669232845307, + "num_tokens": 135106550.0, + "step": 39710 + }, + { + "epoch": 0.3986510899674816, + "learning_rate": 0.00012027178931309968, + "loss": 0.7691, + "mean_token_accuracy": 0.7719944953918457, + "num_tokens": 135140110.0, + "step": 39720 + }, + { + "epoch": 0.3987514552972821, + "learning_rate": 0.0001202517162471396, + "loss": 0.7505, + "mean_token_accuracy": 0.7685466587543488, + "num_tokens": 135174141.0, + "step": 39730 + }, + { + "epoch": 0.3988518206270826, + "learning_rate": 0.0001202316431811795, + "loss": 0.7435, + "mean_token_accuracy": 0.7785994470119476, + "num_tokens": 135207965.0, + "step": 39740 + }, + { + "epoch": 0.39895218595688303, + "learning_rate": 0.0001202115701152194, + "loss": 0.7542, + "mean_token_accuracy": 0.7713268518447876, + "num_tokens": 135242410.0, + "step": 39750 + }, + { + "epoch": 0.39905255128668354, + "learning_rate": 0.00012019149704925931, + "loss": 0.7346, + "mean_token_accuracy": 0.7775916159152985, + "num_tokens": 135276320.0, + "step": 39760 + }, + { + "epoch": 0.399152916616484, + "learning_rate": 0.00012017142398329922, + "loss": 0.7261, + "mean_token_accuracy": 0.7829974949359894, + "num_tokens": 135310970.0, + "step": 39770 + }, + { + "epoch": 0.39925328194628446, + "learning_rate": 0.00012015135091733911, + "loss": 0.7623, + "mean_token_accuracy": 0.7746733903884888, + "num_tokens": 135345360.0, + "step": 39780 + }, + { + "epoch": 0.39935364727608497, + "learning_rate": 0.00012013127785137904, + "loss": 0.7433, + "mean_token_accuracy": 0.7795181810855866, + "num_tokens": 135379554.0, + "step": 39790 + }, + { + "epoch": 0.3994540126058854, + "learning_rate": 0.00012011120478541893, + "loss": 0.7886, + "mean_token_accuracy": 0.7656014263629913, + "num_tokens": 135413554.0, + "step": 39800 + }, + { + "epoch": 0.3995543779356859, + "learning_rate": 0.00012009113171945883, + "loss": 0.7741, + "mean_token_accuracy": 0.7673084974288941, + "num_tokens": 135447136.0, + "step": 39810 + }, + { + "epoch": 0.3996547432654864, + "learning_rate": 0.00012007105865349875, + "loss": 0.7456, + "mean_token_accuracy": 0.7771454095840454, + "num_tokens": 135481422.0, + "step": 39820 + }, + { + "epoch": 0.39975510859528685, + "learning_rate": 0.00012005098558753864, + "loss": 0.7483, + "mean_token_accuracy": 0.7750567555427551, + "num_tokens": 135516082.0, + "step": 39830 + }, + { + "epoch": 0.3998554739250873, + "learning_rate": 0.00012003091252157854, + "loss": 0.7421, + "mean_token_accuracy": 0.7777432143688202, + "num_tokens": 135550461.0, + "step": 39840 + }, + { + "epoch": 0.3999558392548878, + "learning_rate": 0.00012001083945561846, + "loss": 0.7864, + "mean_token_accuracy": 0.767791497707367, + "num_tokens": 135584405.0, + "step": 39850 + }, + { + "epoch": 0.40005620458468827, + "learning_rate": 0.00011999076638965835, + "loss": 0.7232, + "mean_token_accuracy": 0.7791144847869873, + "num_tokens": 135618466.0, + "step": 39860 + }, + { + "epoch": 0.4001565699144887, + "learning_rate": 0.00011997069332369826, + "loss": 0.7816, + "mean_token_accuracy": 0.7730731844902039, + "num_tokens": 135652625.0, + "step": 39870 + }, + { + "epoch": 0.40025693524428924, + "learning_rate": 0.00011995062025773817, + "loss": 0.7491, + "mean_token_accuracy": 0.7685365915298462, + "num_tokens": 135685999.0, + "step": 39880 + }, + { + "epoch": 0.4003573005740897, + "learning_rate": 0.00011993054719177808, + "loss": 0.7417, + "mean_token_accuracy": 0.7769519567489624, + "num_tokens": 135719647.0, + "step": 39890 + }, + { + "epoch": 0.40045766590389015, + "learning_rate": 0.00011991047412581797, + "loss": 0.7416, + "mean_token_accuracy": 0.7781095504760742, + "num_tokens": 135753435.0, + "step": 39900 + }, + { + "epoch": 0.40055803123369066, + "learning_rate": 0.0001198904010598579, + "loss": 0.7599, + "mean_token_accuracy": 0.7716181695461273, + "num_tokens": 135787223.0, + "step": 39910 + }, + { + "epoch": 0.4006583965634911, + "learning_rate": 0.00011987032799389779, + "loss": 0.7417, + "mean_token_accuracy": 0.7748284220695496, + "num_tokens": 135821663.0, + "step": 39920 + }, + { + "epoch": 0.40075876189329157, + "learning_rate": 0.00011985025492793769, + "loss": 0.7541, + "mean_token_accuracy": 0.7745453119277954, + "num_tokens": 135855973.0, + "step": 39930 + }, + { + "epoch": 0.4008591272230921, + "learning_rate": 0.00011983018186197761, + "loss": 0.7401, + "mean_token_accuracy": 0.778628796339035, + "num_tokens": 135889965.0, + "step": 39940 + }, + { + "epoch": 0.40095949255289254, + "learning_rate": 0.0001198101087960175, + "loss": 0.756, + "mean_token_accuracy": 0.7736190974712371, + "num_tokens": 135923490.0, + "step": 39950 + }, + { + "epoch": 0.401059857882693, + "learning_rate": 0.0001197900357300574, + "loss": 0.7501, + "mean_token_accuracy": 0.7710761725902557, + "num_tokens": 135957766.0, + "step": 39960 + }, + { + "epoch": 0.40116022321249345, + "learning_rate": 0.00011976996266409732, + "loss": 0.7434, + "mean_token_accuracy": 0.7756464302539825, + "num_tokens": 135991673.0, + "step": 39970 + }, + { + "epoch": 0.40126058854229396, + "learning_rate": 0.00011974988959813721, + "loss": 0.7583, + "mean_token_accuracy": 0.7727165937423706, + "num_tokens": 136025278.0, + "step": 39980 + }, + { + "epoch": 0.4013609538720944, + "learning_rate": 0.00011972981653217714, + "loss": 0.7375, + "mean_token_accuracy": 0.7782612979412079, + "num_tokens": 136059283.0, + "step": 39990 + }, + { + "epoch": 0.4014613192018949, + "learning_rate": 0.00011970974346621705, + "loss": 0.7679, + "mean_token_accuracy": 0.7702317774295807, + "num_tokens": 136093114.0, + "step": 40000 + }, + { + "epoch": 0.4015616845316954, + "learning_rate": 0.00011968967040025694, + "loss": 0.7292, + "mean_token_accuracy": 0.7799321055412293, + "num_tokens": 136127593.0, + "step": 40010 + }, + { + "epoch": 0.40166204986149584, + "learning_rate": 0.00011966959733429686, + "loss": 0.7762, + "mean_token_accuracy": 0.7717219829559326, + "num_tokens": 136161130.0, + "step": 40020 + }, + { + "epoch": 0.4017624151912963, + "learning_rate": 0.00011964952426833676, + "loss": 0.7399, + "mean_token_accuracy": 0.7801750481128693, + "num_tokens": 136194702.0, + "step": 40030 + }, + { + "epoch": 0.4018627805210968, + "learning_rate": 0.00011962945120237665, + "loss": 0.7717, + "mean_token_accuracy": 0.7715950429439544, + "num_tokens": 136229077.0, + "step": 40040 + }, + { + "epoch": 0.40196314585089726, + "learning_rate": 0.00011960937813641657, + "loss": 0.7583, + "mean_token_accuracy": 0.7762810230255127, + "num_tokens": 136263119.0, + "step": 40050 + }, + { + "epoch": 0.4020635111806977, + "learning_rate": 0.00011958930507045647, + "loss": 0.763, + "mean_token_accuracy": 0.7726292669773102, + "num_tokens": 136297003.0, + "step": 40060 + }, + { + "epoch": 0.40216387651049823, + "learning_rate": 0.00011956923200449636, + "loss": 0.8073, + "mean_token_accuracy": 0.7658033907413483, + "num_tokens": 136331043.0, + "step": 40070 + }, + { + "epoch": 0.4022642418402987, + "learning_rate": 0.00011954915893853629, + "loss": 0.7467, + "mean_token_accuracy": 0.7768625020980835, + "num_tokens": 136364615.0, + "step": 40080 + }, + { + "epoch": 0.40236460717009914, + "learning_rate": 0.00011952908587257618, + "loss": 0.7678, + "mean_token_accuracy": 0.7703774511814118, + "num_tokens": 136398721.0, + "step": 40090 + }, + { + "epoch": 0.40246497249989965, + "learning_rate": 0.00011950901280661609, + "loss": 0.7614, + "mean_token_accuracy": 0.7728688240051269, + "num_tokens": 136432969.0, + "step": 40100 + }, + { + "epoch": 0.4025653378297001, + "learning_rate": 0.000119488939740656, + "loss": 0.78, + "mean_token_accuracy": 0.771339625120163, + "num_tokens": 136467593.0, + "step": 40110 + }, + { + "epoch": 0.40266570315950057, + "learning_rate": 0.0001194688666746959, + "loss": 0.7264, + "mean_token_accuracy": 0.777644407749176, + "num_tokens": 136501159.0, + "step": 40120 + }, + { + "epoch": 0.4027660684893011, + "learning_rate": 0.0001194487936087358, + "loss": 0.7387, + "mean_token_accuracy": 0.7751397848129272, + "num_tokens": 136535752.0, + "step": 40130 + }, + { + "epoch": 0.40286643381910153, + "learning_rate": 0.00011942872054277572, + "loss": 0.7665, + "mean_token_accuracy": 0.7697070360183715, + "num_tokens": 136570297.0, + "step": 40140 + }, + { + "epoch": 0.402966799148902, + "learning_rate": 0.00011940864747681562, + "loss": 0.7268, + "mean_token_accuracy": 0.7820415377616883, + "num_tokens": 136604191.0, + "step": 40150 + }, + { + "epoch": 0.4030671644787025, + "learning_rate": 0.00011938857441085551, + "loss": 0.7938, + "mean_token_accuracy": 0.7644527673721313, + "num_tokens": 136638222.0, + "step": 40160 + }, + { + "epoch": 0.40316752980850296, + "learning_rate": 0.00011936850134489543, + "loss": 0.7641, + "mean_token_accuracy": 0.7696475744247436, + "num_tokens": 136672379.0, + "step": 40170 + }, + { + "epoch": 0.4032678951383034, + "learning_rate": 0.00011934842827893533, + "loss": 0.7164, + "mean_token_accuracy": 0.7865774869918823, + "num_tokens": 136706577.0, + "step": 40180 + }, + { + "epoch": 0.4033682604681039, + "learning_rate": 0.00011932835521297522, + "loss": 0.7676, + "mean_token_accuracy": 0.7706251263618469, + "num_tokens": 136740564.0, + "step": 40190 + }, + { + "epoch": 0.4034686257979044, + "learning_rate": 0.00011930828214701515, + "loss": 0.746, + "mean_token_accuracy": 0.7773006856441498, + "num_tokens": 136774055.0, + "step": 40200 + }, + { + "epoch": 0.40356899112770483, + "learning_rate": 0.00011928820908105504, + "loss": 0.7551, + "mean_token_accuracy": 0.7801610410213471, + "num_tokens": 136808108.0, + "step": 40210 + }, + { + "epoch": 0.40366935645750535, + "learning_rate": 0.00011926813601509495, + "loss": 0.7513, + "mean_token_accuracy": 0.7703775525093078, + "num_tokens": 136842157.0, + "step": 40220 + }, + { + "epoch": 0.4037697217873058, + "learning_rate": 0.00011924806294913486, + "loss": 0.7527, + "mean_token_accuracy": 0.7736020088195801, + "num_tokens": 136877028.0, + "step": 40230 + }, + { + "epoch": 0.40387008711710626, + "learning_rate": 0.00011922798988317477, + "loss": 0.7598, + "mean_token_accuracy": 0.7710412681102753, + "num_tokens": 136911143.0, + "step": 40240 + }, + { + "epoch": 0.4039704524469067, + "learning_rate": 0.00011920791681721466, + "loss": 0.7682, + "mean_token_accuracy": 0.7682018101215362, + "num_tokens": 136944985.0, + "step": 40250 + }, + { + "epoch": 0.4040708177767072, + "learning_rate": 0.00011918784375125458, + "loss": 0.7538, + "mean_token_accuracy": 0.7723013639450074, + "num_tokens": 136979089.0, + "step": 40260 + }, + { + "epoch": 0.4041711831065077, + "learning_rate": 0.00011916777068529448, + "loss": 0.7589, + "mean_token_accuracy": 0.7686575293540955, + "num_tokens": 137013646.0, + "step": 40270 + }, + { + "epoch": 0.40427154843630814, + "learning_rate": 0.00011914769761933437, + "loss": 0.7563, + "mean_token_accuracy": 0.7762044131755829, + "num_tokens": 137047982.0, + "step": 40280 + }, + { + "epoch": 0.40437191376610865, + "learning_rate": 0.0001191276245533743, + "loss": 0.7594, + "mean_token_accuracy": 0.7722022533416748, + "num_tokens": 137082041.0, + "step": 40290 + }, + { + "epoch": 0.4044722790959091, + "learning_rate": 0.00011910755148741419, + "loss": 0.7481, + "mean_token_accuracy": 0.7727467536926269, + "num_tokens": 137115503.0, + "step": 40300 + }, + { + "epoch": 0.40457264442570956, + "learning_rate": 0.00011908747842145408, + "loss": 0.7504, + "mean_token_accuracy": 0.7831682920455932, + "num_tokens": 137149409.0, + "step": 40310 + }, + { + "epoch": 0.40467300975551007, + "learning_rate": 0.00011906740535549401, + "loss": 0.7785, + "mean_token_accuracy": 0.7700968325138092, + "num_tokens": 137182906.0, + "step": 40320 + }, + { + "epoch": 0.4047733750853105, + "learning_rate": 0.0001190473322895339, + "loss": 0.7391, + "mean_token_accuracy": 0.7785880506038666, + "num_tokens": 137216828.0, + "step": 40330 + }, + { + "epoch": 0.404873740415111, + "learning_rate": 0.00011902725922357381, + "loss": 0.7575, + "mean_token_accuracy": 0.7717571794986725, + "num_tokens": 137251433.0, + "step": 40340 + }, + { + "epoch": 0.4049741057449115, + "learning_rate": 0.00011900718615761373, + "loss": 0.7589, + "mean_token_accuracy": 0.7681475281715393, + "num_tokens": 137285818.0, + "step": 40350 + }, + { + "epoch": 0.40507447107471195, + "learning_rate": 0.00011898711309165363, + "loss": 0.7513, + "mean_token_accuracy": 0.7803711235523224, + "num_tokens": 137320567.0, + "step": 40360 + }, + { + "epoch": 0.4051748364045124, + "learning_rate": 0.00011896704002569352, + "loss": 0.7594, + "mean_token_accuracy": 0.7707147121429443, + "num_tokens": 137354244.0, + "step": 40370 + }, + { + "epoch": 0.4052752017343129, + "learning_rate": 0.00011894696695973344, + "loss": 0.7487, + "mean_token_accuracy": 0.7731487333774567, + "num_tokens": 137387920.0, + "step": 40380 + }, + { + "epoch": 0.4053755670641134, + "learning_rate": 0.00011892689389377334, + "loss": 0.7619, + "mean_token_accuracy": 0.7695264756679535, + "num_tokens": 137422308.0, + "step": 40390 + }, + { + "epoch": 0.40547593239391383, + "learning_rate": 0.00011890682082781323, + "loss": 0.7775, + "mean_token_accuracy": 0.7670171678066253, + "num_tokens": 137456020.0, + "step": 40400 + }, + { + "epoch": 0.40557629772371434, + "learning_rate": 0.00011888674776185316, + "loss": 0.747, + "mean_token_accuracy": 0.7790325105190277, + "num_tokens": 137490571.0, + "step": 40410 + }, + { + "epoch": 0.4056766630535148, + "learning_rate": 0.00011886667469589305, + "loss": 0.7544, + "mean_token_accuracy": 0.7761958301067352, + "num_tokens": 137525331.0, + "step": 40420 + }, + { + "epoch": 0.40577702838331525, + "learning_rate": 0.00011884660162993295, + "loss": 0.7316, + "mean_token_accuracy": 0.7793192148208619, + "num_tokens": 137559540.0, + "step": 40430 + }, + { + "epoch": 0.40587739371311576, + "learning_rate": 0.00011882652856397287, + "loss": 0.7504, + "mean_token_accuracy": 0.770765197277069, + "num_tokens": 137593641.0, + "step": 40440 + }, + { + "epoch": 0.4059777590429162, + "learning_rate": 0.00011880645549801278, + "loss": 0.753, + "mean_token_accuracy": 0.7740166127681732, + "num_tokens": 137627269.0, + "step": 40450 + }, + { + "epoch": 0.4060781243727167, + "learning_rate": 0.00011878638243205267, + "loss": 0.7394, + "mean_token_accuracy": 0.7752980709075927, + "num_tokens": 137661338.0, + "step": 40460 + }, + { + "epoch": 0.4061784897025172, + "learning_rate": 0.00011876630936609259, + "loss": 0.7388, + "mean_token_accuracy": 0.7813899517059326, + "num_tokens": 137695734.0, + "step": 40470 + }, + { + "epoch": 0.40627885503231764, + "learning_rate": 0.00011874623630013249, + "loss": 0.7262, + "mean_token_accuracy": 0.7795300543308258, + "num_tokens": 137729585.0, + "step": 40480 + }, + { + "epoch": 0.4063792203621181, + "learning_rate": 0.00011872616323417238, + "loss": 0.7736, + "mean_token_accuracy": 0.7737720370292663, + "num_tokens": 137763600.0, + "step": 40490 + }, + { + "epoch": 0.4064795856919186, + "learning_rate": 0.0001187060901682123, + "loss": 0.7486, + "mean_token_accuracy": 0.7761506915092469, + "num_tokens": 137797753.0, + "step": 40500 + }, + { + "epoch": 0.40657995102171907, + "learning_rate": 0.0001186860171022522, + "loss": 0.7748, + "mean_token_accuracy": 0.7699367046356201, + "num_tokens": 137831717.0, + "step": 40510 + }, + { + "epoch": 0.4066803163515195, + "learning_rate": 0.0001186659440362921, + "loss": 0.7444, + "mean_token_accuracy": 0.7797233581542968, + "num_tokens": 137865259.0, + "step": 40520 + }, + { + "epoch": 0.40678068168132, + "learning_rate": 0.00011864587097033202, + "loss": 0.774, + "mean_token_accuracy": 0.770091712474823, + "num_tokens": 137898475.0, + "step": 40530 + }, + { + "epoch": 0.4068810470111205, + "learning_rate": 0.00011862579790437191, + "loss": 0.7355, + "mean_token_accuracy": 0.7780645191669464, + "num_tokens": 137931714.0, + "step": 40540 + }, + { + "epoch": 0.40698141234092094, + "learning_rate": 0.00011860572483841183, + "loss": 0.7782, + "mean_token_accuracy": 0.7742593169212342, + "num_tokens": 137965370.0, + "step": 40550 + }, + { + "epoch": 0.4070817776707214, + "learning_rate": 0.00011858565177245173, + "loss": 0.7656, + "mean_token_accuracy": 0.7720534443855286, + "num_tokens": 138000108.0, + "step": 40560 + }, + { + "epoch": 0.4071821430005219, + "learning_rate": 0.00011856557870649164, + "loss": 0.778, + "mean_token_accuracy": 0.7693661630153656, + "num_tokens": 138033795.0, + "step": 40570 + }, + { + "epoch": 0.40728250833032237, + "learning_rate": 0.00011854550564053154, + "loss": 0.7438, + "mean_token_accuracy": 0.7773890793323517, + "num_tokens": 138067536.0, + "step": 40580 + }, + { + "epoch": 0.4073828736601228, + "learning_rate": 0.00011852543257457145, + "loss": 0.7743, + "mean_token_accuracy": 0.7715484380722046, + "num_tokens": 138101544.0, + "step": 40590 + }, + { + "epoch": 0.40748323898992334, + "learning_rate": 0.00011850535950861135, + "loss": 0.7064, + "mean_token_accuracy": 0.7851023733615875, + "num_tokens": 138135285.0, + "step": 40600 + }, + { + "epoch": 0.4075836043197238, + "learning_rate": 0.00011848528644265127, + "loss": 0.7476, + "mean_token_accuracy": 0.7710342526435852, + "num_tokens": 138170031.0, + "step": 40610 + }, + { + "epoch": 0.40768396964952425, + "learning_rate": 0.00011846521337669117, + "loss": 0.7515, + "mean_token_accuracy": 0.7754992127418519, + "num_tokens": 138204338.0, + "step": 40620 + }, + { + "epoch": 0.40778433497932476, + "learning_rate": 0.00011844514031073106, + "loss": 0.7358, + "mean_token_accuracy": 0.7735447943210602, + "num_tokens": 138238926.0, + "step": 40630 + }, + { + "epoch": 0.4078847003091252, + "learning_rate": 0.00011842506724477098, + "loss": 0.7565, + "mean_token_accuracy": 0.7683779120445251, + "num_tokens": 138273083.0, + "step": 40640 + }, + { + "epoch": 0.40798506563892567, + "learning_rate": 0.00011840499417881088, + "loss": 0.7102, + "mean_token_accuracy": 0.7821719765663147, + "num_tokens": 138307340.0, + "step": 40650 + }, + { + "epoch": 0.4080854309687262, + "learning_rate": 0.00011838492111285077, + "loss": 0.7406, + "mean_token_accuracy": 0.7764710009098053, + "num_tokens": 138341334.0, + "step": 40660 + }, + { + "epoch": 0.40818579629852664, + "learning_rate": 0.0001183648480468907, + "loss": 0.7235, + "mean_token_accuracy": 0.7790306329727172, + "num_tokens": 138375579.0, + "step": 40670 + }, + { + "epoch": 0.4082861616283271, + "learning_rate": 0.00011834477498093059, + "loss": 0.7573, + "mean_token_accuracy": 0.7704456508159637, + "num_tokens": 138409339.0, + "step": 40680 + }, + { + "epoch": 0.4083865269581276, + "learning_rate": 0.0001183247019149705, + "loss": 0.7631, + "mean_token_accuracy": 0.7724515259265899, + "num_tokens": 138443032.0, + "step": 40690 + }, + { + "epoch": 0.40848689228792806, + "learning_rate": 0.00011830462884901042, + "loss": 0.7234, + "mean_token_accuracy": 0.7780615448951721, + "num_tokens": 138477905.0, + "step": 40700 + }, + { + "epoch": 0.4085872576177285, + "learning_rate": 0.00011828455578305031, + "loss": 0.7823, + "mean_token_accuracy": 0.7687849044799805, + "num_tokens": 138512803.0, + "step": 40710 + }, + { + "epoch": 0.40868762294752903, + "learning_rate": 0.00011826448271709021, + "loss": 0.7545, + "mean_token_accuracy": 0.7672878324985504, + "num_tokens": 138547653.0, + "step": 40720 + }, + { + "epoch": 0.4087879882773295, + "learning_rate": 0.00011824440965113013, + "loss": 0.7322, + "mean_token_accuracy": 0.7838719069957734, + "num_tokens": 138582169.0, + "step": 40730 + }, + { + "epoch": 0.40888835360712994, + "learning_rate": 0.00011822433658517003, + "loss": 0.7204, + "mean_token_accuracy": 0.7826182544231415, + "num_tokens": 138616066.0, + "step": 40740 + }, + { + "epoch": 0.40898871893693045, + "learning_rate": 0.00011820426351920992, + "loss": 0.776, + "mean_token_accuracy": 0.7676548540592194, + "num_tokens": 138650305.0, + "step": 40750 + }, + { + "epoch": 0.4090890842667309, + "learning_rate": 0.00011818419045324984, + "loss": 0.7671, + "mean_token_accuracy": 0.7706285357475281, + "num_tokens": 138684542.0, + "step": 40760 + }, + { + "epoch": 0.40918944959653136, + "learning_rate": 0.00011816411738728974, + "loss": 0.7867, + "mean_token_accuracy": 0.7677037358283997, + "num_tokens": 138718245.0, + "step": 40770 + }, + { + "epoch": 0.4092898149263319, + "learning_rate": 0.00011814404432132963, + "loss": 0.7547, + "mean_token_accuracy": 0.7797528266906738, + "num_tokens": 138752264.0, + "step": 40780 + }, + { + "epoch": 0.40939018025613233, + "learning_rate": 0.00011812397125536955, + "loss": 0.7189, + "mean_token_accuracy": 0.7785382807254791, + "num_tokens": 138786166.0, + "step": 40790 + }, + { + "epoch": 0.4094905455859328, + "learning_rate": 0.00011810389818940946, + "loss": 0.7317, + "mean_token_accuracy": 0.7766336321830749, + "num_tokens": 138819757.0, + "step": 40800 + }, + { + "epoch": 0.40959091091573324, + "learning_rate": 0.00011808382512344936, + "loss": 0.7632, + "mean_token_accuracy": 0.773804223537445, + "num_tokens": 138853929.0, + "step": 40810 + }, + { + "epoch": 0.40969127624553375, + "learning_rate": 0.00011806375205748928, + "loss": 0.7371, + "mean_token_accuracy": 0.7774279773235321, + "num_tokens": 138888189.0, + "step": 40820 + }, + { + "epoch": 0.4097916415753342, + "learning_rate": 0.00011804367899152917, + "loss": 0.7831, + "mean_token_accuracy": 0.7649127542972565, + "num_tokens": 138921873.0, + "step": 40830 + }, + { + "epoch": 0.40989200690513466, + "learning_rate": 0.00011802360592556907, + "loss": 0.7893, + "mean_token_accuracy": 0.7690079867839813, + "num_tokens": 138955520.0, + "step": 40840 + }, + { + "epoch": 0.4099923722349352, + "learning_rate": 0.00011800353285960899, + "loss": 0.7455, + "mean_token_accuracy": 0.7748494923114777, + "num_tokens": 138989147.0, + "step": 40850 + }, + { + "epoch": 0.41009273756473563, + "learning_rate": 0.00011798345979364889, + "loss": 0.7563, + "mean_token_accuracy": 0.77107834815979, + "num_tokens": 139022662.0, + "step": 40860 + }, + { + "epoch": 0.4101931028945361, + "learning_rate": 0.00011796338672768878, + "loss": 0.7072, + "mean_token_accuracy": 0.7833503663539887, + "num_tokens": 139056757.0, + "step": 40870 + }, + { + "epoch": 0.4102934682243366, + "learning_rate": 0.0001179433136617287, + "loss": 0.7281, + "mean_token_accuracy": 0.7813907444477082, + "num_tokens": 139090864.0, + "step": 40880 + }, + { + "epoch": 0.41039383355413706, + "learning_rate": 0.0001179232405957686, + "loss": 0.7547, + "mean_token_accuracy": 0.7724337577819824, + "num_tokens": 139124678.0, + "step": 40890 + }, + { + "epoch": 0.4104941988839375, + "learning_rate": 0.0001179031675298085, + "loss": 0.7595, + "mean_token_accuracy": 0.7724938094615936, + "num_tokens": 139158464.0, + "step": 40900 + }, + { + "epoch": 0.410594564213738, + "learning_rate": 0.00011788309446384841, + "loss": 0.7525, + "mean_token_accuracy": 0.7783440172672271, + "num_tokens": 139192885.0, + "step": 40910 + }, + { + "epoch": 0.4106949295435385, + "learning_rate": 0.00011786302139788832, + "loss": 0.7126, + "mean_token_accuracy": 0.7847510516643524, + "num_tokens": 139227834.0, + "step": 40920 + }, + { + "epoch": 0.41079529487333893, + "learning_rate": 0.00011784294833192822, + "loss": 0.759, + "mean_token_accuracy": 0.7764720797538758, + "num_tokens": 139261774.0, + "step": 40930 + }, + { + "epoch": 0.41089566020313945, + "learning_rate": 0.00011782287526596814, + "loss": 0.7234, + "mean_token_accuracy": 0.7811742126941681, + "num_tokens": 139295678.0, + "step": 40940 + }, + { + "epoch": 0.4109960255329399, + "learning_rate": 0.00011780280220000804, + "loss": 0.7572, + "mean_token_accuracy": 0.7743043065071106, + "num_tokens": 139329327.0, + "step": 40950 + }, + { + "epoch": 0.41109639086274036, + "learning_rate": 0.00011778272913404793, + "loss": 0.7782, + "mean_token_accuracy": 0.7678183138370513, + "num_tokens": 139363631.0, + "step": 40960 + }, + { + "epoch": 0.41119675619254087, + "learning_rate": 0.00011776265606808785, + "loss": 0.7533, + "mean_token_accuracy": 0.77596116065979, + "num_tokens": 139397490.0, + "step": 40970 + }, + { + "epoch": 0.4112971215223413, + "learning_rate": 0.00011774258300212775, + "loss": 0.7351, + "mean_token_accuracy": 0.7769738376140595, + "num_tokens": 139431700.0, + "step": 40980 + }, + { + "epoch": 0.4113974868521418, + "learning_rate": 0.00011772250993616764, + "loss": 0.748, + "mean_token_accuracy": 0.7776111900806427, + "num_tokens": 139465321.0, + "step": 40990 + }, + { + "epoch": 0.4114978521819423, + "learning_rate": 0.00011770243687020756, + "loss": 0.7643, + "mean_token_accuracy": 0.7742827475070954, + "num_tokens": 139499535.0, + "step": 41000 + }, + { + "epoch": 0.41159821751174275, + "learning_rate": 0.00011768236380424746, + "loss": 0.7195, + "mean_token_accuracy": 0.7819054663181305, + "num_tokens": 139533933.0, + "step": 41010 + }, + { + "epoch": 0.4116985828415432, + "learning_rate": 0.00011766229073828737, + "loss": 0.7695, + "mean_token_accuracy": 0.767099529504776, + "num_tokens": 139568333.0, + "step": 41020 + }, + { + "epoch": 0.4117989481713437, + "learning_rate": 0.00011764221767232728, + "loss": 0.7399, + "mean_token_accuracy": 0.7762628257274627, + "num_tokens": 139602665.0, + "step": 41030 + }, + { + "epoch": 0.41189931350114417, + "learning_rate": 0.00011762214460636718, + "loss": 0.7472, + "mean_token_accuracy": 0.7746689438819885, + "num_tokens": 139636128.0, + "step": 41040 + }, + { + "epoch": 0.4119996788309446, + "learning_rate": 0.00011760207154040708, + "loss": 0.7558, + "mean_token_accuracy": 0.7738821566104889, + "num_tokens": 139669982.0, + "step": 41050 + }, + { + "epoch": 0.41210004416074514, + "learning_rate": 0.000117581998474447, + "loss": 0.7689, + "mean_token_accuracy": 0.7646086633205413, + "num_tokens": 139703713.0, + "step": 41060 + }, + { + "epoch": 0.4122004094905456, + "learning_rate": 0.0001175619254084869, + "loss": 0.7692, + "mean_token_accuracy": 0.7704572319984436, + "num_tokens": 139736886.0, + "step": 41070 + }, + { + "epoch": 0.41230077482034605, + "learning_rate": 0.00011754185234252679, + "loss": 0.7346, + "mean_token_accuracy": 0.7775911629199982, + "num_tokens": 139771723.0, + "step": 41080 + }, + { + "epoch": 0.4124011401501465, + "learning_rate": 0.00011752177927656671, + "loss": 0.7569, + "mean_token_accuracy": 0.7772452890872955, + "num_tokens": 139805498.0, + "step": 41090 + }, + { + "epoch": 0.412501505479947, + "learning_rate": 0.00011750170621060661, + "loss": 0.7485, + "mean_token_accuracy": 0.7740998506546021, + "num_tokens": 139839525.0, + "step": 41100 + }, + { + "epoch": 0.4126018708097475, + "learning_rate": 0.0001174816331446465, + "loss": 0.7457, + "mean_token_accuracy": 0.780066853761673, + "num_tokens": 139872842.0, + "step": 41110 + }, + { + "epoch": 0.41270223613954793, + "learning_rate": 0.00011746156007868642, + "loss": 0.7552, + "mean_token_accuracy": 0.7751128315925598, + "num_tokens": 139907535.0, + "step": 41120 + }, + { + "epoch": 0.41280260146934844, + "learning_rate": 0.00011744148701272632, + "loss": 0.7595, + "mean_token_accuracy": 0.7722532749176025, + "num_tokens": 139941345.0, + "step": 41130 + }, + { + "epoch": 0.4129029667991489, + "learning_rate": 0.00011742141394676624, + "loss": 0.7529, + "mean_token_accuracy": 0.7710931181907654, + "num_tokens": 139975219.0, + "step": 41140 + }, + { + "epoch": 0.41300333212894935, + "learning_rate": 0.00011740134088080615, + "loss": 0.735, + "mean_token_accuracy": 0.7752216398715973, + "num_tokens": 140008585.0, + "step": 41150 + }, + { + "epoch": 0.41310369745874986, + "learning_rate": 0.00011738126781484604, + "loss": 0.7485, + "mean_token_accuracy": 0.7801789045333862, + "num_tokens": 140042289.0, + "step": 41160 + }, + { + "epoch": 0.4132040627885503, + "learning_rate": 0.00011736119474888597, + "loss": 0.7721, + "mean_token_accuracy": 0.7664551675319672, + "num_tokens": 140076349.0, + "step": 41170 + }, + { + "epoch": 0.4133044281183508, + "learning_rate": 0.00011734112168292586, + "loss": 0.7676, + "mean_token_accuracy": 0.770530503988266, + "num_tokens": 140109969.0, + "step": 41180 + }, + { + "epoch": 0.4134047934481513, + "learning_rate": 0.00011732104861696576, + "loss": 0.7579, + "mean_token_accuracy": 0.770295524597168, + "num_tokens": 140143764.0, + "step": 41190 + }, + { + "epoch": 0.41350515877795174, + "learning_rate": 0.00011730097555100568, + "loss": 0.7432, + "mean_token_accuracy": 0.7698943912982941, + "num_tokens": 140178335.0, + "step": 41200 + }, + { + "epoch": 0.4136055241077522, + "learning_rate": 0.00011728090248504557, + "loss": 0.7667, + "mean_token_accuracy": 0.7745707631111145, + "num_tokens": 140212049.0, + "step": 41210 + }, + { + "epoch": 0.4137058894375527, + "learning_rate": 0.00011726082941908547, + "loss": 0.7257, + "mean_token_accuracy": 0.7812729001045227, + "num_tokens": 140246142.0, + "step": 41220 + }, + { + "epoch": 0.41380625476735317, + "learning_rate": 0.00011724075635312539, + "loss": 0.7532, + "mean_token_accuracy": 0.7762118577957153, + "num_tokens": 140280003.0, + "step": 41230 + }, + { + "epoch": 0.4139066200971536, + "learning_rate": 0.00011722068328716528, + "loss": 0.7666, + "mean_token_accuracy": 0.7742089807987214, + "num_tokens": 140314210.0, + "step": 41240 + }, + { + "epoch": 0.41400698542695413, + "learning_rate": 0.0001172006102212052, + "loss": 0.7632, + "mean_token_accuracy": 0.7702260375022888, + "num_tokens": 140347757.0, + "step": 41250 + }, + { + "epoch": 0.4141073507567546, + "learning_rate": 0.0001171805371552451, + "loss": 0.7531, + "mean_token_accuracy": 0.7715366303920745, + "num_tokens": 140382109.0, + "step": 41260 + }, + { + "epoch": 0.41420771608655504, + "learning_rate": 0.00011716046408928501, + "loss": 0.7936, + "mean_token_accuracy": 0.7636014819145203, + "num_tokens": 140415812.0, + "step": 41270 + }, + { + "epoch": 0.41430808141635556, + "learning_rate": 0.0001171403910233249, + "loss": 0.7159, + "mean_token_accuracy": 0.7836873412132264, + "num_tokens": 140450053.0, + "step": 41280 + }, + { + "epoch": 0.414408446746156, + "learning_rate": 0.00011712031795736483, + "loss": 0.7702, + "mean_token_accuracy": 0.7716418683528901, + "num_tokens": 140484340.0, + "step": 41290 + }, + { + "epoch": 0.41450881207595647, + "learning_rate": 0.00011710024489140472, + "loss": 0.7392, + "mean_token_accuracy": 0.7766879677772522, + "num_tokens": 140518537.0, + "step": 41300 + }, + { + "epoch": 0.414609177405757, + "learning_rate": 0.00011708017182544462, + "loss": 0.778, + "mean_token_accuracy": 0.7727922677993775, + "num_tokens": 140552468.0, + "step": 41310 + }, + { + "epoch": 0.41470954273555743, + "learning_rate": 0.00011706009875948454, + "loss": 0.727, + "mean_token_accuracy": 0.7849180281162262, + "num_tokens": 140586845.0, + "step": 41320 + }, + { + "epoch": 0.4148099080653579, + "learning_rate": 0.00011704002569352443, + "loss": 0.7367, + "mean_token_accuracy": 0.780201518535614, + "num_tokens": 140620594.0, + "step": 41330 + }, + { + "epoch": 0.4149102733951584, + "learning_rate": 0.00011701995262756433, + "loss": 0.774, + "mean_token_accuracy": 0.7677059173583984, + "num_tokens": 140655350.0, + "step": 41340 + }, + { + "epoch": 0.41501063872495886, + "learning_rate": 0.00011699987956160425, + "loss": 0.7329, + "mean_token_accuracy": 0.7847771227359772, + "num_tokens": 140689492.0, + "step": 41350 + }, + { + "epoch": 0.4151110040547593, + "learning_rate": 0.00011697980649564415, + "loss": 0.7356, + "mean_token_accuracy": 0.7767213582992554, + "num_tokens": 140723377.0, + "step": 41360 + }, + { + "epoch": 0.4152113693845598, + "learning_rate": 0.00011695973342968405, + "loss": 0.7261, + "mean_token_accuracy": 0.7769228696823121, + "num_tokens": 140757454.0, + "step": 41370 + }, + { + "epoch": 0.4153117347143603, + "learning_rate": 0.00011693966036372396, + "loss": 0.7702, + "mean_token_accuracy": 0.772264164686203, + "num_tokens": 140791467.0, + "step": 41380 + }, + { + "epoch": 0.41541210004416074, + "learning_rate": 0.00011691958729776387, + "loss": 0.7376, + "mean_token_accuracy": 0.7786181330680847, + "num_tokens": 140826132.0, + "step": 41390 + }, + { + "epoch": 0.4155124653739612, + "learning_rate": 0.00011689951423180377, + "loss": 0.7479, + "mean_token_accuracy": 0.7768079102039337, + "num_tokens": 140860422.0, + "step": 41400 + }, + { + "epoch": 0.4156128307037617, + "learning_rate": 0.00011687944116584369, + "loss": 0.7605, + "mean_token_accuracy": 0.7711485028266907, + "num_tokens": 140894125.0, + "step": 41410 + }, + { + "epoch": 0.41571319603356216, + "learning_rate": 0.00011685936809988358, + "loss": 0.7507, + "mean_token_accuracy": 0.7740625619888306, + "num_tokens": 140927887.0, + "step": 41420 + }, + { + "epoch": 0.4158135613633626, + "learning_rate": 0.00011683929503392348, + "loss": 0.7538, + "mean_token_accuracy": 0.7745043277740479, + "num_tokens": 140962183.0, + "step": 41430 + }, + { + "epoch": 0.4159139266931631, + "learning_rate": 0.0001168192219679634, + "loss": 0.7283, + "mean_token_accuracy": 0.7818750143051147, + "num_tokens": 140996523.0, + "step": 41440 + }, + { + "epoch": 0.4160142920229636, + "learning_rate": 0.0001167991489020033, + "loss": 0.7458, + "mean_token_accuracy": 0.7724709391593934, + "num_tokens": 141030741.0, + "step": 41450 + }, + { + "epoch": 0.41611465735276404, + "learning_rate": 0.00011677907583604319, + "loss": 0.7401, + "mean_token_accuracy": 0.7825262606143951, + "num_tokens": 141065439.0, + "step": 41460 + }, + { + "epoch": 0.41621502268256455, + "learning_rate": 0.00011675900277008311, + "loss": 0.7559, + "mean_token_accuracy": 0.7768517851829528, + "num_tokens": 141098789.0, + "step": 41470 + }, + { + "epoch": 0.416315388012365, + "learning_rate": 0.000116738929704123, + "loss": 0.7173, + "mean_token_accuracy": 0.7819433808326721, + "num_tokens": 141132998.0, + "step": 41480 + }, + { + "epoch": 0.41641575334216546, + "learning_rate": 0.00011671885663816291, + "loss": 0.7531, + "mean_token_accuracy": 0.7756395041942596, + "num_tokens": 141167153.0, + "step": 41490 + }, + { + "epoch": 0.416516118671966, + "learning_rate": 0.00011669878357220284, + "loss": 0.7353, + "mean_token_accuracy": 0.7808833479881286, + "num_tokens": 141201802.0, + "step": 41500 + }, + { + "epoch": 0.41661648400176643, + "learning_rate": 0.00011667871050624273, + "loss": 0.7476, + "mean_token_accuracy": 0.7750447750091553, + "num_tokens": 141235160.0, + "step": 41510 + }, + { + "epoch": 0.4167168493315669, + "learning_rate": 0.00011665863744028263, + "loss": 0.7626, + "mean_token_accuracy": 0.7666607677936554, + "num_tokens": 141269775.0, + "step": 41520 + }, + { + "epoch": 0.4168172146613674, + "learning_rate": 0.00011663856437432255, + "loss": 0.7793, + "mean_token_accuracy": 0.7676746845245361, + "num_tokens": 141304175.0, + "step": 41530 + }, + { + "epoch": 0.41691757999116785, + "learning_rate": 0.00011661849130836244, + "loss": 0.7443, + "mean_token_accuracy": 0.7779941499233246, + "num_tokens": 141338306.0, + "step": 41540 + }, + { + "epoch": 0.4170179453209683, + "learning_rate": 0.00011659841824240234, + "loss": 0.7634, + "mean_token_accuracy": 0.7654629826545716, + "num_tokens": 141371972.0, + "step": 41550 + }, + { + "epoch": 0.4171183106507688, + "learning_rate": 0.00011657834517644226, + "loss": 0.7736, + "mean_token_accuracy": 0.7669499337673187, + "num_tokens": 141405702.0, + "step": 41560 + }, + { + "epoch": 0.4172186759805693, + "learning_rate": 0.00011655827211048215, + "loss": 0.7295, + "mean_token_accuracy": 0.7826376080513, + "num_tokens": 141439029.0, + "step": 41570 + }, + { + "epoch": 0.41731904131036973, + "learning_rate": 0.00011653819904452205, + "loss": 0.7786, + "mean_token_accuracy": 0.7668355464935303, + "num_tokens": 141473522.0, + "step": 41580 + }, + { + "epoch": 0.41741940664017024, + "learning_rate": 0.00011651812597856197, + "loss": 0.7544, + "mean_token_accuracy": 0.7743890285491943, + "num_tokens": 141507059.0, + "step": 41590 + }, + { + "epoch": 0.4175197719699707, + "learning_rate": 0.00011649805291260188, + "loss": 0.7769, + "mean_token_accuracy": 0.7657489776611328, + "num_tokens": 141541134.0, + "step": 41600 + }, + { + "epoch": 0.41762013729977115, + "learning_rate": 0.00011647797984664177, + "loss": 0.7359, + "mean_token_accuracy": 0.7797170877456665, + "num_tokens": 141575496.0, + "step": 41610 + }, + { + "epoch": 0.41772050262957167, + "learning_rate": 0.0001164579067806817, + "loss": 0.7759, + "mean_token_accuracy": 0.7683320343494415, + "num_tokens": 141610575.0, + "step": 41620 + }, + { + "epoch": 0.4178208679593721, + "learning_rate": 0.00011643783371472159, + "loss": 0.7502, + "mean_token_accuracy": 0.7801962435245514, + "num_tokens": 141645224.0, + "step": 41630 + }, + { + "epoch": 0.4179212332891726, + "learning_rate": 0.00011641776064876149, + "loss": 0.7639, + "mean_token_accuracy": 0.770879864692688, + "num_tokens": 141679721.0, + "step": 41640 + }, + { + "epoch": 0.4180215986189731, + "learning_rate": 0.00011639768758280141, + "loss": 0.7467, + "mean_token_accuracy": 0.779033613204956, + "num_tokens": 141713432.0, + "step": 41650 + }, + { + "epoch": 0.41812196394877355, + "learning_rate": 0.0001163776145168413, + "loss": 0.7842, + "mean_token_accuracy": 0.7664332866668702, + "num_tokens": 141747915.0, + "step": 41660 + }, + { + "epoch": 0.418222329278574, + "learning_rate": 0.0001163575414508812, + "loss": 0.7438, + "mean_token_accuracy": 0.7792607843875885, + "num_tokens": 141781878.0, + "step": 41670 + }, + { + "epoch": 0.41832269460837446, + "learning_rate": 0.00011633746838492112, + "loss": 0.7458, + "mean_token_accuracy": 0.7750950932502747, + "num_tokens": 141815215.0, + "step": 41680 + }, + { + "epoch": 0.41842305993817497, + "learning_rate": 0.00011631739531896102, + "loss": 0.7032, + "mean_token_accuracy": 0.7843857049942017, + "num_tokens": 141849495.0, + "step": 41690 + }, + { + "epoch": 0.4185234252679754, + "learning_rate": 0.00011629732225300094, + "loss": 0.755, + "mean_token_accuracy": 0.776856005191803, + "num_tokens": 141883598.0, + "step": 41700 + }, + { + "epoch": 0.4186237905977759, + "learning_rate": 0.00011627724918704083, + "loss": 0.7578, + "mean_token_accuracy": 0.7720408916473389, + "num_tokens": 141917319.0, + "step": 41710 + }, + { + "epoch": 0.4187241559275764, + "learning_rate": 0.00011625717612108074, + "loss": 0.77, + "mean_token_accuracy": 0.775605422258377, + "num_tokens": 141951575.0, + "step": 41720 + }, + { + "epoch": 0.41882452125737685, + "learning_rate": 0.00011623710305512065, + "loss": 0.7508, + "mean_token_accuracy": 0.7744235992431641, + "num_tokens": 141985525.0, + "step": 41730 + }, + { + "epoch": 0.4189248865871773, + "learning_rate": 0.00011621702998916056, + "loss": 0.7493, + "mean_token_accuracy": 0.7771193206310272, + "num_tokens": 142018386.0, + "step": 41740 + }, + { + "epoch": 0.4190252519169778, + "learning_rate": 0.00011619695692320045, + "loss": 0.7218, + "mean_token_accuracy": 0.7799361944198608, + "num_tokens": 142053318.0, + "step": 41750 + }, + { + "epoch": 0.41912561724677827, + "learning_rate": 0.00011617688385724037, + "loss": 0.7374, + "mean_token_accuracy": 0.7763052105903625, + "num_tokens": 142087398.0, + "step": 41760 + }, + { + "epoch": 0.4192259825765787, + "learning_rate": 0.00011615681079128027, + "loss": 0.7316, + "mean_token_accuracy": 0.7780951380729675, + "num_tokens": 142122626.0, + "step": 41770 + }, + { + "epoch": 0.41932634790637924, + "learning_rate": 0.00011613673772532016, + "loss": 0.7343, + "mean_token_accuracy": 0.7779183864593506, + "num_tokens": 142156233.0, + "step": 41780 + }, + { + "epoch": 0.4194267132361797, + "learning_rate": 0.00011611666465936009, + "loss": 0.7527, + "mean_token_accuracy": 0.7760959804058075, + "num_tokens": 142190636.0, + "step": 41790 + }, + { + "epoch": 0.41952707856598015, + "learning_rate": 0.00011609659159339998, + "loss": 0.7405, + "mean_token_accuracy": 0.7813480198383331, + "num_tokens": 142224812.0, + "step": 41800 + }, + { + "epoch": 0.41962744389578066, + "learning_rate": 0.00011607651852743988, + "loss": 0.7321, + "mean_token_accuracy": 0.7838366448879241, + "num_tokens": 142258952.0, + "step": 41810 + }, + { + "epoch": 0.4197278092255811, + "learning_rate": 0.0001160564454614798, + "loss": 0.7468, + "mean_token_accuracy": 0.7750254154205323, + "num_tokens": 142292930.0, + "step": 41820 + }, + { + "epoch": 0.4198281745553816, + "learning_rate": 0.00011603637239551969, + "loss": 0.7439, + "mean_token_accuracy": 0.7807756662368774, + "num_tokens": 142326719.0, + "step": 41830 + }, + { + "epoch": 0.4199285398851821, + "learning_rate": 0.0001160162993295596, + "loss": 0.7823, + "mean_token_accuracy": 0.7710380792617798, + "num_tokens": 142359477.0, + "step": 41840 + }, + { + "epoch": 0.42002890521498254, + "learning_rate": 0.00011599622626359952, + "loss": 0.749, + "mean_token_accuracy": 0.777097511291504, + "num_tokens": 142393997.0, + "step": 41850 + }, + { + "epoch": 0.420129270544783, + "learning_rate": 0.00011597615319763942, + "loss": 0.7514, + "mean_token_accuracy": 0.7785601139068603, + "num_tokens": 142427956.0, + "step": 41860 + }, + { + "epoch": 0.4202296358745835, + "learning_rate": 0.00011595608013167931, + "loss": 0.789, + "mean_token_accuracy": 0.7634051084518433, + "num_tokens": 142461618.0, + "step": 41870 + }, + { + "epoch": 0.42033000120438396, + "learning_rate": 0.00011593600706571923, + "loss": 0.759, + "mean_token_accuracy": 0.7732995927333832, + "num_tokens": 142495121.0, + "step": 41880 + }, + { + "epoch": 0.4204303665341844, + "learning_rate": 0.00011591593399975913, + "loss": 0.7259, + "mean_token_accuracy": 0.7791109800338745, + "num_tokens": 142529111.0, + "step": 41890 + }, + { + "epoch": 0.42053073186398493, + "learning_rate": 0.00011589586093379902, + "loss": 0.7815, + "mean_token_accuracy": 0.7657994270324707, + "num_tokens": 142562708.0, + "step": 41900 + }, + { + "epoch": 0.4206310971937854, + "learning_rate": 0.00011587578786783895, + "loss": 0.731, + "mean_token_accuracy": 0.7786415398120881, + "num_tokens": 142597009.0, + "step": 41910 + }, + { + "epoch": 0.42073146252358584, + "learning_rate": 0.00011585571480187884, + "loss": 0.7478, + "mean_token_accuracy": 0.7720061779022217, + "num_tokens": 142629882.0, + "step": 41920 + }, + { + "epoch": 0.42083182785338635, + "learning_rate": 0.00011583564173591874, + "loss": 0.728, + "mean_token_accuracy": 0.7804020464420318, + "num_tokens": 142663262.0, + "step": 41930 + }, + { + "epoch": 0.4209321931831868, + "learning_rate": 0.00011581556866995866, + "loss": 0.7389, + "mean_token_accuracy": 0.7790018320083618, + "num_tokens": 142697552.0, + "step": 41940 + }, + { + "epoch": 0.42103255851298726, + "learning_rate": 0.00011579549560399857, + "loss": 0.7374, + "mean_token_accuracy": 0.780879122018814, + "num_tokens": 142731175.0, + "step": 41950 + }, + { + "epoch": 0.4211329238427877, + "learning_rate": 0.00011577542253803846, + "loss": 0.7553, + "mean_token_accuracy": 0.7732527136802674, + "num_tokens": 142766072.0, + "step": 41960 + }, + { + "epoch": 0.42123328917258823, + "learning_rate": 0.00011575534947207838, + "loss": 0.7663, + "mean_token_accuracy": 0.7731917262077331, + "num_tokens": 142800031.0, + "step": 41970 + }, + { + "epoch": 0.4213336545023887, + "learning_rate": 0.00011573527640611828, + "loss": 0.7428, + "mean_token_accuracy": 0.7734259366989136, + "num_tokens": 142832827.0, + "step": 41980 + }, + { + "epoch": 0.42143401983218914, + "learning_rate": 0.00011571520334015817, + "loss": 0.7529, + "mean_token_accuracy": 0.7777356564998626, + "num_tokens": 142866975.0, + "step": 41990 + }, + { + "epoch": 0.42153438516198966, + "learning_rate": 0.0001156951302741981, + "loss": 0.7223, + "mean_token_accuracy": 0.7811121463775634, + "num_tokens": 142900069.0, + "step": 42000 + }, + { + "epoch": 0.4216347504917901, + "learning_rate": 0.00011567505720823799, + "loss": 0.7568, + "mean_token_accuracy": 0.7768263280391693, + "num_tokens": 142933803.0, + "step": 42010 + }, + { + "epoch": 0.42173511582159057, + "learning_rate": 0.00011565498414227789, + "loss": 0.7739, + "mean_token_accuracy": 0.7687878906726837, + "num_tokens": 142968125.0, + "step": 42020 + }, + { + "epoch": 0.4218354811513911, + "learning_rate": 0.00011563491107631781, + "loss": 0.7476, + "mean_token_accuracy": 0.7753892004489898, + "num_tokens": 143002152.0, + "step": 42030 + }, + { + "epoch": 0.42193584648119153, + "learning_rate": 0.0001156148380103577, + "loss": 0.7615, + "mean_token_accuracy": 0.768572723865509, + "num_tokens": 143036434.0, + "step": 42040 + }, + { + "epoch": 0.422036211810992, + "learning_rate": 0.00011559476494439761, + "loss": 0.7378, + "mean_token_accuracy": 0.7769821345806122, + "num_tokens": 143070746.0, + "step": 42050 + }, + { + "epoch": 0.4221365771407925, + "learning_rate": 0.00011557469187843752, + "loss": 0.7258, + "mean_token_accuracy": 0.7808934569358825, + "num_tokens": 143103651.0, + "step": 42060 + }, + { + "epoch": 0.42223694247059296, + "learning_rate": 0.00011555461881247743, + "loss": 0.7374, + "mean_token_accuracy": 0.7748523354530334, + "num_tokens": 143137910.0, + "step": 42070 + }, + { + "epoch": 0.4223373078003934, + "learning_rate": 0.00011553454574651732, + "loss": 0.7479, + "mean_token_accuracy": 0.7740685045719147, + "num_tokens": 143171565.0, + "step": 42080 + }, + { + "epoch": 0.4224376731301939, + "learning_rate": 0.00011551447268055724, + "loss": 0.7599, + "mean_token_accuracy": 0.7703144967555999, + "num_tokens": 143205989.0, + "step": 42090 + }, + { + "epoch": 0.4225380384599944, + "learning_rate": 0.00011549439961459714, + "loss": 0.7799, + "mean_token_accuracy": 0.7680784404277802, + "num_tokens": 143240141.0, + "step": 42100 + }, + { + "epoch": 0.42263840378979484, + "learning_rate": 0.00011547432654863703, + "loss": 0.7363, + "mean_token_accuracy": 0.777568644285202, + "num_tokens": 143275019.0, + "step": 42110 + }, + { + "epoch": 0.42273876911959535, + "learning_rate": 0.00011545425348267696, + "loss": 0.7591, + "mean_token_accuracy": 0.7781234681606293, + "num_tokens": 143309493.0, + "step": 42120 + }, + { + "epoch": 0.4228391344493958, + "learning_rate": 0.00011543418041671685, + "loss": 0.7544, + "mean_token_accuracy": 0.7739103138446808, + "num_tokens": 143343264.0, + "step": 42130 + }, + { + "epoch": 0.42293949977919626, + "learning_rate": 0.00011541410735075675, + "loss": 0.7663, + "mean_token_accuracy": 0.7781742632389068, + "num_tokens": 143376970.0, + "step": 42140 + }, + { + "epoch": 0.42303986510899677, + "learning_rate": 0.00011539403428479667, + "loss": 0.7552, + "mean_token_accuracy": 0.7751582503318787, + "num_tokens": 143410449.0, + "step": 42150 + }, + { + "epoch": 0.4231402304387972, + "learning_rate": 0.00011537396121883656, + "loss": 0.7557, + "mean_token_accuracy": 0.7700955033302307, + "num_tokens": 143444118.0, + "step": 42160 + }, + { + "epoch": 0.4232405957685977, + "learning_rate": 0.00011535388815287647, + "loss": 0.7375, + "mean_token_accuracy": 0.771321439743042, + "num_tokens": 143477535.0, + "step": 42170 + }, + { + "epoch": 0.4233409610983982, + "learning_rate": 0.00011533381508691638, + "loss": 0.7311, + "mean_token_accuracy": 0.777759313583374, + "num_tokens": 143511652.0, + "step": 42180 + }, + { + "epoch": 0.42344132642819865, + "learning_rate": 0.00011531374202095629, + "loss": 0.7553, + "mean_token_accuracy": 0.7791213870048523, + "num_tokens": 143545525.0, + "step": 42190 + }, + { + "epoch": 0.4235416917579991, + "learning_rate": 0.00011529366895499618, + "loss": 0.7633, + "mean_token_accuracy": 0.7726755797863006, + "num_tokens": 143579727.0, + "step": 42200 + }, + { + "epoch": 0.4236420570877996, + "learning_rate": 0.0001152735958890361, + "loss": 0.7438, + "mean_token_accuracy": 0.7750461578369141, + "num_tokens": 143614240.0, + "step": 42210 + }, + { + "epoch": 0.4237424224176001, + "learning_rate": 0.000115253522823076, + "loss": 0.7529, + "mean_token_accuracy": 0.7775866985321045, + "num_tokens": 143647665.0, + "step": 42220 + }, + { + "epoch": 0.42384278774740053, + "learning_rate": 0.0001152334497571159, + "loss": 0.7472, + "mean_token_accuracy": 0.7775680303573609, + "num_tokens": 143681430.0, + "step": 42230 + }, + { + "epoch": 0.423943153077201, + "learning_rate": 0.00011521337669115582, + "loss": 0.7568, + "mean_token_accuracy": 0.77844118475914, + "num_tokens": 143715338.0, + "step": 42240 + }, + { + "epoch": 0.4240435184070015, + "learning_rate": 0.00011519330362519571, + "loss": 0.782, + "mean_token_accuracy": 0.7664641857147216, + "num_tokens": 143750014.0, + "step": 42250 + }, + { + "epoch": 0.42414388373680195, + "learning_rate": 0.00011517323055923563, + "loss": 0.7461, + "mean_token_accuracy": 0.7792369246482849, + "num_tokens": 143784996.0, + "step": 42260 + }, + { + "epoch": 0.4242442490666024, + "learning_rate": 0.00011515315749327553, + "loss": 0.7664, + "mean_token_accuracy": 0.7747955799102784, + "num_tokens": 143819719.0, + "step": 42270 + }, + { + "epoch": 0.4243446143964029, + "learning_rate": 0.00011513308442731542, + "loss": 0.7531, + "mean_token_accuracy": 0.7744141519069672, + "num_tokens": 143853169.0, + "step": 42280 + }, + { + "epoch": 0.4244449797262034, + "learning_rate": 0.00011511301136135535, + "loss": 0.7568, + "mean_token_accuracy": 0.7710319399833679, + "num_tokens": 143886625.0, + "step": 42290 + }, + { + "epoch": 0.42454534505600383, + "learning_rate": 0.00011509293829539525, + "loss": 0.7635, + "mean_token_accuracy": 0.7699625313282012, + "num_tokens": 143920842.0, + "step": 42300 + }, + { + "epoch": 0.42464571038580434, + "learning_rate": 0.00011507286522943515, + "loss": 0.7649, + "mean_token_accuracy": 0.769263744354248, + "num_tokens": 143954610.0, + "step": 42310 + }, + { + "epoch": 0.4247460757156048, + "learning_rate": 0.00011505279216347507, + "loss": 0.7878, + "mean_token_accuracy": 0.7658296942710876, + "num_tokens": 143988125.0, + "step": 42320 + }, + { + "epoch": 0.42484644104540525, + "learning_rate": 0.00011503271909751497, + "loss": 0.7302, + "mean_token_accuracy": 0.7820160806179046, + "num_tokens": 144022118.0, + "step": 42330 + }, + { + "epoch": 0.42494680637520577, + "learning_rate": 0.00011501264603155486, + "loss": 0.768, + "mean_token_accuracy": 0.7747110068798065, + "num_tokens": 144057330.0, + "step": 42340 + }, + { + "epoch": 0.4250471717050062, + "learning_rate": 0.00011499257296559478, + "loss": 0.7311, + "mean_token_accuracy": 0.7816978096961975, + "num_tokens": 144091710.0, + "step": 42350 + }, + { + "epoch": 0.4251475370348067, + "learning_rate": 0.00011497249989963468, + "loss": 0.7477, + "mean_token_accuracy": 0.7742366671562195, + "num_tokens": 144125285.0, + "step": 42360 + }, + { + "epoch": 0.4252479023646072, + "learning_rate": 0.00011495242683367457, + "loss": 0.7863, + "mean_token_accuracy": 0.769205504655838, + "num_tokens": 144159023.0, + "step": 42370 + }, + { + "epoch": 0.42534826769440764, + "learning_rate": 0.0001149323537677145, + "loss": 0.7348, + "mean_token_accuracy": 0.7731286525726319, + "num_tokens": 144193543.0, + "step": 42380 + }, + { + "epoch": 0.4254486330242081, + "learning_rate": 0.00011491228070175439, + "loss": 0.752, + "mean_token_accuracy": 0.7733675420284272, + "num_tokens": 144227794.0, + "step": 42390 + }, + { + "epoch": 0.4255489983540086, + "learning_rate": 0.0001148922076357943, + "loss": 0.7608, + "mean_token_accuracy": 0.7742749333381653, + "num_tokens": 144261510.0, + "step": 42400 + }, + { + "epoch": 0.42564936368380907, + "learning_rate": 0.0001148721345698342, + "loss": 0.7561, + "mean_token_accuracy": 0.7709795594215393, + "num_tokens": 144295409.0, + "step": 42410 + }, + { + "epoch": 0.4257497290136095, + "learning_rate": 0.00011485206150387411, + "loss": 0.7287, + "mean_token_accuracy": 0.7776812016963959, + "num_tokens": 144328163.0, + "step": 42420 + }, + { + "epoch": 0.42585009434341003, + "learning_rate": 0.00011483198843791401, + "loss": 0.791, + "mean_token_accuracy": 0.7648392498493195, + "num_tokens": 144362159.0, + "step": 42430 + }, + { + "epoch": 0.4259504596732105, + "learning_rate": 0.00011481191537195393, + "loss": 0.7614, + "mean_token_accuracy": 0.7748533010482788, + "num_tokens": 144396163.0, + "step": 42440 + }, + { + "epoch": 0.42605082500301095, + "learning_rate": 0.00011479184230599383, + "loss": 0.7505, + "mean_token_accuracy": 0.7726286232471467, + "num_tokens": 144429723.0, + "step": 42450 + }, + { + "epoch": 0.42615119033281146, + "learning_rate": 0.00011477176924003372, + "loss": 0.7231, + "mean_token_accuracy": 0.7830985367298127, + "num_tokens": 144463855.0, + "step": 42460 + }, + { + "epoch": 0.4262515556626119, + "learning_rate": 0.00011475169617407364, + "loss": 0.7471, + "mean_token_accuracy": 0.777648288011551, + "num_tokens": 144497794.0, + "step": 42470 + }, + { + "epoch": 0.42635192099241237, + "learning_rate": 0.00011473162310811354, + "loss": 0.7313, + "mean_token_accuracy": 0.7775257229804993, + "num_tokens": 144531243.0, + "step": 42480 + }, + { + "epoch": 0.4264522863222129, + "learning_rate": 0.00011471155004215343, + "loss": 0.762, + "mean_token_accuracy": 0.7685877799987793, + "num_tokens": 144564993.0, + "step": 42490 + }, + { + "epoch": 0.42655265165201334, + "learning_rate": 0.00011469147697619335, + "loss": 0.7743, + "mean_token_accuracy": 0.7730763196945191, + "num_tokens": 144598872.0, + "step": 42500 + }, + { + "epoch": 0.4266530169818138, + "learning_rate": 0.00011467140391023325, + "loss": 0.7407, + "mean_token_accuracy": 0.7757616639137268, + "num_tokens": 144633256.0, + "step": 42510 + }, + { + "epoch": 0.42675338231161425, + "learning_rate": 0.00011465133084427316, + "loss": 0.7642, + "mean_token_accuracy": 0.7709073722362518, + "num_tokens": 144667867.0, + "step": 42520 + }, + { + "epoch": 0.42685374764141476, + "learning_rate": 0.00011463125777831307, + "loss": 0.7775, + "mean_token_accuracy": 0.7658672034740448, + "num_tokens": 144701722.0, + "step": 42530 + }, + { + "epoch": 0.4269541129712152, + "learning_rate": 0.00011461118471235297, + "loss": 0.7499, + "mean_token_accuracy": 0.7720082879066468, + "num_tokens": 144735854.0, + "step": 42540 + }, + { + "epoch": 0.42705447830101567, + "learning_rate": 0.00011459111164639287, + "loss": 0.7797, + "mean_token_accuracy": 0.7656648099422455, + "num_tokens": 144769258.0, + "step": 42550 + }, + { + "epoch": 0.4271548436308162, + "learning_rate": 0.00011457103858043279, + "loss": 0.7564, + "mean_token_accuracy": 0.7687288165092468, + "num_tokens": 144802998.0, + "step": 42560 + }, + { + "epoch": 0.42725520896061664, + "learning_rate": 0.00011455096551447269, + "loss": 0.7779, + "mean_token_accuracy": 0.769432681798935, + "num_tokens": 144837811.0, + "step": 42570 + }, + { + "epoch": 0.4273555742904171, + "learning_rate": 0.00011453089244851258, + "loss": 0.7723, + "mean_token_accuracy": 0.774343591928482, + "num_tokens": 144871769.0, + "step": 42580 + }, + { + "epoch": 0.4274559396202176, + "learning_rate": 0.0001145108193825525, + "loss": 0.7432, + "mean_token_accuracy": 0.7731312811374664, + "num_tokens": 144905705.0, + "step": 42590 + }, + { + "epoch": 0.42755630495001806, + "learning_rate": 0.0001144907463165924, + "loss": 0.7228, + "mean_token_accuracy": 0.7832659125328064, + "num_tokens": 144939609.0, + "step": 42600 + }, + { + "epoch": 0.4276566702798185, + "learning_rate": 0.0001144706732506323, + "loss": 0.7175, + "mean_token_accuracy": 0.7817785501480102, + "num_tokens": 144974461.0, + "step": 42610 + }, + { + "epoch": 0.42775703560961903, + "learning_rate": 0.00011445060018467222, + "loss": 0.7643, + "mean_token_accuracy": 0.7768852293491364, + "num_tokens": 145008987.0, + "step": 42620 + }, + { + "epoch": 0.4278574009394195, + "learning_rate": 0.00011443052711871211, + "loss": 0.7595, + "mean_token_accuracy": 0.772595363855362, + "num_tokens": 145043081.0, + "step": 42630 + }, + { + "epoch": 0.42795776626921994, + "learning_rate": 0.00011441045405275202, + "loss": 0.7788, + "mean_token_accuracy": 0.7669863939285279, + "num_tokens": 145076597.0, + "step": 42640 + }, + { + "epoch": 0.42805813159902045, + "learning_rate": 0.00011439038098679194, + "loss": 0.7572, + "mean_token_accuracy": 0.7708061218261719, + "num_tokens": 145110220.0, + "step": 42650 + }, + { + "epoch": 0.4281584969288209, + "learning_rate": 0.00011437030792083184, + "loss": 0.7696, + "mean_token_accuracy": 0.7687025308609009, + "num_tokens": 145144375.0, + "step": 42660 + }, + { + "epoch": 0.42825886225862136, + "learning_rate": 0.00011435023485487173, + "loss": 0.7492, + "mean_token_accuracy": 0.7752351701259613, + "num_tokens": 145178694.0, + "step": 42670 + }, + { + "epoch": 0.4283592275884219, + "learning_rate": 0.00011433016178891165, + "loss": 0.746, + "mean_token_accuracy": 0.7760239541530609, + "num_tokens": 145212679.0, + "step": 42680 + }, + { + "epoch": 0.42845959291822233, + "learning_rate": 0.00011431008872295155, + "loss": 0.7762, + "mean_token_accuracy": 0.7718257665634155, + "num_tokens": 145246193.0, + "step": 42690 + }, + { + "epoch": 0.4285599582480228, + "learning_rate": 0.00011429001565699144, + "loss": 0.7614, + "mean_token_accuracy": 0.7723347902297973, + "num_tokens": 145279682.0, + "step": 42700 + }, + { + "epoch": 0.4286603235778233, + "learning_rate": 0.00011426994259103136, + "loss": 0.7197, + "mean_token_accuracy": 0.7853658556938171, + "num_tokens": 145313919.0, + "step": 42710 + }, + { + "epoch": 0.42876068890762375, + "learning_rate": 0.00011424986952507126, + "loss": 0.765, + "mean_token_accuracy": 0.7730284512043, + "num_tokens": 145347406.0, + "step": 42720 + }, + { + "epoch": 0.4288610542374242, + "learning_rate": 0.00011422979645911115, + "loss": 0.7662, + "mean_token_accuracy": 0.7666055858135223, + "num_tokens": 145381587.0, + "step": 42730 + }, + { + "epoch": 0.4289614195672247, + "learning_rate": 0.00011420972339315108, + "loss": 0.7112, + "mean_token_accuracy": 0.7838475942611695, + "num_tokens": 145416177.0, + "step": 42740 + }, + { + "epoch": 0.4290617848970252, + "learning_rate": 0.00011418965032719098, + "loss": 0.7887, + "mean_token_accuracy": 0.7718412697315216, + "num_tokens": 145449761.0, + "step": 42750 + }, + { + "epoch": 0.42916215022682563, + "learning_rate": 0.00011416957726123088, + "loss": 0.7185, + "mean_token_accuracy": 0.7836577832698822, + "num_tokens": 145483524.0, + "step": 42760 + }, + { + "epoch": 0.42926251555662615, + "learning_rate": 0.0001141495041952708, + "loss": 0.7263, + "mean_token_accuracy": 0.7785545229911804, + "num_tokens": 145517639.0, + "step": 42770 + }, + { + "epoch": 0.4293628808864266, + "learning_rate": 0.0001141294311293107, + "loss": 0.7382, + "mean_token_accuracy": 0.7751895666122437, + "num_tokens": 145552476.0, + "step": 42780 + }, + { + "epoch": 0.42946324621622706, + "learning_rate": 0.00011410935806335059, + "loss": 0.7589, + "mean_token_accuracy": 0.7743195414543151, + "num_tokens": 145585953.0, + "step": 42790 + }, + { + "epoch": 0.4295636115460275, + "learning_rate": 0.00011408928499739051, + "loss": 0.7299, + "mean_token_accuracy": 0.78284832239151, + "num_tokens": 145619705.0, + "step": 42800 + }, + { + "epoch": 0.429663976875828, + "learning_rate": 0.00011406921193143041, + "loss": 0.7621, + "mean_token_accuracy": 0.7725806474685669, + "num_tokens": 145653006.0, + "step": 42810 + }, + { + "epoch": 0.4297643422056285, + "learning_rate": 0.0001140491388654703, + "loss": 0.7486, + "mean_token_accuracy": 0.7755830824375153, + "num_tokens": 145687064.0, + "step": 42820 + }, + { + "epoch": 0.42986470753542894, + "learning_rate": 0.00011402906579951022, + "loss": 0.7784, + "mean_token_accuracy": 0.7719202518463135, + "num_tokens": 145720957.0, + "step": 42830 + }, + { + "epoch": 0.42996507286522945, + "learning_rate": 0.00011400899273355012, + "loss": 0.7606, + "mean_token_accuracy": 0.7707092642784119, + "num_tokens": 145754449.0, + "step": 42840 + }, + { + "epoch": 0.4300654381950299, + "learning_rate": 0.00011398891966759004, + "loss": 0.7515, + "mean_token_accuracy": 0.7736448407173157, + "num_tokens": 145787727.0, + "step": 42850 + }, + { + "epoch": 0.43016580352483036, + "learning_rate": 0.00011396884660162994, + "loss": 0.7468, + "mean_token_accuracy": 0.7771518647670745, + "num_tokens": 145821506.0, + "step": 42860 + }, + { + "epoch": 0.43026616885463087, + "learning_rate": 0.00011394877353566984, + "loss": 0.7672, + "mean_token_accuracy": 0.7683781266212464, + "num_tokens": 145854865.0, + "step": 42870 + }, + { + "epoch": 0.4303665341844313, + "learning_rate": 0.00011392870046970975, + "loss": 0.7702, + "mean_token_accuracy": 0.7732557237148285, + "num_tokens": 145889360.0, + "step": 42880 + }, + { + "epoch": 0.4304668995142318, + "learning_rate": 0.00011390862740374966, + "loss": 0.7637, + "mean_token_accuracy": 0.7752172887325287, + "num_tokens": 145923478.0, + "step": 42890 + }, + { + "epoch": 0.4305672648440323, + "learning_rate": 0.00011388855433778956, + "loss": 0.7983, + "mean_token_accuracy": 0.762095820903778, + "num_tokens": 145958344.0, + "step": 42900 + }, + { + "epoch": 0.43066763017383275, + "learning_rate": 0.00011386848127182948, + "loss": 0.766, + "mean_token_accuracy": 0.7728649318218231, + "num_tokens": 145992565.0, + "step": 42910 + }, + { + "epoch": 0.4307679955036332, + "learning_rate": 0.00011384840820586937, + "loss": 0.7023, + "mean_token_accuracy": 0.7814755737781525, + "num_tokens": 146025837.0, + "step": 42920 + }, + { + "epoch": 0.4308683608334337, + "learning_rate": 0.00011382833513990927, + "loss": 0.7496, + "mean_token_accuracy": 0.7717016398906708, + "num_tokens": 146060082.0, + "step": 42930 + }, + { + "epoch": 0.4309687261632342, + "learning_rate": 0.00011380826207394919, + "loss": 0.7506, + "mean_token_accuracy": 0.7746443390846253, + "num_tokens": 146093673.0, + "step": 42940 + }, + { + "epoch": 0.43106909149303463, + "learning_rate": 0.00011378818900798909, + "loss": 0.7262, + "mean_token_accuracy": 0.7759982824325562, + "num_tokens": 146127839.0, + "step": 42950 + }, + { + "epoch": 0.43116945682283514, + "learning_rate": 0.00011376811594202898, + "loss": 0.7774, + "mean_token_accuracy": 0.7662631928920746, + "num_tokens": 146161483.0, + "step": 42960 + }, + { + "epoch": 0.4312698221526356, + "learning_rate": 0.0001137480428760689, + "loss": 0.7733, + "mean_token_accuracy": 0.7674487829208374, + "num_tokens": 146195755.0, + "step": 42970 + }, + { + "epoch": 0.43137018748243605, + "learning_rate": 0.0001137279698101088, + "loss": 0.7486, + "mean_token_accuracy": 0.7768530964851379, + "num_tokens": 146229186.0, + "step": 42980 + }, + { + "epoch": 0.43147055281223656, + "learning_rate": 0.0001137078967441487, + "loss": 0.7498, + "mean_token_accuracy": 0.7748568475246429, + "num_tokens": 146263112.0, + "step": 42990 + }, + { + "epoch": 0.431570918142037, + "learning_rate": 0.00011368782367818863, + "loss": 0.7451, + "mean_token_accuracy": 0.7756645023822785, + "num_tokens": 146296685.0, + "step": 43000 + }, + { + "epoch": 0.4316712834718375, + "learning_rate": 0.00011366775061222852, + "loss": 0.7592, + "mean_token_accuracy": 0.7742310643196106, + "num_tokens": 146330720.0, + "step": 43010 + }, + { + "epoch": 0.431771648801638, + "learning_rate": 0.00011364767754626842, + "loss": 0.7228, + "mean_token_accuracy": 0.780841052532196, + "num_tokens": 146365615.0, + "step": 43020 + }, + { + "epoch": 0.43187201413143844, + "learning_rate": 0.00011362760448030834, + "loss": 0.7349, + "mean_token_accuracy": 0.7785764336585999, + "num_tokens": 146399285.0, + "step": 43030 + }, + { + "epoch": 0.4319723794612389, + "learning_rate": 0.00011360753141434823, + "loss": 0.7332, + "mean_token_accuracy": 0.7761741042137146, + "num_tokens": 146433625.0, + "step": 43040 + }, + { + "epoch": 0.4320727447910394, + "learning_rate": 0.00011358745834838813, + "loss": 0.7322, + "mean_token_accuracy": 0.781286609172821, + "num_tokens": 146466849.0, + "step": 43050 + }, + { + "epoch": 0.43217311012083987, + "learning_rate": 0.00011356738528242805, + "loss": 0.7637, + "mean_token_accuracy": 0.7679896533489228, + "num_tokens": 146500899.0, + "step": 43060 + }, + { + "epoch": 0.4322734754506403, + "learning_rate": 0.00011354731221646795, + "loss": 0.7493, + "mean_token_accuracy": 0.7758651614189148, + "num_tokens": 146535913.0, + "step": 43070 + }, + { + "epoch": 0.4323738407804408, + "learning_rate": 0.00011352723915050784, + "loss": 0.7364, + "mean_token_accuracy": 0.7757045984268188, + "num_tokens": 146570949.0, + "step": 43080 + }, + { + "epoch": 0.4324742061102413, + "learning_rate": 0.00011350716608454776, + "loss": 0.7528, + "mean_token_accuracy": 0.7761816620826721, + "num_tokens": 146605146.0, + "step": 43090 + }, + { + "epoch": 0.43257457144004174, + "learning_rate": 0.00011348709301858767, + "loss": 0.755, + "mean_token_accuracy": 0.7720991194248199, + "num_tokens": 146638703.0, + "step": 43100 + }, + { + "epoch": 0.4326749367698422, + "learning_rate": 0.00011346701995262757, + "loss": 0.7637, + "mean_token_accuracy": 0.7714218497276306, + "num_tokens": 146673208.0, + "step": 43110 + }, + { + "epoch": 0.4327753020996427, + "learning_rate": 0.00011344694688666749, + "loss": 0.7621, + "mean_token_accuracy": 0.768765789270401, + "num_tokens": 146706635.0, + "step": 43120 + }, + { + "epoch": 0.43287566742944317, + "learning_rate": 0.00011342687382070738, + "loss": 0.721, + "mean_token_accuracy": 0.7781619131565094, + "num_tokens": 146740682.0, + "step": 43130 + }, + { + "epoch": 0.4329760327592436, + "learning_rate": 0.00011340680075474728, + "loss": 0.7711, + "mean_token_accuracy": 0.7729579508304596, + "num_tokens": 146774162.0, + "step": 43140 + }, + { + "epoch": 0.43307639808904413, + "learning_rate": 0.0001133867276887872, + "loss": 0.7362, + "mean_token_accuracy": 0.7753993928432464, + "num_tokens": 146808242.0, + "step": 43150 + }, + { + "epoch": 0.4331767634188446, + "learning_rate": 0.0001133666546228271, + "loss": 0.7897, + "mean_token_accuracy": 0.7667720377445221, + "num_tokens": 146842093.0, + "step": 43160 + }, + { + "epoch": 0.43327712874864505, + "learning_rate": 0.00011334658155686699, + "loss": 0.7774, + "mean_token_accuracy": 0.7674240648746491, + "num_tokens": 146875708.0, + "step": 43170 + }, + { + "epoch": 0.43337749407844556, + "learning_rate": 0.00011332650849090691, + "loss": 0.7324, + "mean_token_accuracy": 0.7821752607822419, + "num_tokens": 146909808.0, + "step": 43180 + }, + { + "epoch": 0.433477859408246, + "learning_rate": 0.0001133064354249468, + "loss": 0.7317, + "mean_token_accuracy": 0.776114422082901, + "num_tokens": 146943677.0, + "step": 43190 + }, + { + "epoch": 0.43357822473804647, + "learning_rate": 0.00011328636235898671, + "loss": 0.7313, + "mean_token_accuracy": 0.7763771116733551, + "num_tokens": 146977457.0, + "step": 43200 + }, + { + "epoch": 0.433678590067847, + "learning_rate": 0.00011326628929302662, + "loss": 0.7248, + "mean_token_accuracy": 0.786783367395401, + "num_tokens": 147011235.0, + "step": 43210 + }, + { + "epoch": 0.43377895539764744, + "learning_rate": 0.00011324621622706653, + "loss": 0.7602, + "mean_token_accuracy": 0.7720573008060455, + "num_tokens": 147044449.0, + "step": 43220 + }, + { + "epoch": 0.4338793207274479, + "learning_rate": 0.00011322614316110643, + "loss": 0.7151, + "mean_token_accuracy": 0.7858515202999115, + "num_tokens": 147078592.0, + "step": 43230 + }, + { + "epoch": 0.4339796860572484, + "learning_rate": 0.00011320607009514635, + "loss": 0.7616, + "mean_token_accuracy": 0.7693959653377533, + "num_tokens": 147112695.0, + "step": 43240 + }, + { + "epoch": 0.43408005138704886, + "learning_rate": 0.00011318599702918624, + "loss": 0.7407, + "mean_token_accuracy": 0.7777252614498138, + "num_tokens": 147147202.0, + "step": 43250 + }, + { + "epoch": 0.4341804167168493, + "learning_rate": 0.00011316592396322614, + "loss": 0.7755, + "mean_token_accuracy": 0.7707893550395966, + "num_tokens": 147181151.0, + "step": 43260 + }, + { + "epoch": 0.4342807820466498, + "learning_rate": 0.00011314585089726606, + "loss": 0.7632, + "mean_token_accuracy": 0.7738515973091126, + "num_tokens": 147215481.0, + "step": 43270 + }, + { + "epoch": 0.4343811473764503, + "learning_rate": 0.00011312577783130596, + "loss": 0.766, + "mean_token_accuracy": 0.7724314451217651, + "num_tokens": 147248850.0, + "step": 43280 + }, + { + "epoch": 0.43448151270625074, + "learning_rate": 0.00011310570476534585, + "loss": 0.764, + "mean_token_accuracy": 0.7727940082550049, + "num_tokens": 147282441.0, + "step": 43290 + }, + { + "epoch": 0.43458187803605125, + "learning_rate": 0.00011308563169938577, + "loss": 0.7686, + "mean_token_accuracy": 0.7741721034049988, + "num_tokens": 147316660.0, + "step": 43300 + }, + { + "epoch": 0.4346822433658517, + "learning_rate": 0.00011306555863342567, + "loss": 0.7157, + "mean_token_accuracy": 0.7825799405574798, + "num_tokens": 147351036.0, + "step": 43310 + }, + { + "epoch": 0.43478260869565216, + "learning_rate": 0.00011304548556746558, + "loss": 0.7505, + "mean_token_accuracy": 0.7806974291801453, + "num_tokens": 147384464.0, + "step": 43320 + }, + { + "epoch": 0.4348829740254527, + "learning_rate": 0.00011302541250150548, + "loss": 0.7794, + "mean_token_accuracy": 0.7736136972904205, + "num_tokens": 147418810.0, + "step": 43330 + }, + { + "epoch": 0.43498333935525313, + "learning_rate": 0.00011300533943554539, + "loss": 0.7576, + "mean_token_accuracy": 0.7703942358493805, + "num_tokens": 147452464.0, + "step": 43340 + }, + { + "epoch": 0.4350837046850536, + "learning_rate": 0.00011298526636958529, + "loss": 0.7399, + "mean_token_accuracy": 0.7802060544490814, + "num_tokens": 147486019.0, + "step": 43350 + }, + { + "epoch": 0.4351840700148541, + "learning_rate": 0.00011296519330362521, + "loss": 0.7777, + "mean_token_accuracy": 0.7689915657043457, + "num_tokens": 147519125.0, + "step": 43360 + }, + { + "epoch": 0.43528443534465455, + "learning_rate": 0.0001129451202376651, + "loss": 0.7309, + "mean_token_accuracy": 0.7763258755207062, + "num_tokens": 147552872.0, + "step": 43370 + }, + { + "epoch": 0.435384800674455, + "learning_rate": 0.000112925047171705, + "loss": 0.7458, + "mean_token_accuracy": 0.7751060128211975, + "num_tokens": 147586885.0, + "step": 43380 + }, + { + "epoch": 0.43548516600425546, + "learning_rate": 0.00011290497410574492, + "loss": 0.7917, + "mean_token_accuracy": 0.7648883879184722, + "num_tokens": 147621258.0, + "step": 43390 + }, + { + "epoch": 0.435585531334056, + "learning_rate": 0.00011288490103978482, + "loss": 0.7596, + "mean_token_accuracy": 0.7755088090896607, + "num_tokens": 147654561.0, + "step": 43400 + }, + { + "epoch": 0.43568589666385643, + "learning_rate": 0.00011286482797382474, + "loss": 0.7507, + "mean_token_accuracy": 0.7761448502540589, + "num_tokens": 147688265.0, + "step": 43410 + }, + { + "epoch": 0.4357862619936569, + "learning_rate": 0.00011284475490786463, + "loss": 0.7592, + "mean_token_accuracy": 0.7711888194084168, + "num_tokens": 147722114.0, + "step": 43420 + }, + { + "epoch": 0.4358866273234574, + "learning_rate": 0.00011282468184190453, + "loss": 0.777, + "mean_token_accuracy": 0.7686375737190246, + "num_tokens": 147755892.0, + "step": 43430 + }, + { + "epoch": 0.43598699265325785, + "learning_rate": 0.00011280460877594445, + "loss": 0.778, + "mean_token_accuracy": 0.7742932558059692, + "num_tokens": 147789319.0, + "step": 43440 + }, + { + "epoch": 0.4360873579830583, + "learning_rate": 0.00011278453570998436, + "loss": 0.7649, + "mean_token_accuracy": 0.7734306454658508, + "num_tokens": 147822474.0, + "step": 43450 + }, + { + "epoch": 0.4361877233128588, + "learning_rate": 0.00011276446264402425, + "loss": 0.7415, + "mean_token_accuracy": 0.7750584840774536, + "num_tokens": 147856600.0, + "step": 43460 + }, + { + "epoch": 0.4362880886426593, + "learning_rate": 0.00011274438957806417, + "loss": 0.7546, + "mean_token_accuracy": 0.7757338583469391, + "num_tokens": 147889611.0, + "step": 43470 + }, + { + "epoch": 0.43638845397245973, + "learning_rate": 0.00011272431651210407, + "loss": 0.7761, + "mean_token_accuracy": 0.7676257133483887, + "num_tokens": 147924358.0, + "step": 43480 + }, + { + "epoch": 0.43648881930226024, + "learning_rate": 0.00011270424344614396, + "loss": 0.7474, + "mean_token_accuracy": 0.7697301208972931, + "num_tokens": 147958186.0, + "step": 43490 + }, + { + "epoch": 0.4365891846320607, + "learning_rate": 0.00011268417038018389, + "loss": 0.7327, + "mean_token_accuracy": 0.7785479128360748, + "num_tokens": 147992440.0, + "step": 43500 + }, + { + "epoch": 0.43668954996186116, + "learning_rate": 0.00011266409731422378, + "loss": 0.7158, + "mean_token_accuracy": 0.7759631454944611, + "num_tokens": 148026123.0, + "step": 43510 + }, + { + "epoch": 0.43678991529166167, + "learning_rate": 0.00011264402424826368, + "loss": 0.7501, + "mean_token_accuracy": 0.775789487361908, + "num_tokens": 148060170.0, + "step": 43520 + }, + { + "epoch": 0.4368902806214621, + "learning_rate": 0.0001126239511823036, + "loss": 0.7443, + "mean_token_accuracy": 0.7734920859336853, + "num_tokens": 148094738.0, + "step": 43530 + }, + { + "epoch": 0.4369906459512626, + "learning_rate": 0.00011260387811634349, + "loss": 0.7617, + "mean_token_accuracy": 0.7684929430484772, + "num_tokens": 148128157.0, + "step": 43540 + }, + { + "epoch": 0.4370910112810631, + "learning_rate": 0.0001125838050503834, + "loss": 0.7525, + "mean_token_accuracy": 0.776504111289978, + "num_tokens": 148163114.0, + "step": 43550 + }, + { + "epoch": 0.43719137661086355, + "learning_rate": 0.00011256373198442331, + "loss": 0.7764, + "mean_token_accuracy": 0.7684085130691528, + "num_tokens": 148196998.0, + "step": 43560 + }, + { + "epoch": 0.437291741940664, + "learning_rate": 0.00011254365891846322, + "loss": 0.7363, + "mean_token_accuracy": 0.7734168648719788, + "num_tokens": 148230922.0, + "step": 43570 + }, + { + "epoch": 0.4373921072704645, + "learning_rate": 0.00011252358585250311, + "loss": 0.7672, + "mean_token_accuracy": 0.7757761478424072, + "num_tokens": 148265034.0, + "step": 43580 + }, + { + "epoch": 0.43749247260026497, + "learning_rate": 0.00011250351278654304, + "loss": 0.7228, + "mean_token_accuracy": 0.780917638540268, + "num_tokens": 148299100.0, + "step": 43590 + }, + { + "epoch": 0.4375928379300654, + "learning_rate": 0.00011248343972058293, + "loss": 0.739, + "mean_token_accuracy": 0.7782020151615143, + "num_tokens": 148333913.0, + "step": 43600 + }, + { + "epoch": 0.43769320325986594, + "learning_rate": 0.00011246336665462283, + "loss": 0.763, + "mean_token_accuracy": 0.7715815305709839, + "num_tokens": 148367724.0, + "step": 43610 + }, + { + "epoch": 0.4377935685896664, + "learning_rate": 0.00011244329358866275, + "loss": 0.7528, + "mean_token_accuracy": 0.7737765967845917, + "num_tokens": 148401807.0, + "step": 43620 + }, + { + "epoch": 0.43789393391946685, + "learning_rate": 0.00011242322052270264, + "loss": 0.7465, + "mean_token_accuracy": 0.7716784477233887, + "num_tokens": 148435545.0, + "step": 43630 + }, + { + "epoch": 0.43799429924926736, + "learning_rate": 0.00011240314745674254, + "loss": 0.7552, + "mean_token_accuracy": 0.776634031534195, + "num_tokens": 148469623.0, + "step": 43640 + }, + { + "epoch": 0.4380946645790678, + "learning_rate": 0.00011238307439078246, + "loss": 0.7294, + "mean_token_accuracy": 0.7753891468048095, + "num_tokens": 148502671.0, + "step": 43650 + }, + { + "epoch": 0.43819502990886827, + "learning_rate": 0.00011236300132482235, + "loss": 0.7266, + "mean_token_accuracy": 0.779669314622879, + "num_tokens": 148536980.0, + "step": 43660 + }, + { + "epoch": 0.43829539523866873, + "learning_rate": 0.00011234292825886226, + "loss": 0.7783, + "mean_token_accuracy": 0.7682388186454773, + "num_tokens": 148570675.0, + "step": 43670 + }, + { + "epoch": 0.43839576056846924, + "learning_rate": 0.00011232285519290217, + "loss": 0.7646, + "mean_token_accuracy": 0.7727665424346923, + "num_tokens": 148604730.0, + "step": 43680 + }, + { + "epoch": 0.4384961258982697, + "learning_rate": 0.00011230278212694208, + "loss": 0.722, + "mean_token_accuracy": 0.7830365002155304, + "num_tokens": 148638983.0, + "step": 43690 + }, + { + "epoch": 0.43859649122807015, + "learning_rate": 0.00011228270906098197, + "loss": 0.7491, + "mean_token_accuracy": 0.7743676781654358, + "num_tokens": 148672923.0, + "step": 43700 + }, + { + "epoch": 0.43869685655787066, + "learning_rate": 0.0001122626359950219, + "loss": 0.7255, + "mean_token_accuracy": 0.7819778323173523, + "num_tokens": 148707032.0, + "step": 43710 + }, + { + "epoch": 0.4387972218876711, + "learning_rate": 0.00011224256292906179, + "loss": 0.7355, + "mean_token_accuracy": 0.7821864724159241, + "num_tokens": 148740780.0, + "step": 43720 + }, + { + "epoch": 0.4388975872174716, + "learning_rate": 0.00011222248986310169, + "loss": 0.7204, + "mean_token_accuracy": 0.7825488030910492, + "num_tokens": 148774642.0, + "step": 43730 + }, + { + "epoch": 0.4389979525472721, + "learning_rate": 0.00011220241679714161, + "loss": 0.7429, + "mean_token_accuracy": 0.7777960121631622, + "num_tokens": 148808512.0, + "step": 43740 + }, + { + "epoch": 0.43909831787707254, + "learning_rate": 0.0001121823437311815, + "loss": 0.7159, + "mean_token_accuracy": 0.7805725157260894, + "num_tokens": 148842492.0, + "step": 43750 + }, + { + "epoch": 0.439198683206873, + "learning_rate": 0.0001121622706652214, + "loss": 0.7439, + "mean_token_accuracy": 0.7803267896175384, + "num_tokens": 148876804.0, + "step": 43760 + }, + { + "epoch": 0.4392990485366735, + "learning_rate": 0.00011214219759926132, + "loss": 0.7601, + "mean_token_accuracy": 0.7764488101005554, + "num_tokens": 148910864.0, + "step": 43770 + }, + { + "epoch": 0.43939941386647396, + "learning_rate": 0.00011212212453330121, + "loss": 0.7685, + "mean_token_accuracy": 0.7743898093700409, + "num_tokens": 148945189.0, + "step": 43780 + }, + { + "epoch": 0.4394997791962744, + "learning_rate": 0.00011210205146734112, + "loss": 0.7247, + "mean_token_accuracy": 0.7831371545791626, + "num_tokens": 148980389.0, + "step": 43790 + }, + { + "epoch": 0.43960014452607493, + "learning_rate": 0.00011208197840138104, + "loss": 0.7657, + "mean_token_accuracy": 0.7732807636260987, + "num_tokens": 149014489.0, + "step": 43800 + }, + { + "epoch": 0.4397005098558754, + "learning_rate": 0.00011206190533542094, + "loss": 0.7768, + "mean_token_accuracy": 0.7680534720420837, + "num_tokens": 149048386.0, + "step": 43810 + }, + { + "epoch": 0.43980087518567584, + "learning_rate": 0.00011204183226946083, + "loss": 0.7605, + "mean_token_accuracy": 0.7759904325008392, + "num_tokens": 149083384.0, + "step": 43820 + }, + { + "epoch": 0.43990124051547635, + "learning_rate": 0.00011202175920350076, + "loss": 0.7334, + "mean_token_accuracy": 0.782331782579422, + "num_tokens": 149117597.0, + "step": 43830 + }, + { + "epoch": 0.4400016058452768, + "learning_rate": 0.00011200168613754065, + "loss": 0.7647, + "mean_token_accuracy": 0.7740571975708008, + "num_tokens": 149151403.0, + "step": 43840 + }, + { + "epoch": 0.44010197117507727, + "learning_rate": 0.00011198161307158055, + "loss": 0.7756, + "mean_token_accuracy": 0.7720715939998627, + "num_tokens": 149184826.0, + "step": 43850 + }, + { + "epoch": 0.4402023365048778, + "learning_rate": 0.00011196154000562047, + "loss": 0.7698, + "mean_token_accuracy": 0.7729233264923095, + "num_tokens": 149219488.0, + "step": 43860 + }, + { + "epoch": 0.44030270183467823, + "learning_rate": 0.00011194146693966036, + "loss": 0.7215, + "mean_token_accuracy": 0.7808591425418854, + "num_tokens": 149253761.0, + "step": 43870 + }, + { + "epoch": 0.4404030671644787, + "learning_rate": 0.00011192139387370026, + "loss": 0.7472, + "mean_token_accuracy": 0.7746274948120118, + "num_tokens": 149288748.0, + "step": 43880 + }, + { + "epoch": 0.4405034324942792, + "learning_rate": 0.00011190132080774018, + "loss": 0.7425, + "mean_token_accuracy": 0.7758005857467651, + "num_tokens": 149322532.0, + "step": 43890 + }, + { + "epoch": 0.44060379782407966, + "learning_rate": 0.00011188124774178009, + "loss": 0.7444, + "mean_token_accuracy": 0.778124886751175, + "num_tokens": 149357154.0, + "step": 43900 + }, + { + "epoch": 0.4407041631538801, + "learning_rate": 0.00011186117467581998, + "loss": 0.7631, + "mean_token_accuracy": 0.7752729535102845, + "num_tokens": 149391861.0, + "step": 43910 + }, + { + "epoch": 0.4408045284836806, + "learning_rate": 0.0001118411016098599, + "loss": 0.7553, + "mean_token_accuracy": 0.770001494884491, + "num_tokens": 149425672.0, + "step": 43920 + }, + { + "epoch": 0.4409048938134811, + "learning_rate": 0.0001118210285438998, + "loss": 0.7421, + "mean_token_accuracy": 0.7809359133243561, + "num_tokens": 149460223.0, + "step": 43930 + }, + { + "epoch": 0.44100525914328154, + "learning_rate": 0.0001118009554779397, + "loss": 0.7204, + "mean_token_accuracy": 0.7850530624389649, + "num_tokens": 149493781.0, + "step": 43940 + }, + { + "epoch": 0.441105624473082, + "learning_rate": 0.00011178088241197962, + "loss": 0.7252, + "mean_token_accuracy": 0.7797057867050171, + "num_tokens": 149528669.0, + "step": 43950 + }, + { + "epoch": 0.4412059898028825, + "learning_rate": 0.00011176080934601951, + "loss": 0.7568, + "mean_token_accuracy": 0.7771291673183441, + "num_tokens": 149562236.0, + "step": 43960 + }, + { + "epoch": 0.44130635513268296, + "learning_rate": 0.00011174073628005943, + "loss": 0.7623, + "mean_token_accuracy": 0.7755987465381622, + "num_tokens": 149596168.0, + "step": 43970 + }, + { + "epoch": 0.4414067204624834, + "learning_rate": 0.00011172066321409933, + "loss": 0.7263, + "mean_token_accuracy": 0.7827870607376098, + "num_tokens": 149630105.0, + "step": 43980 + }, + { + "epoch": 0.4415070857922839, + "learning_rate": 0.00011170059014813922, + "loss": 0.7481, + "mean_token_accuracy": 0.7742818355560303, + "num_tokens": 149664931.0, + "step": 43990 + }, + { + "epoch": 0.4416074511220844, + "learning_rate": 0.00011168051708217915, + "loss": 0.7752, + "mean_token_accuracy": 0.770356547832489, + "num_tokens": 149697876.0, + "step": 44000 + }, + { + "epoch": 0.44170781645188484, + "learning_rate": 0.00011166044401621904, + "loss": 0.7507, + "mean_token_accuracy": 0.7784092545509338, + "num_tokens": 149731738.0, + "step": 44010 + }, + { + "epoch": 0.44180818178168535, + "learning_rate": 0.00011164037095025895, + "loss": 0.7059, + "mean_token_accuracy": 0.7859094977378845, + "num_tokens": 149765648.0, + "step": 44020 + }, + { + "epoch": 0.4419085471114858, + "learning_rate": 0.00011162029788429886, + "loss": 0.762, + "mean_token_accuracy": 0.774725592136383, + "num_tokens": 149800114.0, + "step": 44030 + }, + { + "epoch": 0.44200891244128626, + "learning_rate": 0.00011160022481833877, + "loss": 0.731, + "mean_token_accuracy": 0.7784102320671081, + "num_tokens": 149834841.0, + "step": 44040 + }, + { + "epoch": 0.4421092777710868, + "learning_rate": 0.00011158015175237866, + "loss": 0.7157, + "mean_token_accuracy": 0.7827341020107269, + "num_tokens": 149868802.0, + "step": 44050 + }, + { + "epoch": 0.44220964310088723, + "learning_rate": 0.00011156007868641858, + "loss": 0.7534, + "mean_token_accuracy": 0.7758202314376831, + "num_tokens": 149902453.0, + "step": 44060 + }, + { + "epoch": 0.4423100084306877, + "learning_rate": 0.00011154000562045848, + "loss": 0.7614, + "mean_token_accuracy": 0.7681388676166534, + "num_tokens": 149937141.0, + "step": 44070 + }, + { + "epoch": 0.4424103737604882, + "learning_rate": 0.00011151993255449837, + "loss": 0.783, + "mean_token_accuracy": 0.7707764804363251, + "num_tokens": 149971447.0, + "step": 44080 + }, + { + "epoch": 0.44251073909028865, + "learning_rate": 0.0001114998594885383, + "loss": 0.7493, + "mean_token_accuracy": 0.7753174424171447, + "num_tokens": 150005271.0, + "step": 44090 + }, + { + "epoch": 0.4426111044200891, + "learning_rate": 0.00011147978642257819, + "loss": 0.7534, + "mean_token_accuracy": 0.7698142409324646, + "num_tokens": 150039632.0, + "step": 44100 + }, + { + "epoch": 0.4427114697498896, + "learning_rate": 0.00011145971335661808, + "loss": 0.7691, + "mean_token_accuracy": 0.7704128801822663, + "num_tokens": 150074429.0, + "step": 44110 + }, + { + "epoch": 0.4428118350796901, + "learning_rate": 0.000111439640290658, + "loss": 0.754, + "mean_token_accuracy": 0.767986536026001, + "num_tokens": 150108714.0, + "step": 44120 + }, + { + "epoch": 0.44291220040949053, + "learning_rate": 0.0001114195672246979, + "loss": 0.7313, + "mean_token_accuracy": 0.7801444411277771, + "num_tokens": 150143349.0, + "step": 44130 + }, + { + "epoch": 0.44301256573929104, + "learning_rate": 0.00011139949415873781, + "loss": 0.769, + "mean_token_accuracy": 0.7680265784263611, + "num_tokens": 150177716.0, + "step": 44140 + }, + { + "epoch": 0.4431129310690915, + "learning_rate": 0.00011137942109277773, + "loss": 0.7555, + "mean_token_accuracy": 0.7723772168159485, + "num_tokens": 150212615.0, + "step": 44150 + }, + { + "epoch": 0.44321329639889195, + "learning_rate": 0.00011135934802681763, + "loss": 0.7439, + "mean_token_accuracy": 0.7749141871929168, + "num_tokens": 150246173.0, + "step": 44160 + }, + { + "epoch": 0.44331366172869247, + "learning_rate": 0.00011133927496085752, + "loss": 0.7371, + "mean_token_accuracy": 0.7740356266498566, + "num_tokens": 150280009.0, + "step": 44170 + }, + { + "epoch": 0.4434140270584929, + "learning_rate": 0.00011131920189489744, + "loss": 0.7833, + "mean_token_accuracy": 0.7707145631313324, + "num_tokens": 150315302.0, + "step": 44180 + }, + { + "epoch": 0.4435143923882934, + "learning_rate": 0.00011129912882893734, + "loss": 0.7599, + "mean_token_accuracy": 0.772494101524353, + "num_tokens": 150349697.0, + "step": 44190 + }, + { + "epoch": 0.4436147577180939, + "learning_rate": 0.00011127905576297723, + "loss": 0.7576, + "mean_token_accuracy": 0.7743092060089112, + "num_tokens": 150384328.0, + "step": 44200 + }, + { + "epoch": 0.44371512304789434, + "learning_rate": 0.00011125898269701716, + "loss": 0.7171, + "mean_token_accuracy": 0.782273119688034, + "num_tokens": 150417859.0, + "step": 44210 + }, + { + "epoch": 0.4438154883776948, + "learning_rate": 0.00011123890963105705, + "loss": 0.7779, + "mean_token_accuracy": 0.7740826606750488, + "num_tokens": 150451836.0, + "step": 44220 + }, + { + "epoch": 0.44391585370749526, + "learning_rate": 0.00011121883656509694, + "loss": 0.7414, + "mean_token_accuracy": 0.7781951189041137, + "num_tokens": 150486201.0, + "step": 44230 + }, + { + "epoch": 0.44401621903729577, + "learning_rate": 0.00011119876349913687, + "loss": 0.7301, + "mean_token_accuracy": 0.7788292706012726, + "num_tokens": 150519669.0, + "step": 44240 + }, + { + "epoch": 0.4441165843670962, + "learning_rate": 0.00011117869043317678, + "loss": 0.7575, + "mean_token_accuracy": 0.7742524087429047, + "num_tokens": 150553112.0, + "step": 44250 + }, + { + "epoch": 0.4442169496968967, + "learning_rate": 0.00011115861736721667, + "loss": 0.7408, + "mean_token_accuracy": 0.7746887743473053, + "num_tokens": 150587479.0, + "step": 44260 + }, + { + "epoch": 0.4443173150266972, + "learning_rate": 0.00011113854430125659, + "loss": 0.7493, + "mean_token_accuracy": 0.7738109111785889, + "num_tokens": 150621557.0, + "step": 44270 + }, + { + "epoch": 0.44441768035649765, + "learning_rate": 0.00011111847123529649, + "loss": 0.7206, + "mean_token_accuracy": 0.7809482932090759, + "num_tokens": 150656884.0, + "step": 44280 + }, + { + "epoch": 0.4445180456862981, + "learning_rate": 0.00011109839816933638, + "loss": 0.7546, + "mean_token_accuracy": 0.775887793302536, + "num_tokens": 150690433.0, + "step": 44290 + }, + { + "epoch": 0.4446184110160986, + "learning_rate": 0.0001110783251033763, + "loss": 0.7631, + "mean_token_accuracy": 0.7731802225112915, + "num_tokens": 150724169.0, + "step": 44300 + }, + { + "epoch": 0.44471877634589907, + "learning_rate": 0.0001110582520374162, + "loss": 0.7471, + "mean_token_accuracy": 0.7732235372066498, + "num_tokens": 150759354.0, + "step": 44310 + }, + { + "epoch": 0.4448191416756995, + "learning_rate": 0.0001110381789714561, + "loss": 0.7327, + "mean_token_accuracy": 0.7866859495639801, + "num_tokens": 150792697.0, + "step": 44320 + }, + { + "epoch": 0.44491950700550004, + "learning_rate": 0.00011101810590549602, + "loss": 0.7328, + "mean_token_accuracy": 0.7779637038707733, + "num_tokens": 150825950.0, + "step": 44330 + }, + { + "epoch": 0.4450198723353005, + "learning_rate": 0.00011099803283953591, + "loss": 0.714, + "mean_token_accuracy": 0.7852058053016663, + "num_tokens": 150859211.0, + "step": 44340 + }, + { + "epoch": 0.44512023766510095, + "learning_rate": 0.00011097795977357582, + "loss": 0.7416, + "mean_token_accuracy": 0.7797508060932159, + "num_tokens": 150892624.0, + "step": 44350 + }, + { + "epoch": 0.44522060299490146, + "learning_rate": 0.00011095788670761573, + "loss": 0.7918, + "mean_token_accuracy": 0.7642795860767364, + "num_tokens": 150926497.0, + "step": 44360 + }, + { + "epoch": 0.4453209683247019, + "learning_rate": 0.00011093781364165564, + "loss": 0.7533, + "mean_token_accuracy": 0.7732256591320038, + "num_tokens": 150960100.0, + "step": 44370 + }, + { + "epoch": 0.44542133365450237, + "learning_rate": 0.00011091774057569553, + "loss": 0.7976, + "mean_token_accuracy": 0.7641650021076203, + "num_tokens": 150994591.0, + "step": 44380 + }, + { + "epoch": 0.4455216989843029, + "learning_rate": 0.00011089766750973545, + "loss": 0.7487, + "mean_token_accuracy": 0.7758909225463867, + "num_tokens": 151028977.0, + "step": 44390 + }, + { + "epoch": 0.44562206431410334, + "learning_rate": 0.00011087759444377535, + "loss": 0.7403, + "mean_token_accuracy": 0.7733930587768555, + "num_tokens": 151063183.0, + "step": 44400 + }, + { + "epoch": 0.4457224296439038, + "learning_rate": 0.00011085752137781524, + "loss": 0.7305, + "mean_token_accuracy": 0.7791752755641937, + "num_tokens": 151097491.0, + "step": 44410 + }, + { + "epoch": 0.4458227949737043, + "learning_rate": 0.00011083744831185516, + "loss": 0.7367, + "mean_token_accuracy": 0.7794057905673981, + "num_tokens": 151131641.0, + "step": 44420 + }, + { + "epoch": 0.44592316030350476, + "learning_rate": 0.00011081737524589506, + "loss": 0.7263, + "mean_token_accuracy": 0.7804259061813354, + "num_tokens": 151166489.0, + "step": 44430 + }, + { + "epoch": 0.4460235256333052, + "learning_rate": 0.00011079730217993495, + "loss": 0.7809, + "mean_token_accuracy": 0.7714639127254486, + "num_tokens": 151200008.0, + "step": 44440 + }, + { + "epoch": 0.44612389096310573, + "learning_rate": 0.00011077722911397488, + "loss": 0.7866, + "mean_token_accuracy": 0.7731386125087738, + "num_tokens": 151233927.0, + "step": 44450 + }, + { + "epoch": 0.4462242562929062, + "learning_rate": 0.00011075715604801477, + "loss": 0.7067, + "mean_token_accuracy": 0.7901102244853974, + "num_tokens": 151267858.0, + "step": 44460 + }, + { + "epoch": 0.44632462162270664, + "learning_rate": 0.00011073708298205468, + "loss": 0.7218, + "mean_token_accuracy": 0.7798720598220825, + "num_tokens": 151302475.0, + "step": 44470 + }, + { + "epoch": 0.44642498695250715, + "learning_rate": 0.00011071700991609459, + "loss": 0.7592, + "mean_token_accuracy": 0.7675409078598022, + "num_tokens": 151337152.0, + "step": 44480 + }, + { + "epoch": 0.4465253522823076, + "learning_rate": 0.0001106969368501345, + "loss": 0.7652, + "mean_token_accuracy": 0.7725721955299377, + "num_tokens": 151371174.0, + "step": 44490 + }, + { + "epoch": 0.44662571761210806, + "learning_rate": 0.00011067686378417439, + "loss": 0.7406, + "mean_token_accuracy": 0.779172706604004, + "num_tokens": 151405625.0, + "step": 44500 + }, + { + "epoch": 0.4467260829419085, + "learning_rate": 0.00011065679071821431, + "loss": 0.7582, + "mean_token_accuracy": 0.7733696103096008, + "num_tokens": 151439959.0, + "step": 44510 + }, + { + "epoch": 0.44682644827170903, + "learning_rate": 0.00011063671765225421, + "loss": 0.7573, + "mean_token_accuracy": 0.7659881412982941, + "num_tokens": 151473539.0, + "step": 44520 + }, + { + "epoch": 0.4469268136015095, + "learning_rate": 0.0001106166445862941, + "loss": 0.7334, + "mean_token_accuracy": 0.7809433043003082, + "num_tokens": 151507369.0, + "step": 44530 + }, + { + "epoch": 0.44702717893130994, + "learning_rate": 0.00011059657152033402, + "loss": 0.7186, + "mean_token_accuracy": 0.7804858088493347, + "num_tokens": 151541480.0, + "step": 44540 + }, + { + "epoch": 0.44712754426111045, + "learning_rate": 0.00011057649845437392, + "loss": 0.7547, + "mean_token_accuracy": 0.7767960965633393, + "num_tokens": 151575833.0, + "step": 44550 + }, + { + "epoch": 0.4472279095909109, + "learning_rate": 0.00011055642538841384, + "loss": 0.7525, + "mean_token_accuracy": 0.7782451093196869, + "num_tokens": 151609860.0, + "step": 44560 + }, + { + "epoch": 0.44732827492071137, + "learning_rate": 0.00011053635232245374, + "loss": 0.7038, + "mean_token_accuracy": 0.7875931859016418, + "num_tokens": 151644156.0, + "step": 44570 + }, + { + "epoch": 0.4474286402505119, + "learning_rate": 0.00011051627925649363, + "loss": 0.7759, + "mean_token_accuracy": 0.7787350296974183, + "num_tokens": 151677964.0, + "step": 44580 + }, + { + "epoch": 0.44752900558031233, + "learning_rate": 0.00011049620619053355, + "loss": 0.7525, + "mean_token_accuracy": 0.7707826018333435, + "num_tokens": 151711574.0, + "step": 44590 + }, + { + "epoch": 0.4476293709101128, + "learning_rate": 0.00011047613312457346, + "loss": 0.7491, + "mean_token_accuracy": 0.7768722116947174, + "num_tokens": 151745582.0, + "step": 44600 + }, + { + "epoch": 0.4477297362399133, + "learning_rate": 0.00011045606005861336, + "loss": 0.7669, + "mean_token_accuracy": 0.7713538646697998, + "num_tokens": 151780065.0, + "step": 44610 + }, + { + "epoch": 0.44783010156971376, + "learning_rate": 0.00011043598699265328, + "loss": 0.7473, + "mean_token_accuracy": 0.776011997461319, + "num_tokens": 151814621.0, + "step": 44620 + }, + { + "epoch": 0.4479304668995142, + "learning_rate": 0.00011041591392669317, + "loss": 0.7217, + "mean_token_accuracy": 0.7846306204795838, + "num_tokens": 151848477.0, + "step": 44630 + }, + { + "epoch": 0.4480308322293147, + "learning_rate": 0.00011039584086073307, + "loss": 0.7295, + "mean_token_accuracy": 0.7849527895450592, + "num_tokens": 151883337.0, + "step": 44640 + }, + { + "epoch": 0.4481311975591152, + "learning_rate": 0.00011037576779477299, + "loss": 0.7574, + "mean_token_accuracy": 0.7724159836769104, + "num_tokens": 151916760.0, + "step": 44650 + }, + { + "epoch": 0.44823156288891564, + "learning_rate": 0.00011035569472881289, + "loss": 0.7637, + "mean_token_accuracy": 0.7737322509288788, + "num_tokens": 151950685.0, + "step": 44660 + }, + { + "epoch": 0.44833192821871615, + "learning_rate": 0.00011033562166285278, + "loss": 0.7194, + "mean_token_accuracy": 0.7801818192005158, + "num_tokens": 151984859.0, + "step": 44670 + }, + { + "epoch": 0.4484322935485166, + "learning_rate": 0.0001103155485968927, + "loss": 0.7338, + "mean_token_accuracy": 0.781706178188324, + "num_tokens": 152019151.0, + "step": 44680 + }, + { + "epoch": 0.44853265887831706, + "learning_rate": 0.0001102954755309326, + "loss": 0.7529, + "mean_token_accuracy": 0.7799510359764099, + "num_tokens": 152053767.0, + "step": 44690 + }, + { + "epoch": 0.44863302420811757, + "learning_rate": 0.0001102754024649725, + "loss": 0.7218, + "mean_token_accuracy": 0.7807285010814666, + "num_tokens": 152088255.0, + "step": 44700 + }, + { + "epoch": 0.448733389537918, + "learning_rate": 0.00011025532939901241, + "loss": 0.7885, + "mean_token_accuracy": 0.7673042953014374, + "num_tokens": 152122375.0, + "step": 44710 + }, + { + "epoch": 0.4488337548677185, + "learning_rate": 0.00011023525633305232, + "loss": 0.7403, + "mean_token_accuracy": 0.7771869957447052, + "num_tokens": 152156587.0, + "step": 44720 + }, + { + "epoch": 0.448934120197519, + "learning_rate": 0.00011021518326709222, + "loss": 0.7501, + "mean_token_accuracy": 0.7746523737907409, + "num_tokens": 152190688.0, + "step": 44730 + }, + { + "epoch": 0.44903448552731945, + "learning_rate": 0.00011019511020113214, + "loss": 0.7294, + "mean_token_accuracy": 0.7841888248920441, + "num_tokens": 152225354.0, + "step": 44740 + }, + { + "epoch": 0.4491348508571199, + "learning_rate": 0.00011017503713517203, + "loss": 0.7547, + "mean_token_accuracy": 0.7752269029617309, + "num_tokens": 152259841.0, + "step": 44750 + }, + { + "epoch": 0.4492352161869204, + "learning_rate": 0.00011015496406921193, + "loss": 0.709, + "mean_token_accuracy": 0.7895790874958039, + "num_tokens": 152294626.0, + "step": 44760 + }, + { + "epoch": 0.44933558151672087, + "learning_rate": 0.00011013489100325185, + "loss": 0.7565, + "mean_token_accuracy": 0.7733225226402283, + "num_tokens": 152328799.0, + "step": 44770 + }, + { + "epoch": 0.44943594684652133, + "learning_rate": 0.00011011481793729175, + "loss": 0.7224, + "mean_token_accuracy": 0.7841477155685425, + "num_tokens": 152363147.0, + "step": 44780 + }, + { + "epoch": 0.4495363121763218, + "learning_rate": 0.00011009474487133164, + "loss": 0.7523, + "mean_token_accuracy": 0.7750907003879547, + "num_tokens": 152397871.0, + "step": 44790 + }, + { + "epoch": 0.4496366775061223, + "learning_rate": 0.00011007467180537156, + "loss": 0.7183, + "mean_token_accuracy": 0.7833089828491211, + "num_tokens": 152432334.0, + "step": 44800 + }, + { + "epoch": 0.44973704283592275, + "learning_rate": 0.00011005459873941146, + "loss": 0.7488, + "mean_token_accuracy": 0.7749288022518158, + "num_tokens": 152465909.0, + "step": 44810 + }, + { + "epoch": 0.4498374081657232, + "learning_rate": 0.00011003452567345137, + "loss": 0.7312, + "mean_token_accuracy": 0.7770084142684937, + "num_tokens": 152499684.0, + "step": 44820 + }, + { + "epoch": 0.4499377734955237, + "learning_rate": 0.00011001445260749127, + "loss": 0.7403, + "mean_token_accuracy": 0.7816311717033386, + "num_tokens": 152534067.0, + "step": 44830 + }, + { + "epoch": 0.4500381388253242, + "learning_rate": 0.00010999437954153118, + "loss": 0.7358, + "mean_token_accuracy": 0.783948940038681, + "num_tokens": 152567928.0, + "step": 44840 + }, + { + "epoch": 0.45013850415512463, + "learning_rate": 0.00010997430647557108, + "loss": 0.7558, + "mean_token_accuracy": 0.7711122810840607, + "num_tokens": 152602037.0, + "step": 44850 + }, + { + "epoch": 0.45023886948492514, + "learning_rate": 0.000109954233409611, + "loss": 0.742, + "mean_token_accuracy": 0.77590092420578, + "num_tokens": 152636816.0, + "step": 44860 + }, + { + "epoch": 0.4503392348147256, + "learning_rate": 0.0001099341603436509, + "loss": 0.7564, + "mean_token_accuracy": 0.772537213563919, + "num_tokens": 152671468.0, + "step": 44870 + }, + { + "epoch": 0.45043960014452605, + "learning_rate": 0.00010991408727769079, + "loss": 0.7897, + "mean_token_accuracy": 0.767767709493637, + "num_tokens": 152705343.0, + "step": 44880 + }, + { + "epoch": 0.45053996547432656, + "learning_rate": 0.00010989401421173071, + "loss": 0.7162, + "mean_token_accuracy": 0.7875835716724395, + "num_tokens": 152739295.0, + "step": 44890 + }, + { + "epoch": 0.450640330804127, + "learning_rate": 0.0001098739411457706, + "loss": 0.7553, + "mean_token_accuracy": 0.7732517123222351, + "num_tokens": 152773289.0, + "step": 44900 + }, + { + "epoch": 0.4507406961339275, + "learning_rate": 0.0001098538680798105, + "loss": 0.7365, + "mean_token_accuracy": 0.7796446919441223, + "num_tokens": 152806787.0, + "step": 44910 + }, + { + "epoch": 0.450841061463728, + "learning_rate": 0.00010983379501385042, + "loss": 0.7393, + "mean_token_accuracy": 0.782460218667984, + "num_tokens": 152841397.0, + "step": 44920 + }, + { + "epoch": 0.45094142679352844, + "learning_rate": 0.00010981372194789032, + "loss": 0.7203, + "mean_token_accuracy": 0.7838031113147735, + "num_tokens": 152876756.0, + "step": 44930 + }, + { + "epoch": 0.4510417921233289, + "learning_rate": 0.00010979364888193023, + "loss": 0.7636, + "mean_token_accuracy": 0.7748829603195191, + "num_tokens": 152910930.0, + "step": 44940 + }, + { + "epoch": 0.4511421574531294, + "learning_rate": 0.00010977357581597015, + "loss": 0.721, + "mean_token_accuracy": 0.7819502830505372, + "num_tokens": 152944540.0, + "step": 44950 + }, + { + "epoch": 0.45124252278292987, + "learning_rate": 0.00010975350275001004, + "loss": 0.7315, + "mean_token_accuracy": 0.7765802860260009, + "num_tokens": 152979407.0, + "step": 44960 + }, + { + "epoch": 0.4513428881127303, + "learning_rate": 0.00010973342968404994, + "loss": 0.7499, + "mean_token_accuracy": 0.7792832970619201, + "num_tokens": 153013721.0, + "step": 44970 + }, + { + "epoch": 0.45144325344253083, + "learning_rate": 0.00010971335661808986, + "loss": 0.7203, + "mean_token_accuracy": 0.7842995822429657, + "num_tokens": 153049466.0, + "step": 44980 + }, + { + "epoch": 0.4515436187723313, + "learning_rate": 0.00010969328355212976, + "loss": 0.7149, + "mean_token_accuracy": 0.7853386759757995, + "num_tokens": 153084689.0, + "step": 44990 + }, + { + "epoch": 0.45164398410213175, + "learning_rate": 0.00010967321048616965, + "loss": 0.7136, + "mean_token_accuracy": 0.7828909814357757, + "num_tokens": 153120308.0, + "step": 45000 + }, + { + "epoch": 0.45174434943193226, + "learning_rate": 0.00010965313742020957, + "loss": 0.7786, + "mean_token_accuracy": 0.7707717061042786, + "num_tokens": 153153962.0, + "step": 45010 + }, + { + "epoch": 0.4518447147617327, + "learning_rate": 0.00010963306435424947, + "loss": 0.7105, + "mean_token_accuracy": 0.7827567040920258, + "num_tokens": 153188249.0, + "step": 45020 + }, + { + "epoch": 0.45194508009153317, + "learning_rate": 0.00010961299128828936, + "loss": 0.7274, + "mean_token_accuracy": 0.7786150217056275, + "num_tokens": 153223850.0, + "step": 45030 + }, + { + "epoch": 0.4520454454213337, + "learning_rate": 0.00010959291822232928, + "loss": 0.7495, + "mean_token_accuracy": 0.7740147352218628, + "num_tokens": 153259052.0, + "step": 45040 + }, + { + "epoch": 0.45214581075113414, + "learning_rate": 0.00010957284515636919, + "loss": 0.7279, + "mean_token_accuracy": 0.7824159443378449, + "num_tokens": 153294295.0, + "step": 45050 + }, + { + "epoch": 0.4522461760809346, + "learning_rate": 0.00010955277209040909, + "loss": 0.7455, + "mean_token_accuracy": 0.7790737450122833, + "num_tokens": 153329893.0, + "step": 45060 + }, + { + "epoch": 0.45234654141073505, + "learning_rate": 0.00010953269902444901, + "loss": 0.7302, + "mean_token_accuracy": 0.7857704102993012, + "num_tokens": 153364620.0, + "step": 45070 + }, + { + "epoch": 0.45244690674053556, + "learning_rate": 0.0001095126259584889, + "loss": 0.7335, + "mean_token_accuracy": 0.7841358959674836, + "num_tokens": 153400195.0, + "step": 45080 + }, + { + "epoch": 0.452547272070336, + "learning_rate": 0.0001094925528925288, + "loss": 0.7118, + "mean_token_accuracy": 0.7873798191547394, + "num_tokens": 153436065.0, + "step": 45090 + }, + { + "epoch": 0.45264763740013647, + "learning_rate": 0.00010947247982656872, + "loss": 0.7097, + "mean_token_accuracy": 0.7894898891448975, + "num_tokens": 153470537.0, + "step": 45100 + }, + { + "epoch": 0.452748002729937, + "learning_rate": 0.00010945240676060862, + "loss": 0.6934, + "mean_token_accuracy": 0.7880873382091522, + "num_tokens": 153505241.0, + "step": 45110 + }, + { + "epoch": 0.45284836805973744, + "learning_rate": 0.00010943233369464854, + "loss": 0.7378, + "mean_token_accuracy": 0.7773111522197723, + "num_tokens": 153540342.0, + "step": 45120 + }, + { + "epoch": 0.4529487333895379, + "learning_rate": 0.00010941226062868843, + "loss": 0.7293, + "mean_token_accuracy": 0.7838761627674102, + "num_tokens": 153574356.0, + "step": 45130 + }, + { + "epoch": 0.4530490987193384, + "learning_rate": 0.00010939218756272833, + "loss": 0.7543, + "mean_token_accuracy": 0.7750289261341095, + "num_tokens": 153609263.0, + "step": 45140 + }, + { + "epoch": 0.45314946404913886, + "learning_rate": 0.00010937211449676825, + "loss": 0.757, + "mean_token_accuracy": 0.771094697713852, + "num_tokens": 153644077.0, + "step": 45150 + }, + { + "epoch": 0.4532498293789393, + "learning_rate": 0.00010935204143080814, + "loss": 0.6772, + "mean_token_accuracy": 0.7960553526878357, + "num_tokens": 153678370.0, + "step": 45160 + }, + { + "epoch": 0.45335019470873983, + "learning_rate": 0.00010933196836484805, + "loss": 0.7351, + "mean_token_accuracy": 0.7795609951019287, + "num_tokens": 153713627.0, + "step": 45170 + }, + { + "epoch": 0.4534505600385403, + "learning_rate": 0.00010931189529888796, + "loss": 0.7204, + "mean_token_accuracy": 0.7858222723007202, + "num_tokens": 153749165.0, + "step": 45180 + }, + { + "epoch": 0.45355092536834074, + "learning_rate": 0.00010929182223292787, + "loss": 0.7185, + "mean_token_accuracy": 0.7809831619262695, + "num_tokens": 153783844.0, + "step": 45190 + }, + { + "epoch": 0.45365129069814125, + "learning_rate": 0.00010927174916696776, + "loss": 0.7588, + "mean_token_accuracy": 0.7743128657341003, + "num_tokens": 153819545.0, + "step": 45200 + }, + { + "epoch": 0.4537516560279417, + "learning_rate": 0.00010925167610100769, + "loss": 0.7398, + "mean_token_accuracy": 0.7764536440372467, + "num_tokens": 153854909.0, + "step": 45210 + }, + { + "epoch": 0.45385202135774216, + "learning_rate": 0.00010923160303504758, + "loss": 0.7376, + "mean_token_accuracy": 0.7779523968696594, + "num_tokens": 153888924.0, + "step": 45220 + }, + { + "epoch": 0.4539523866875427, + "learning_rate": 0.00010921152996908748, + "loss": 0.7594, + "mean_token_accuracy": 0.7741849064826966, + "num_tokens": 153923677.0, + "step": 45230 + }, + { + "epoch": 0.45405275201734313, + "learning_rate": 0.0001091914569031274, + "loss": 0.7667, + "mean_token_accuracy": 0.7729076683521271, + "num_tokens": 153958052.0, + "step": 45240 + }, + { + "epoch": 0.4541531173471436, + "learning_rate": 0.0001091713838371673, + "loss": 0.7289, + "mean_token_accuracy": 0.7829089462757111, + "num_tokens": 153993469.0, + "step": 45250 + }, + { + "epoch": 0.4542534826769441, + "learning_rate": 0.00010915131077120719, + "loss": 0.7414, + "mean_token_accuracy": 0.776902949810028, + "num_tokens": 154027804.0, + "step": 45260 + }, + { + "epoch": 0.45435384800674455, + "learning_rate": 0.00010913123770524711, + "loss": 0.7839, + "mean_token_accuracy": 0.7743165254592895, + "num_tokens": 154062293.0, + "step": 45270 + }, + { + "epoch": 0.454454213336545, + "learning_rate": 0.000109111164639287, + "loss": 0.7439, + "mean_token_accuracy": 0.7767428517341614, + "num_tokens": 154096430.0, + "step": 45280 + }, + { + "epoch": 0.4545545786663455, + "learning_rate": 0.00010909109157332691, + "loss": 0.7317, + "mean_token_accuracy": 0.7799388825893402, + "num_tokens": 154130176.0, + "step": 45290 + }, + { + "epoch": 0.454654943996146, + "learning_rate": 0.00010907101850736684, + "loss": 0.7365, + "mean_token_accuracy": 0.7814435422420501, + "num_tokens": 154165050.0, + "step": 45300 + }, + { + "epoch": 0.45475530932594643, + "learning_rate": 0.00010905094544140673, + "loss": 0.7404, + "mean_token_accuracy": 0.7786262392997741, + "num_tokens": 154201074.0, + "step": 45310 + }, + { + "epoch": 0.45485567465574694, + "learning_rate": 0.00010903087237544663, + "loss": 0.7584, + "mean_token_accuracy": 0.7741450905799866, + "num_tokens": 154235624.0, + "step": 45320 + }, + { + "epoch": 0.4549560399855474, + "learning_rate": 0.00010901079930948655, + "loss": 0.7304, + "mean_token_accuracy": 0.7823881149291992, + "num_tokens": 154270374.0, + "step": 45330 + }, + { + "epoch": 0.45505640531534786, + "learning_rate": 0.00010899072624352644, + "loss": 0.7514, + "mean_token_accuracy": 0.7742278933525085, + "num_tokens": 154305065.0, + "step": 45340 + }, + { + "epoch": 0.45515677064514837, + "learning_rate": 0.00010897065317756634, + "loss": 0.754, + "mean_token_accuracy": 0.7744691073894501, + "num_tokens": 154339332.0, + "step": 45350 + }, + { + "epoch": 0.4552571359749488, + "learning_rate": 0.00010895058011160626, + "loss": 0.7119, + "mean_token_accuracy": 0.785189688205719, + "num_tokens": 154374046.0, + "step": 45360 + }, + { + "epoch": 0.4553575013047493, + "learning_rate": 0.00010893050704564615, + "loss": 0.7178, + "mean_token_accuracy": 0.7814117550849915, + "num_tokens": 154409918.0, + "step": 45370 + }, + { + "epoch": 0.45545786663454974, + "learning_rate": 0.00010891043397968605, + "loss": 0.7421, + "mean_token_accuracy": 0.7787565946578979, + "num_tokens": 154444201.0, + "step": 45380 + }, + { + "epoch": 0.45555823196435025, + "learning_rate": 0.00010889036091372597, + "loss": 0.7259, + "mean_token_accuracy": 0.7825199484825134, + "num_tokens": 154479637.0, + "step": 45390 + }, + { + "epoch": 0.4556585972941507, + "learning_rate": 0.00010887028784776588, + "loss": 0.6876, + "mean_token_accuracy": 0.7944839775562287, + "num_tokens": 154514378.0, + "step": 45400 + }, + { + "epoch": 0.45575896262395116, + "learning_rate": 0.00010885021478180577, + "loss": 0.6979, + "mean_token_accuracy": 0.7917682349681854, + "num_tokens": 154549440.0, + "step": 45410 + }, + { + "epoch": 0.45585932795375167, + "learning_rate": 0.0001088301417158457, + "loss": 0.6868, + "mean_token_accuracy": 0.7883335769176483, + "num_tokens": 154583459.0, + "step": 45420 + }, + { + "epoch": 0.4559596932835521, + "learning_rate": 0.00010881006864988559, + "loss": 0.7167, + "mean_token_accuracy": 0.7852450430393219, + "num_tokens": 154618681.0, + "step": 45430 + }, + { + "epoch": 0.4560600586133526, + "learning_rate": 0.00010878999558392549, + "loss": 0.7006, + "mean_token_accuracy": 0.7889388144016266, + "num_tokens": 154655079.0, + "step": 45440 + }, + { + "epoch": 0.4561604239431531, + "learning_rate": 0.00010876992251796541, + "loss": 0.7173, + "mean_token_accuracy": 0.7862299740314483, + "num_tokens": 154689987.0, + "step": 45450 + }, + { + "epoch": 0.45626078927295355, + "learning_rate": 0.0001087498494520053, + "loss": 0.7543, + "mean_token_accuracy": 0.7773892939090729, + "num_tokens": 154725531.0, + "step": 45460 + }, + { + "epoch": 0.456361154602754, + "learning_rate": 0.0001087297763860452, + "loss": 0.6791, + "mean_token_accuracy": 0.79625204205513, + "num_tokens": 154760949.0, + "step": 45470 + }, + { + "epoch": 0.4564615199325545, + "learning_rate": 0.00010870970332008512, + "loss": 0.7394, + "mean_token_accuracy": 0.7802935123443604, + "num_tokens": 154795596.0, + "step": 45480 + }, + { + "epoch": 0.45656188526235497, + "learning_rate": 0.00010868963025412501, + "loss": 0.69, + "mean_token_accuracy": 0.7932131230831146, + "num_tokens": 154831966.0, + "step": 45490 + }, + { + "epoch": 0.4566622505921554, + "learning_rate": 0.00010866955718816492, + "loss": 0.7384, + "mean_token_accuracy": 0.781095540523529, + "num_tokens": 154867253.0, + "step": 45500 + }, + { + "epoch": 0.45676261592195594, + "learning_rate": 0.00010864948412220483, + "loss": 0.7215, + "mean_token_accuracy": 0.7840093016624451, + "num_tokens": 154900976.0, + "step": 45510 + }, + { + "epoch": 0.4568629812517564, + "learning_rate": 0.00010862941105624474, + "loss": 0.6961, + "mean_token_accuracy": 0.7899511754512787, + "num_tokens": 154935158.0, + "step": 45520 + }, + { + "epoch": 0.45696334658155685, + "learning_rate": 0.00010860933799028463, + "loss": 0.7339, + "mean_token_accuracy": 0.7798848330974579, + "num_tokens": 154970636.0, + "step": 45530 + }, + { + "epoch": 0.45706371191135736, + "learning_rate": 0.00010858926492432456, + "loss": 0.7331, + "mean_token_accuracy": 0.7831038177013397, + "num_tokens": 155006127.0, + "step": 45540 + }, + { + "epoch": 0.4571640772411578, + "learning_rate": 0.00010856919185836445, + "loss": 0.7258, + "mean_token_accuracy": 0.783970981836319, + "num_tokens": 155040627.0, + "step": 45550 + }, + { + "epoch": 0.4572644425709583, + "learning_rate": 0.00010854911879240435, + "loss": 0.677, + "mean_token_accuracy": 0.797710633277893, + "num_tokens": 155075643.0, + "step": 45560 + }, + { + "epoch": 0.4573648079007588, + "learning_rate": 0.00010852904572644427, + "loss": 0.7518, + "mean_token_accuracy": 0.7771606564521789, + "num_tokens": 155110559.0, + "step": 45570 + }, + { + "epoch": 0.45746517323055924, + "learning_rate": 0.00010850897266048416, + "loss": 0.7317, + "mean_token_accuracy": 0.7806562066078186, + "num_tokens": 155145920.0, + "step": 45580 + }, + { + "epoch": 0.4575655385603597, + "learning_rate": 0.00010848889959452406, + "loss": 0.6945, + "mean_token_accuracy": 0.7896435856819153, + "num_tokens": 155181887.0, + "step": 45590 + }, + { + "epoch": 0.4576659038901602, + "learning_rate": 0.00010846882652856398, + "loss": 0.7561, + "mean_token_accuracy": 0.7798638761043548, + "num_tokens": 155216768.0, + "step": 45600 + }, + { + "epoch": 0.45776626921996066, + "learning_rate": 0.00010844875346260388, + "loss": 0.719, + "mean_token_accuracy": 0.7846980154514313, + "num_tokens": 155250378.0, + "step": 45610 + }, + { + "epoch": 0.4578666345497611, + "learning_rate": 0.00010842868039664378, + "loss": 0.7079, + "mean_token_accuracy": 0.7912899911403656, + "num_tokens": 155285650.0, + "step": 45620 + }, + { + "epoch": 0.45796699987956163, + "learning_rate": 0.00010840860733068369, + "loss": 0.6993, + "mean_token_accuracy": 0.7907711029052734, + "num_tokens": 155319932.0, + "step": 45630 + }, + { + "epoch": 0.4580673652093621, + "learning_rate": 0.0001083885342647236, + "loss": 0.6954, + "mean_token_accuracy": 0.7919665277004242, + "num_tokens": 155354891.0, + "step": 45640 + }, + { + "epoch": 0.45816773053916254, + "learning_rate": 0.0001083684611987635, + "loss": 0.7217, + "mean_token_accuracy": 0.7810214936733246, + "num_tokens": 155390599.0, + "step": 45650 + }, + { + "epoch": 0.458268095868963, + "learning_rate": 0.00010834838813280342, + "loss": 0.7328, + "mean_token_accuracy": 0.7812167346477509, + "num_tokens": 155426956.0, + "step": 45660 + }, + { + "epoch": 0.4583684611987635, + "learning_rate": 0.00010832831506684331, + "loss": 0.7415, + "mean_token_accuracy": 0.775298398733139, + "num_tokens": 155461457.0, + "step": 45670 + }, + { + "epoch": 0.45846882652856397, + "learning_rate": 0.00010830824200088323, + "loss": 0.7573, + "mean_token_accuracy": 0.7747935891151428, + "num_tokens": 155496523.0, + "step": 45680 + }, + { + "epoch": 0.4585691918583644, + "learning_rate": 0.00010828816893492313, + "loss": 0.7088, + "mean_token_accuracy": 0.7924448072910308, + "num_tokens": 155531567.0, + "step": 45690 + }, + { + "epoch": 0.45866955718816493, + "learning_rate": 0.00010826809586896302, + "loss": 0.7197, + "mean_token_accuracy": 0.7861683249473572, + "num_tokens": 155567009.0, + "step": 45700 + }, + { + "epoch": 0.4587699225179654, + "learning_rate": 0.00010824802280300295, + "loss": 0.7209, + "mean_token_accuracy": 0.7828059613704681, + "num_tokens": 155601500.0, + "step": 45710 + }, + { + "epoch": 0.45887028784776585, + "learning_rate": 0.00010822794973704284, + "loss": 0.6994, + "mean_token_accuracy": 0.7851306378841401, + "num_tokens": 155637849.0, + "step": 45720 + }, + { + "epoch": 0.45897065317756636, + "learning_rate": 0.00010820787667108274, + "loss": 0.7675, + "mean_token_accuracy": 0.7704609274864197, + "num_tokens": 155672443.0, + "step": 45730 + }, + { + "epoch": 0.4590710185073668, + "learning_rate": 0.00010818780360512266, + "loss": 0.7471, + "mean_token_accuracy": 0.7772091090679168, + "num_tokens": 155707804.0, + "step": 45740 + }, + { + "epoch": 0.45917138383716727, + "learning_rate": 0.00010816773053916257, + "loss": 0.7221, + "mean_token_accuracy": 0.7843359291553498, + "num_tokens": 155742610.0, + "step": 45750 + }, + { + "epoch": 0.4592717491669678, + "learning_rate": 0.00010814765747320246, + "loss": 0.7159, + "mean_token_accuracy": 0.78268381357193, + "num_tokens": 155777374.0, + "step": 45760 + }, + { + "epoch": 0.45937211449676824, + "learning_rate": 0.00010812758440724238, + "loss": 0.7114, + "mean_token_accuracy": 0.7857536256313324, + "num_tokens": 155812932.0, + "step": 45770 + }, + { + "epoch": 0.4594724798265687, + "learning_rate": 0.00010810751134128228, + "loss": 0.712, + "mean_token_accuracy": 0.7849782645702362, + "num_tokens": 155848264.0, + "step": 45780 + }, + { + "epoch": 0.4595728451563692, + "learning_rate": 0.00010808743827532217, + "loss": 0.7135, + "mean_token_accuracy": 0.7836347043514251, + "num_tokens": 155883947.0, + "step": 45790 + }, + { + "epoch": 0.45967321048616966, + "learning_rate": 0.0001080673652093621, + "loss": 0.7009, + "mean_token_accuracy": 0.7856990694999695, + "num_tokens": 155919399.0, + "step": 45800 + }, + { + "epoch": 0.4597735758159701, + "learning_rate": 0.00010804729214340199, + "loss": 0.6993, + "mean_token_accuracy": 0.7913999378681182, + "num_tokens": 155954288.0, + "step": 45810 + }, + { + "epoch": 0.4598739411457706, + "learning_rate": 0.00010802721907744188, + "loss": 0.7121, + "mean_token_accuracy": 0.7861483752727508, + "num_tokens": 155989524.0, + "step": 45820 + }, + { + "epoch": 0.4599743064755711, + "learning_rate": 0.0001080071460114818, + "loss": 0.7216, + "mean_token_accuracy": 0.7861035943031311, + "num_tokens": 156024902.0, + "step": 45830 + }, + { + "epoch": 0.46007467180537154, + "learning_rate": 0.0001079870729455217, + "loss": 0.678, + "mean_token_accuracy": 0.796373850107193, + "num_tokens": 156060776.0, + "step": 45840 + }, + { + "epoch": 0.46017503713517205, + "learning_rate": 0.00010796699987956161, + "loss": 0.7376, + "mean_token_accuracy": 0.7753163158893586, + "num_tokens": 156094988.0, + "step": 45850 + }, + { + "epoch": 0.4602754024649725, + "learning_rate": 0.00010794692681360152, + "loss": 0.7073, + "mean_token_accuracy": 0.7867257773876191, + "num_tokens": 156130118.0, + "step": 45860 + }, + { + "epoch": 0.46037576779477296, + "learning_rate": 0.00010792685374764143, + "loss": 0.714, + "mean_token_accuracy": 0.7838221549987793, + "num_tokens": 156164745.0, + "step": 45870 + }, + { + "epoch": 0.4604761331245735, + "learning_rate": 0.00010790678068168132, + "loss": 0.705, + "mean_token_accuracy": 0.7828870356082916, + "num_tokens": 156200350.0, + "step": 45880 + }, + { + "epoch": 0.46057649845437393, + "learning_rate": 0.00010788670761572124, + "loss": 0.6883, + "mean_token_accuracy": 0.7931342422962189, + "num_tokens": 156236015.0, + "step": 45890 + }, + { + "epoch": 0.4606768637841744, + "learning_rate": 0.00010786663454976114, + "loss": 0.7284, + "mean_token_accuracy": 0.7817682504653931, + "num_tokens": 156272743.0, + "step": 45900 + }, + { + "epoch": 0.4607772291139749, + "learning_rate": 0.00010784656148380103, + "loss": 0.7142, + "mean_token_accuracy": 0.7831542611122131, + "num_tokens": 156308985.0, + "step": 45910 + }, + { + "epoch": 0.46087759444377535, + "learning_rate": 0.00010782648841784096, + "loss": 0.7159, + "mean_token_accuracy": 0.7871647775173187, + "num_tokens": 156343738.0, + "step": 45920 + }, + { + "epoch": 0.4609779597735758, + "learning_rate": 0.00010780641535188085, + "loss": 0.7162, + "mean_token_accuracy": 0.7845615029335022, + "num_tokens": 156379077.0, + "step": 45930 + }, + { + "epoch": 0.46107832510337626, + "learning_rate": 0.00010778634228592075, + "loss": 0.7375, + "mean_token_accuracy": 0.7808549463748932, + "num_tokens": 156414109.0, + "step": 45940 + }, + { + "epoch": 0.4611786904331768, + "learning_rate": 0.00010776626921996067, + "loss": 0.708, + "mean_token_accuracy": 0.7884536445140838, + "num_tokens": 156449434.0, + "step": 45950 + }, + { + "epoch": 0.46127905576297723, + "learning_rate": 0.00010774619615400056, + "loss": 0.6897, + "mean_token_accuracy": 0.7883106231689453, + "num_tokens": 156484881.0, + "step": 45960 + }, + { + "epoch": 0.4613794210927777, + "learning_rate": 0.00010772612308804047, + "loss": 0.72, + "mean_token_accuracy": 0.7828457951545715, + "num_tokens": 156520355.0, + "step": 45970 + }, + { + "epoch": 0.4614797864225782, + "learning_rate": 0.00010770605002208038, + "loss": 0.6935, + "mean_token_accuracy": 0.7907245039939881, + "num_tokens": 156555662.0, + "step": 45980 + }, + { + "epoch": 0.46158015175237865, + "learning_rate": 0.00010768597695612029, + "loss": 0.7392, + "mean_token_accuracy": 0.7876706302165986, + "num_tokens": 156590255.0, + "step": 45990 + }, + { + "epoch": 0.4616805170821791, + "learning_rate": 0.00010766590389016018, + "loss": 0.7175, + "mean_token_accuracy": 0.790300065279007, + "num_tokens": 156625458.0, + "step": 46000 + }, + { + "epoch": 0.4617808824119796, + "learning_rate": 0.0001076458308242001, + "loss": 0.7247, + "mean_token_accuracy": 0.784890878200531, + "num_tokens": 156662011.0, + "step": 46010 + }, + { + "epoch": 0.4618812477417801, + "learning_rate": 0.00010762575775824, + "loss": 0.7045, + "mean_token_accuracy": 0.7865753948688508, + "num_tokens": 156697122.0, + "step": 46020 + }, + { + "epoch": 0.46198161307158053, + "learning_rate": 0.0001076056846922799, + "loss": 0.7179, + "mean_token_accuracy": 0.7825608730316163, + "num_tokens": 156732175.0, + "step": 46030 + }, + { + "epoch": 0.46208197840138104, + "learning_rate": 0.00010758561162631982, + "loss": 0.705, + "mean_token_accuracy": 0.7832401931285858, + "num_tokens": 156767635.0, + "step": 46040 + }, + { + "epoch": 0.4621823437311815, + "learning_rate": 0.00010756553856035971, + "loss": 0.7308, + "mean_token_accuracy": 0.780849301815033, + "num_tokens": 156801943.0, + "step": 46050 + }, + { + "epoch": 0.46228270906098196, + "learning_rate": 0.0001075454654943996, + "loss": 0.7358, + "mean_token_accuracy": 0.7800325095653534, + "num_tokens": 156836748.0, + "step": 46060 + }, + { + "epoch": 0.46238307439078247, + "learning_rate": 0.00010752539242843953, + "loss": 0.6611, + "mean_token_accuracy": 0.7982037842273713, + "num_tokens": 156872539.0, + "step": 46070 + }, + { + "epoch": 0.4624834397205829, + "learning_rate": 0.00010750531936247942, + "loss": 0.72, + "mean_token_accuracy": 0.7860180675983429, + "num_tokens": 156907083.0, + "step": 46080 + }, + { + "epoch": 0.4625838050503834, + "learning_rate": 0.00010748524629651933, + "loss": 0.7332, + "mean_token_accuracy": 0.7771995067596436, + "num_tokens": 156942262.0, + "step": 46090 + }, + { + "epoch": 0.4626841703801839, + "learning_rate": 0.00010746517323055925, + "loss": 0.7231, + "mean_token_accuracy": 0.7848806202411651, + "num_tokens": 156978630.0, + "step": 46100 + }, + { + "epoch": 0.46278453570998435, + "learning_rate": 0.00010744510016459915, + "loss": 0.7335, + "mean_token_accuracy": 0.7821138381958008, + "num_tokens": 157013098.0, + "step": 46110 + }, + { + "epoch": 0.4628849010397848, + "learning_rate": 0.00010742502709863904, + "loss": 0.7254, + "mean_token_accuracy": 0.7811341166496277, + "num_tokens": 157047915.0, + "step": 46120 + }, + { + "epoch": 0.4629852663695853, + "learning_rate": 0.00010740495403267896, + "loss": 0.6864, + "mean_token_accuracy": 0.7955152571201325, + "num_tokens": 157083690.0, + "step": 46130 + }, + { + "epoch": 0.46308563169938577, + "learning_rate": 0.00010738488096671886, + "loss": 0.705, + "mean_token_accuracy": 0.7844863951206207, + "num_tokens": 157118204.0, + "step": 46140 + }, + { + "epoch": 0.4631859970291862, + "learning_rate": 0.00010736480790075875, + "loss": 0.6849, + "mean_token_accuracy": 0.7934133410453796, + "num_tokens": 157152228.0, + "step": 46150 + }, + { + "epoch": 0.46328636235898674, + "learning_rate": 0.00010734473483479868, + "loss": 0.7248, + "mean_token_accuracy": 0.7831818222999573, + "num_tokens": 157188068.0, + "step": 46160 + }, + { + "epoch": 0.4633867276887872, + "learning_rate": 0.00010732466176883857, + "loss": 0.6677, + "mean_token_accuracy": 0.7984673023223877, + "num_tokens": 157223352.0, + "step": 46170 + }, + { + "epoch": 0.46348709301858765, + "learning_rate": 0.00010730458870287847, + "loss": 0.6803, + "mean_token_accuracy": 0.796294242143631, + "num_tokens": 157258284.0, + "step": 46180 + }, + { + "epoch": 0.46358745834838816, + "learning_rate": 0.00010728451563691839, + "loss": 0.6924, + "mean_token_accuracy": 0.7861761391162873, + "num_tokens": 157293501.0, + "step": 46190 + }, + { + "epoch": 0.4636878236781886, + "learning_rate": 0.0001072644425709583, + "loss": 0.688, + "mean_token_accuracy": 0.7971710205078125, + "num_tokens": 157330040.0, + "step": 46200 + }, + { + "epoch": 0.46378818900798907, + "learning_rate": 0.00010724436950499819, + "loss": 0.6885, + "mean_token_accuracy": 0.7873896420001983, + "num_tokens": 157365148.0, + "step": 46210 + }, + { + "epoch": 0.4638885543377895, + "learning_rate": 0.00010722429643903811, + "loss": 0.7051, + "mean_token_accuracy": 0.7853258192539215, + "num_tokens": 157401536.0, + "step": 46220 + }, + { + "epoch": 0.46398891966759004, + "learning_rate": 0.00010720422337307801, + "loss": 0.7102, + "mean_token_accuracy": 0.7846766710281372, + "num_tokens": 157436736.0, + "step": 46230 + }, + { + "epoch": 0.4640892849973905, + "learning_rate": 0.00010718415030711793, + "loss": 0.7403, + "mean_token_accuracy": 0.7822953999042511, + "num_tokens": 157471551.0, + "step": 46240 + }, + { + "epoch": 0.46418965032719095, + "learning_rate": 0.00010716407724115783, + "loss": 0.6797, + "mean_token_accuracy": 0.7962810456752777, + "num_tokens": 157507143.0, + "step": 46250 + }, + { + "epoch": 0.46429001565699146, + "learning_rate": 0.00010714400417519772, + "loss": 0.6965, + "mean_token_accuracy": 0.7917849063873291, + "num_tokens": 157543095.0, + "step": 46260 + }, + { + "epoch": 0.4643903809867919, + "learning_rate": 0.00010712393110923764, + "loss": 0.7074, + "mean_token_accuracy": 0.7860041975975036, + "num_tokens": 157578818.0, + "step": 46270 + }, + { + "epoch": 0.4644907463165924, + "learning_rate": 0.00010710385804327754, + "loss": 0.7194, + "mean_token_accuracy": 0.7866369724273682, + "num_tokens": 157613086.0, + "step": 46280 + }, + { + "epoch": 0.4645911116463929, + "learning_rate": 0.00010708378497731743, + "loss": 0.7323, + "mean_token_accuracy": 0.7846727252006531, + "num_tokens": 157647792.0, + "step": 46290 + }, + { + "epoch": 0.46469147697619334, + "learning_rate": 0.00010706371191135735, + "loss": 0.75, + "mean_token_accuracy": 0.7749805808067322, + "num_tokens": 157683453.0, + "step": 46300 + }, + { + "epoch": 0.4647918423059938, + "learning_rate": 0.00010704363884539725, + "loss": 0.681, + "mean_token_accuracy": 0.7935085654258728, + "num_tokens": 157719305.0, + "step": 46310 + }, + { + "epoch": 0.4648922076357943, + "learning_rate": 0.00010702356577943716, + "loss": 0.7045, + "mean_token_accuracy": 0.79261554479599, + "num_tokens": 157754832.0, + "step": 46320 + }, + { + "epoch": 0.46499257296559476, + "learning_rate": 0.00010700349271347707, + "loss": 0.673, + "mean_token_accuracy": 0.7986871778964997, + "num_tokens": 157789464.0, + "step": 46330 + }, + { + "epoch": 0.4650929382953952, + "learning_rate": 0.00010698341964751697, + "loss": 0.687, + "mean_token_accuracy": 0.7916176676750183, + "num_tokens": 157824600.0, + "step": 46340 + }, + { + "epoch": 0.46519330362519573, + "learning_rate": 0.00010696334658155687, + "loss": 0.7182, + "mean_token_accuracy": 0.7853668570518494, + "num_tokens": 157858964.0, + "step": 46350 + }, + { + "epoch": 0.4652936689549962, + "learning_rate": 0.00010694327351559679, + "loss": 0.7119, + "mean_token_accuracy": 0.7871406614780426, + "num_tokens": 157894188.0, + "step": 46360 + }, + { + "epoch": 0.46539403428479664, + "learning_rate": 0.00010692320044963669, + "loss": 0.7194, + "mean_token_accuracy": 0.786019378900528, + "num_tokens": 157929823.0, + "step": 46370 + }, + { + "epoch": 0.46549439961459715, + "learning_rate": 0.00010690312738367658, + "loss": 0.6977, + "mean_token_accuracy": 0.7925242602825164, + "num_tokens": 157964698.0, + "step": 46380 + }, + { + "epoch": 0.4655947649443976, + "learning_rate": 0.0001068830543177165, + "loss": 0.7354, + "mean_token_accuracy": 0.784424090385437, + "num_tokens": 157999845.0, + "step": 46390 + }, + { + "epoch": 0.46569513027419807, + "learning_rate": 0.0001068629812517564, + "loss": 0.7034, + "mean_token_accuracy": 0.7869425654411316, + "num_tokens": 158035108.0, + "step": 46400 + }, + { + "epoch": 0.4657954956039986, + "learning_rate": 0.00010684290818579629, + "loss": 0.703, + "mean_token_accuracy": 0.7890412390232087, + "num_tokens": 158070592.0, + "step": 46410 + }, + { + "epoch": 0.46589586093379903, + "learning_rate": 0.00010682283511983621, + "loss": 0.6805, + "mean_token_accuracy": 0.7949465453624726, + "num_tokens": 158105994.0, + "step": 46420 + }, + { + "epoch": 0.4659962262635995, + "learning_rate": 0.00010680276205387611, + "loss": 0.7034, + "mean_token_accuracy": 0.7892135560512543, + "num_tokens": 158142003.0, + "step": 46430 + }, + { + "epoch": 0.4660965915934, + "learning_rate": 0.00010678268898791602, + "loss": 0.6919, + "mean_token_accuracy": 0.7986708045005798, + "num_tokens": 158177831.0, + "step": 46440 + }, + { + "epoch": 0.46619695692320046, + "learning_rate": 0.00010676261592195593, + "loss": 0.7129, + "mean_token_accuracy": 0.7889884889125824, + "num_tokens": 158212578.0, + "step": 46450 + }, + { + "epoch": 0.4662973222530009, + "learning_rate": 0.00010674254285599583, + "loss": 0.7223, + "mean_token_accuracy": 0.7806691288948059, + "num_tokens": 158247415.0, + "step": 46460 + }, + { + "epoch": 0.4663976875828014, + "learning_rate": 0.00010672246979003573, + "loss": 0.73, + "mean_token_accuracy": 0.7802925348281861, + "num_tokens": 158283404.0, + "step": 46470 + }, + { + "epoch": 0.4664980529126019, + "learning_rate": 0.00010670239672407565, + "loss": 0.7161, + "mean_token_accuracy": 0.7881710827350616, + "num_tokens": 158318305.0, + "step": 46480 + }, + { + "epoch": 0.46659841824240234, + "learning_rate": 0.00010668232365811555, + "loss": 0.6878, + "mean_token_accuracy": 0.7952527344226837, + "num_tokens": 158353990.0, + "step": 46490 + }, + { + "epoch": 0.4666987835722028, + "learning_rate": 0.00010666225059215544, + "loss": 0.6749, + "mean_token_accuracy": 0.7952859818935394, + "num_tokens": 158389377.0, + "step": 46500 + }, + { + "epoch": 0.4667991489020033, + "learning_rate": 0.00010664217752619536, + "loss": 0.6919, + "mean_token_accuracy": 0.790702360868454, + "num_tokens": 158423925.0, + "step": 46510 + }, + { + "epoch": 0.46689951423180376, + "learning_rate": 0.00010662210446023526, + "loss": 0.6766, + "mean_token_accuracy": 0.7953005731105804, + "num_tokens": 158459573.0, + "step": 46520 + }, + { + "epoch": 0.4669998795616042, + "learning_rate": 0.00010660203139427515, + "loss": 0.7178, + "mean_token_accuracy": 0.7834354937076569, + "num_tokens": 158494715.0, + "step": 46530 + }, + { + "epoch": 0.4671002448914047, + "learning_rate": 0.00010658195832831508, + "loss": 0.7163, + "mean_token_accuracy": 0.7839456260204315, + "num_tokens": 158530318.0, + "step": 46540 + }, + { + "epoch": 0.4672006102212052, + "learning_rate": 0.00010656188526235498, + "loss": 0.6858, + "mean_token_accuracy": 0.795786327123642, + "num_tokens": 158566561.0, + "step": 46550 + }, + { + "epoch": 0.46730097555100564, + "learning_rate": 0.00010654181219639488, + "loss": 0.7185, + "mean_token_accuracy": 0.7875998079776764, + "num_tokens": 158602989.0, + "step": 46560 + }, + { + "epoch": 0.46740134088080615, + "learning_rate": 0.0001065217391304348, + "loss": 0.7199, + "mean_token_accuracy": 0.782318115234375, + "num_tokens": 158637538.0, + "step": 46570 + }, + { + "epoch": 0.4675017062106066, + "learning_rate": 0.0001065016660644747, + "loss": 0.7044, + "mean_token_accuracy": 0.7850953221321106, + "num_tokens": 158672562.0, + "step": 46580 + }, + { + "epoch": 0.46760207154040706, + "learning_rate": 0.00010648159299851459, + "loss": 0.6886, + "mean_token_accuracy": 0.7909720003604889, + "num_tokens": 158708099.0, + "step": 46590 + }, + { + "epoch": 0.46770243687020757, + "learning_rate": 0.00010646151993255451, + "loss": 0.7244, + "mean_token_accuracy": 0.7835875153541565, + "num_tokens": 158744023.0, + "step": 46600 + }, + { + "epoch": 0.467802802200008, + "learning_rate": 0.00010644144686659441, + "loss": 0.6923, + "mean_token_accuracy": 0.7904627203941346, + "num_tokens": 158780913.0, + "step": 46610 + }, + { + "epoch": 0.4679031675298085, + "learning_rate": 0.0001064213738006343, + "loss": 0.7, + "mean_token_accuracy": 0.7869254350662231, + "num_tokens": 158815378.0, + "step": 46620 + }, + { + "epoch": 0.468003532859609, + "learning_rate": 0.00010640130073467422, + "loss": 0.698, + "mean_token_accuracy": 0.7847469210624695, + "num_tokens": 158850652.0, + "step": 46630 + }, + { + "epoch": 0.46810389818940945, + "learning_rate": 0.00010638122766871412, + "loss": 0.729, + "mean_token_accuracy": 0.7812280833721161, + "num_tokens": 158885127.0, + "step": 46640 + }, + { + "epoch": 0.4682042635192099, + "learning_rate": 0.00010636115460275403, + "loss": 0.7087, + "mean_token_accuracy": 0.7840165257453918, + "num_tokens": 158920160.0, + "step": 46650 + }, + { + "epoch": 0.4683046288490104, + "learning_rate": 0.00010634108153679394, + "loss": 0.6999, + "mean_token_accuracy": 0.7896547734737396, + "num_tokens": 158956129.0, + "step": 46660 + }, + { + "epoch": 0.4684049941788109, + "learning_rate": 0.00010632100847083384, + "loss": 0.6897, + "mean_token_accuracy": 0.7955524504184723, + "num_tokens": 158992607.0, + "step": 46670 + }, + { + "epoch": 0.46850535950861133, + "learning_rate": 0.00010630093540487374, + "loss": 0.688, + "mean_token_accuracy": 0.791974002122879, + "num_tokens": 159028574.0, + "step": 46680 + }, + { + "epoch": 0.46860572483841184, + "learning_rate": 0.00010628086233891366, + "loss": 0.6904, + "mean_token_accuracy": 0.7901484429836273, + "num_tokens": 159063310.0, + "step": 46690 + }, + { + "epoch": 0.4687060901682123, + "learning_rate": 0.00010626078927295356, + "loss": 0.6924, + "mean_token_accuracy": 0.7883610904216767, + "num_tokens": 159098102.0, + "step": 46700 + }, + { + "epoch": 0.46880645549801275, + "learning_rate": 0.00010624071620699345, + "loss": 0.7042, + "mean_token_accuracy": 0.7841535389423371, + "num_tokens": 159133043.0, + "step": 46710 + }, + { + "epoch": 0.46890682082781326, + "learning_rate": 0.00010622064314103337, + "loss": 0.7399, + "mean_token_accuracy": 0.7765646338462829, + "num_tokens": 159168109.0, + "step": 46720 + }, + { + "epoch": 0.4690071861576137, + "learning_rate": 0.00010620057007507327, + "loss": 0.6987, + "mean_token_accuracy": 0.7861594557762146, + "num_tokens": 159203514.0, + "step": 46730 + }, + { + "epoch": 0.4691075514874142, + "learning_rate": 0.00010618049700911316, + "loss": 0.6795, + "mean_token_accuracy": 0.7951503574848175, + "num_tokens": 159239365.0, + "step": 46740 + }, + { + "epoch": 0.4692079168172147, + "learning_rate": 0.00010616042394315308, + "loss": 0.7216, + "mean_token_accuracy": 0.7838666141033173, + "num_tokens": 159275307.0, + "step": 46750 + }, + { + "epoch": 0.46930828214701514, + "learning_rate": 0.00010614035087719298, + "loss": 0.707, + "mean_token_accuracy": 0.7920927166938782, + "num_tokens": 159310176.0, + "step": 46760 + }, + { + "epoch": 0.4694086474768156, + "learning_rate": 0.00010612027781123289, + "loss": 0.7161, + "mean_token_accuracy": 0.785585218667984, + "num_tokens": 159345957.0, + "step": 46770 + }, + { + "epoch": 0.46950901280661606, + "learning_rate": 0.0001061002047452728, + "loss": 0.7228, + "mean_token_accuracy": 0.7791460871696472, + "num_tokens": 159380901.0, + "step": 46780 + }, + { + "epoch": 0.46960937813641657, + "learning_rate": 0.0001060801316793127, + "loss": 0.7145, + "mean_token_accuracy": 0.7856329619884491, + "num_tokens": 159415532.0, + "step": 46790 + }, + { + "epoch": 0.469709743466217, + "learning_rate": 0.0001060600586133526, + "loss": 0.6804, + "mean_token_accuracy": 0.7934350728988647, + "num_tokens": 159451370.0, + "step": 46800 + }, + { + "epoch": 0.4698101087960175, + "learning_rate": 0.00010603998554739252, + "loss": 0.7475, + "mean_token_accuracy": 0.7766209721565247, + "num_tokens": 159486342.0, + "step": 46810 + }, + { + "epoch": 0.469910474125818, + "learning_rate": 0.00010601991248143242, + "loss": 0.7309, + "mean_token_accuracy": 0.7836766362190246, + "num_tokens": 159521532.0, + "step": 46820 + }, + { + "epoch": 0.47001083945561845, + "learning_rate": 0.00010599983941547234, + "loss": 0.7163, + "mean_token_accuracy": 0.7804810166358948, + "num_tokens": 159557383.0, + "step": 46830 + }, + { + "epoch": 0.4701112047854189, + "learning_rate": 0.00010597976634951223, + "loss": 0.7222, + "mean_token_accuracy": 0.7816921055316925, + "num_tokens": 159592790.0, + "step": 46840 + }, + { + "epoch": 0.4702115701152194, + "learning_rate": 0.00010595969328355213, + "loss": 0.7286, + "mean_token_accuracy": 0.783270001411438, + "num_tokens": 159629078.0, + "step": 46850 + }, + { + "epoch": 0.47031193544501987, + "learning_rate": 0.00010593962021759205, + "loss": 0.7284, + "mean_token_accuracy": 0.7808925092220307, + "num_tokens": 159665237.0, + "step": 46860 + }, + { + "epoch": 0.4704123007748203, + "learning_rate": 0.00010591954715163195, + "loss": 0.6923, + "mean_token_accuracy": 0.7907767117023468, + "num_tokens": 159700427.0, + "step": 46870 + }, + { + "epoch": 0.47051266610462084, + "learning_rate": 0.00010589947408567184, + "loss": 0.7066, + "mean_token_accuracy": 0.787431925535202, + "num_tokens": 159735443.0, + "step": 46880 + }, + { + "epoch": 0.4706130314344213, + "learning_rate": 0.00010587940101971176, + "loss": 0.7247, + "mean_token_accuracy": 0.7834123134613037, + "num_tokens": 159771058.0, + "step": 46890 + }, + { + "epoch": 0.47071339676422175, + "learning_rate": 0.00010585932795375167, + "loss": 0.7399, + "mean_token_accuracy": 0.7818175792694092, + "num_tokens": 159805741.0, + "step": 46900 + }, + { + "epoch": 0.47081376209402226, + "learning_rate": 0.00010583925488779157, + "loss": 0.6757, + "mean_token_accuracy": 0.7935092628002167, + "num_tokens": 159840654.0, + "step": 46910 + }, + { + "epoch": 0.4709141274238227, + "learning_rate": 0.00010581918182183149, + "loss": 0.7174, + "mean_token_accuracy": 0.781839793920517, + "num_tokens": 159875540.0, + "step": 46920 + }, + { + "epoch": 0.47101449275362317, + "learning_rate": 0.00010579910875587138, + "loss": 0.7264, + "mean_token_accuracy": 0.7855076014995575, + "num_tokens": 159911077.0, + "step": 46930 + }, + { + "epoch": 0.4711148580834237, + "learning_rate": 0.00010577903568991128, + "loss": 0.7224, + "mean_token_accuracy": 0.7857255399227142, + "num_tokens": 159946051.0, + "step": 46940 + }, + { + "epoch": 0.47121522341322414, + "learning_rate": 0.0001057589626239512, + "loss": 0.7131, + "mean_token_accuracy": 0.7874164462089539, + "num_tokens": 159980596.0, + "step": 46950 + }, + { + "epoch": 0.4713155887430246, + "learning_rate": 0.0001057388895579911, + "loss": 0.697, + "mean_token_accuracy": 0.7895408928394317, + "num_tokens": 160015468.0, + "step": 46960 + }, + { + "epoch": 0.4714159540728251, + "learning_rate": 0.00010571881649203099, + "loss": 0.6808, + "mean_token_accuracy": 0.794541311264038, + "num_tokens": 160051232.0, + "step": 46970 + }, + { + "epoch": 0.47151631940262556, + "learning_rate": 0.00010569874342607091, + "loss": 0.6809, + "mean_token_accuracy": 0.7936924457550049, + "num_tokens": 160086443.0, + "step": 46980 + }, + { + "epoch": 0.471616684732426, + "learning_rate": 0.0001056786703601108, + "loss": 0.7042, + "mean_token_accuracy": 0.7852703154087066, + "num_tokens": 160121781.0, + "step": 46990 + }, + { + "epoch": 0.47171705006222653, + "learning_rate": 0.00010565859729415071, + "loss": 0.7128, + "mean_token_accuracy": 0.7857403755187988, + "num_tokens": 160157537.0, + "step": 47000 + }, + { + "epoch": 0.471817415392027, + "learning_rate": 0.00010563852422819062, + "loss": 0.701, + "mean_token_accuracy": 0.7863259792327881, + "num_tokens": 160192578.0, + "step": 47010 + }, + { + "epoch": 0.47191778072182744, + "learning_rate": 0.00010561845116223053, + "loss": 0.7109, + "mean_token_accuracy": 0.790937626361847, + "num_tokens": 160227880.0, + "step": 47020 + }, + { + "epoch": 0.47201814605162795, + "learning_rate": 0.00010559837809627043, + "loss": 0.6927, + "mean_token_accuracy": 0.7863008499145507, + "num_tokens": 160263157.0, + "step": 47030 + }, + { + "epoch": 0.4721185113814284, + "learning_rate": 0.00010557830503031035, + "loss": 0.6976, + "mean_token_accuracy": 0.7901015520095825, + "num_tokens": 160298414.0, + "step": 47040 + }, + { + "epoch": 0.47221887671122886, + "learning_rate": 0.00010555823196435024, + "loss": 0.7208, + "mean_token_accuracy": 0.7872840464115143, + "num_tokens": 160333241.0, + "step": 47050 + }, + { + "epoch": 0.4723192420410293, + "learning_rate": 0.00010553815889839014, + "loss": 0.6925, + "mean_token_accuracy": 0.7923729300498963, + "num_tokens": 160368384.0, + "step": 47060 + }, + { + "epoch": 0.47241960737082983, + "learning_rate": 0.00010551808583243006, + "loss": 0.6982, + "mean_token_accuracy": 0.7913429319858551, + "num_tokens": 160404066.0, + "step": 47070 + }, + { + "epoch": 0.4725199727006303, + "learning_rate": 0.00010549801276646995, + "loss": 0.6821, + "mean_token_accuracy": 0.7913277566432952, + "num_tokens": 160439108.0, + "step": 47080 + }, + { + "epoch": 0.47262033803043074, + "learning_rate": 0.00010547793970050985, + "loss": 0.7312, + "mean_token_accuracy": 0.7841997802257538, + "num_tokens": 160474451.0, + "step": 47090 + }, + { + "epoch": 0.47272070336023125, + "learning_rate": 0.00010545786663454977, + "loss": 0.6899, + "mean_token_accuracy": 0.7895389914512634, + "num_tokens": 160511167.0, + "step": 47100 + }, + { + "epoch": 0.4728210686900317, + "learning_rate": 0.00010543779356858967, + "loss": 0.685, + "mean_token_accuracy": 0.7937025189399719, + "num_tokens": 160546665.0, + "step": 47110 + }, + { + "epoch": 0.47292143401983217, + "learning_rate": 0.00010541772050262957, + "loss": 0.6752, + "mean_token_accuracy": 0.7924473464488984, + "num_tokens": 160581892.0, + "step": 47120 + }, + { + "epoch": 0.4730217993496327, + "learning_rate": 0.00010539764743666948, + "loss": 0.6958, + "mean_token_accuracy": 0.7883609414100647, + "num_tokens": 160617929.0, + "step": 47130 + }, + { + "epoch": 0.47312216467943313, + "learning_rate": 0.00010537757437070939, + "loss": 0.6845, + "mean_token_accuracy": 0.7942955136299134, + "num_tokens": 160653461.0, + "step": 47140 + }, + { + "epoch": 0.4732225300092336, + "learning_rate": 0.00010535750130474929, + "loss": 0.6831, + "mean_token_accuracy": 0.7937300324440002, + "num_tokens": 160690001.0, + "step": 47150 + }, + { + "epoch": 0.4733228953390341, + "learning_rate": 0.00010533742823878921, + "loss": 0.6631, + "mean_token_accuracy": 0.8001127362251281, + "num_tokens": 160725785.0, + "step": 47160 + }, + { + "epoch": 0.47342326066883456, + "learning_rate": 0.0001053173551728291, + "loss": 0.7243, + "mean_token_accuracy": 0.7867645204067231, + "num_tokens": 160762595.0, + "step": 47170 + }, + { + "epoch": 0.473523625998635, + "learning_rate": 0.000105297282106869, + "loss": 0.6938, + "mean_token_accuracy": 0.7910487055778503, + "num_tokens": 160797614.0, + "step": 47180 + }, + { + "epoch": 0.4736239913284355, + "learning_rate": 0.00010527720904090892, + "loss": 0.6979, + "mean_token_accuracy": 0.7920831203460693, + "num_tokens": 160833634.0, + "step": 47190 + }, + { + "epoch": 0.473724356658236, + "learning_rate": 0.00010525713597494881, + "loss": 0.7532, + "mean_token_accuracy": 0.7816699028015137, + "num_tokens": 160869280.0, + "step": 47200 + }, + { + "epoch": 0.47382472198803643, + "learning_rate": 0.00010523706290898871, + "loss": 0.6871, + "mean_token_accuracy": 0.7951245188713074, + "num_tokens": 160905819.0, + "step": 47210 + }, + { + "epoch": 0.47392508731783695, + "learning_rate": 0.00010521698984302863, + "loss": 0.6751, + "mean_token_accuracy": 0.7951266944408417, + "num_tokens": 160942206.0, + "step": 47220 + }, + { + "epoch": 0.4740254526476374, + "learning_rate": 0.00010519691677706853, + "loss": 0.7116, + "mean_token_accuracy": 0.7847038805484772, + "num_tokens": 160978577.0, + "step": 47230 + }, + { + "epoch": 0.47412581797743786, + "learning_rate": 0.00010517684371110844, + "loss": 0.6958, + "mean_token_accuracy": 0.7886900484561921, + "num_tokens": 161013465.0, + "step": 47240 + }, + { + "epoch": 0.47422618330723837, + "learning_rate": 0.00010515677064514834, + "loss": 0.6786, + "mean_token_accuracy": 0.7906596243381501, + "num_tokens": 161049466.0, + "step": 47250 + }, + { + "epoch": 0.4743265486370388, + "learning_rate": 0.00010513669757918825, + "loss": 0.6674, + "mean_token_accuracy": 0.7982393562793731, + "num_tokens": 161085007.0, + "step": 47260 + }, + { + "epoch": 0.4744269139668393, + "learning_rate": 0.00010511662451322815, + "loss": 0.6767, + "mean_token_accuracy": 0.7966917872428894, + "num_tokens": 161121639.0, + "step": 47270 + }, + { + "epoch": 0.4745272792966398, + "learning_rate": 0.00010509655144726807, + "loss": 0.71, + "mean_token_accuracy": 0.7855958700180053, + "num_tokens": 161158615.0, + "step": 47280 + }, + { + "epoch": 0.47462764462644025, + "learning_rate": 0.00010507647838130796, + "loss": 0.6909, + "mean_token_accuracy": 0.7912957191467285, + "num_tokens": 161194038.0, + "step": 47290 + }, + { + "epoch": 0.4747280099562407, + "learning_rate": 0.00010505640531534786, + "loss": 0.6953, + "mean_token_accuracy": 0.7897424101829529, + "num_tokens": 161229845.0, + "step": 47300 + }, + { + "epoch": 0.4748283752860412, + "learning_rate": 0.00010503633224938778, + "loss": 0.7494, + "mean_token_accuracy": 0.773971438407898, + "num_tokens": 161266003.0, + "step": 47310 + }, + { + "epoch": 0.47492874061584167, + "learning_rate": 0.00010501625918342768, + "loss": 0.7151, + "mean_token_accuracy": 0.7860597670078278, + "num_tokens": 161301194.0, + "step": 47320 + }, + { + "epoch": 0.4750291059456421, + "learning_rate": 0.00010499618611746757, + "loss": 0.6298, + "mean_token_accuracy": 0.8060030400753021, + "num_tokens": 161337294.0, + "step": 47330 + }, + { + "epoch": 0.47512947127544264, + "learning_rate": 0.00010497611305150749, + "loss": 0.6808, + "mean_token_accuracy": 0.7956064879894257, + "num_tokens": 161373107.0, + "step": 47340 + }, + { + "epoch": 0.4752298366052431, + "learning_rate": 0.0001049560399855474, + "loss": 0.7048, + "mean_token_accuracy": 0.7940467596054077, + "num_tokens": 161408814.0, + "step": 47350 + }, + { + "epoch": 0.47533020193504355, + "learning_rate": 0.0001049359669195873, + "loss": 0.7486, + "mean_token_accuracy": 0.7760293006896972, + "num_tokens": 161443917.0, + "step": 47360 + }, + { + "epoch": 0.475430567264844, + "learning_rate": 0.00010491589385362722, + "loss": 0.7265, + "mean_token_accuracy": 0.7832448840141296, + "num_tokens": 161479605.0, + "step": 47370 + }, + { + "epoch": 0.4755309325946445, + "learning_rate": 0.00010489582078766711, + "loss": 0.7102, + "mean_token_accuracy": 0.7841754913330078, + "num_tokens": 161515285.0, + "step": 47380 + }, + { + "epoch": 0.475631297924445, + "learning_rate": 0.00010487574772170703, + "loss": 0.6772, + "mean_token_accuracy": 0.7950868487358094, + "num_tokens": 161550831.0, + "step": 47390 + }, + { + "epoch": 0.47573166325424543, + "learning_rate": 0.00010485567465574693, + "loss": 0.7081, + "mean_token_accuracy": 0.7866260468959808, + "num_tokens": 161586881.0, + "step": 47400 + }, + { + "epoch": 0.47583202858404594, + "learning_rate": 0.00010483560158978682, + "loss": 0.6949, + "mean_token_accuracy": 0.7889688670635223, + "num_tokens": 161622634.0, + "step": 47410 + }, + { + "epoch": 0.4759323939138464, + "learning_rate": 0.00010481552852382675, + "loss": 0.7066, + "mean_token_accuracy": 0.7932239294052124, + "num_tokens": 161659136.0, + "step": 47420 + }, + { + "epoch": 0.47603275924364685, + "learning_rate": 0.00010479545545786664, + "loss": 0.7152, + "mean_token_accuracy": 0.7909041404724121, + "num_tokens": 161694868.0, + "step": 47430 + }, + { + "epoch": 0.47613312457344736, + "learning_rate": 0.00010477538239190654, + "loss": 0.712, + "mean_token_accuracy": 0.7855082929134369, + "num_tokens": 161730614.0, + "step": 47440 + }, + { + "epoch": 0.4762334899032478, + "learning_rate": 0.00010475530932594646, + "loss": 0.6949, + "mean_token_accuracy": 0.7938051342964172, + "num_tokens": 161767012.0, + "step": 47450 + }, + { + "epoch": 0.4763338552330483, + "learning_rate": 0.00010473523625998635, + "loss": 0.6633, + "mean_token_accuracy": 0.796594899892807, + "num_tokens": 161803108.0, + "step": 47460 + }, + { + "epoch": 0.4764342205628488, + "learning_rate": 0.00010471516319402626, + "loss": 0.7105, + "mean_token_accuracy": 0.782571405172348, + "num_tokens": 161838645.0, + "step": 47470 + }, + { + "epoch": 0.47653458589264924, + "learning_rate": 0.00010469509012806617, + "loss": 0.7094, + "mean_token_accuracy": 0.7875165998935699, + "num_tokens": 161874286.0, + "step": 47480 + }, + { + "epoch": 0.4766349512224497, + "learning_rate": 0.00010467501706210608, + "loss": 0.7128, + "mean_token_accuracy": 0.7863965630531311, + "num_tokens": 161909907.0, + "step": 47490 + }, + { + "epoch": 0.4767353165522502, + "learning_rate": 0.00010465494399614597, + "loss": 0.7182, + "mean_token_accuracy": 0.7878428757190704, + "num_tokens": 161944935.0, + "step": 47500 + }, + { + "epoch": 0.47683568188205067, + "learning_rate": 0.0001046348709301859, + "loss": 0.6971, + "mean_token_accuracy": 0.794540810585022, + "num_tokens": 161981262.0, + "step": 47510 + }, + { + "epoch": 0.4769360472118511, + "learning_rate": 0.00010461479786422579, + "loss": 0.708, + "mean_token_accuracy": 0.7874243080615997, + "num_tokens": 162016280.0, + "step": 47520 + }, + { + "epoch": 0.47703641254165163, + "learning_rate": 0.00010459472479826568, + "loss": 0.6525, + "mean_token_accuracy": 0.8007276117801666, + "num_tokens": 162051253.0, + "step": 47530 + }, + { + "epoch": 0.4771367778714521, + "learning_rate": 0.00010457465173230561, + "loss": 0.7023, + "mean_token_accuracy": 0.7896904945373535, + "num_tokens": 162087552.0, + "step": 47540 + }, + { + "epoch": 0.47723714320125254, + "learning_rate": 0.0001045545786663455, + "loss": 0.6924, + "mean_token_accuracy": 0.7869489848613739, + "num_tokens": 162122832.0, + "step": 47550 + }, + { + "epoch": 0.47733750853105306, + "learning_rate": 0.0001045345056003854, + "loss": 0.6936, + "mean_token_accuracy": 0.7942219018936157, + "num_tokens": 162158731.0, + "step": 47560 + }, + { + "epoch": 0.4774378738608535, + "learning_rate": 0.00010451443253442532, + "loss": 0.6841, + "mean_token_accuracy": 0.7955293655395508, + "num_tokens": 162194422.0, + "step": 47570 + }, + { + "epoch": 0.47753823919065397, + "learning_rate": 0.00010449435946846521, + "loss": 0.7177, + "mean_token_accuracy": 0.7842896938323974, + "num_tokens": 162230673.0, + "step": 47580 + }, + { + "epoch": 0.4776386045204545, + "learning_rate": 0.00010447428640250512, + "loss": 0.7382, + "mean_token_accuracy": 0.7757864713668823, + "num_tokens": 162266350.0, + "step": 47590 + }, + { + "epoch": 0.47773896985025494, + "learning_rate": 0.00010445421333654503, + "loss": 0.7236, + "mean_token_accuracy": 0.7828563153743744, + "num_tokens": 162301576.0, + "step": 47600 + }, + { + "epoch": 0.4778393351800554, + "learning_rate": 0.00010443414027058494, + "loss": 0.6793, + "mean_token_accuracy": 0.7924531519412994, + "num_tokens": 162337268.0, + "step": 47610 + }, + { + "epoch": 0.4779397005098559, + "learning_rate": 0.00010441406720462483, + "loss": 0.6919, + "mean_token_accuracy": 0.7864301800727844, + "num_tokens": 162372409.0, + "step": 47620 + }, + { + "epoch": 0.47804006583965636, + "learning_rate": 0.00010439399413866476, + "loss": 0.674, + "mean_token_accuracy": 0.7930449903011322, + "num_tokens": 162408319.0, + "step": 47630 + }, + { + "epoch": 0.4781404311694568, + "learning_rate": 0.00010437392107270465, + "loss": 0.6903, + "mean_token_accuracy": 0.79172642827034, + "num_tokens": 162444898.0, + "step": 47640 + }, + { + "epoch": 0.47824079649925727, + "learning_rate": 0.00010435384800674455, + "loss": 0.6861, + "mean_token_accuracy": 0.7925096869468689, + "num_tokens": 162480532.0, + "step": 47650 + }, + { + "epoch": 0.4783411618290578, + "learning_rate": 0.00010433377494078447, + "loss": 0.687, + "mean_token_accuracy": 0.7912269413471222, + "num_tokens": 162516434.0, + "step": 47660 + }, + { + "epoch": 0.47844152715885824, + "learning_rate": 0.00010431370187482436, + "loss": 0.7054, + "mean_token_accuracy": 0.7908867537975312, + "num_tokens": 162552621.0, + "step": 47670 + }, + { + "epoch": 0.4785418924886587, + "learning_rate": 0.00010429362880886426, + "loss": 0.6796, + "mean_token_accuracy": 0.7933435320854187, + "num_tokens": 162588410.0, + "step": 47680 + }, + { + "epoch": 0.4786422578184592, + "learning_rate": 0.00010427355574290418, + "loss": 0.6498, + "mean_token_accuracy": 0.8042173683643341, + "num_tokens": 162625530.0, + "step": 47690 + }, + { + "epoch": 0.47874262314825966, + "learning_rate": 0.00010425348267694407, + "loss": 0.6755, + "mean_token_accuracy": 0.7967062354087829, + "num_tokens": 162661367.0, + "step": 47700 + }, + { + "epoch": 0.4788429884780601, + "learning_rate": 0.00010423340961098398, + "loss": 0.7098, + "mean_token_accuracy": 0.7858090043067932, + "num_tokens": 162696852.0, + "step": 47710 + }, + { + "epoch": 0.47894335380786063, + "learning_rate": 0.0001042133365450239, + "loss": 0.6726, + "mean_token_accuracy": 0.7962167382240295, + "num_tokens": 162732782.0, + "step": 47720 + }, + { + "epoch": 0.4790437191376611, + "learning_rate": 0.0001041932634790638, + "loss": 0.6759, + "mean_token_accuracy": 0.7944247961044312, + "num_tokens": 162768668.0, + "step": 47730 + }, + { + "epoch": 0.47914408446746154, + "learning_rate": 0.0001041731904131037, + "loss": 0.7139, + "mean_token_accuracy": 0.785028612613678, + "num_tokens": 162803623.0, + "step": 47740 + }, + { + "epoch": 0.47924444979726205, + "learning_rate": 0.00010415311734714362, + "loss": 0.6542, + "mean_token_accuracy": 0.800380527973175, + "num_tokens": 162839575.0, + "step": 47750 + }, + { + "epoch": 0.4793448151270625, + "learning_rate": 0.00010413304428118351, + "loss": 0.6459, + "mean_token_accuracy": 0.7978033125400543, + "num_tokens": 162876112.0, + "step": 47760 + }, + { + "epoch": 0.47944518045686296, + "learning_rate": 0.0001041129712152234, + "loss": 0.7162, + "mean_token_accuracy": 0.7856225728988647, + "num_tokens": 162911288.0, + "step": 47770 + }, + { + "epoch": 0.4795455457866635, + "learning_rate": 0.00010409289814926333, + "loss": 0.6821, + "mean_token_accuracy": 0.7910649538040161, + "num_tokens": 162946297.0, + "step": 47780 + }, + { + "epoch": 0.47964591111646393, + "learning_rate": 0.00010407282508330322, + "loss": 0.72, + "mean_token_accuracy": 0.7854718923568725, + "num_tokens": 162981256.0, + "step": 47790 + }, + { + "epoch": 0.4797462764462644, + "learning_rate": 0.00010405275201734313, + "loss": 0.6887, + "mean_token_accuracy": 0.7937243342399597, + "num_tokens": 163016659.0, + "step": 47800 + }, + { + "epoch": 0.4798466417760649, + "learning_rate": 0.00010403267895138304, + "loss": 0.6769, + "mean_token_accuracy": 0.7947654485702514, + "num_tokens": 163052921.0, + "step": 47810 + }, + { + "epoch": 0.47994700710586535, + "learning_rate": 0.00010401260588542295, + "loss": 0.6673, + "mean_token_accuracy": 0.799593985080719, + "num_tokens": 163089902.0, + "step": 47820 + }, + { + "epoch": 0.4800473724356658, + "learning_rate": 0.00010399253281946284, + "loss": 0.684, + "mean_token_accuracy": 0.7932468891143799, + "num_tokens": 163125318.0, + "step": 47830 + }, + { + "epoch": 0.4801477377654663, + "learning_rate": 0.00010397245975350277, + "loss": 0.742, + "mean_token_accuracy": 0.7809097528457641, + "num_tokens": 163160809.0, + "step": 47840 + }, + { + "epoch": 0.4802481030952668, + "learning_rate": 0.00010395238668754266, + "loss": 0.6726, + "mean_token_accuracy": 0.7962616145610809, + "num_tokens": 163195946.0, + "step": 47850 + }, + { + "epoch": 0.48034846842506723, + "learning_rate": 0.00010393231362158255, + "loss": 0.6883, + "mean_token_accuracy": 0.7961674690246582, + "num_tokens": 163231686.0, + "step": 47860 + }, + { + "epoch": 0.48044883375486774, + "learning_rate": 0.00010391224055562248, + "loss": 0.6822, + "mean_token_accuracy": 0.7897140741348266, + "num_tokens": 163268030.0, + "step": 47870 + }, + { + "epoch": 0.4805491990846682, + "learning_rate": 0.00010389216748966237, + "loss": 0.692, + "mean_token_accuracy": 0.7926612317562103, + "num_tokens": 163303833.0, + "step": 47880 + }, + { + "epoch": 0.48064956441446866, + "learning_rate": 0.00010387209442370227, + "loss": 0.7397, + "mean_token_accuracy": 0.7783870279788971, + "num_tokens": 163338956.0, + "step": 47890 + }, + { + "epoch": 0.48074992974426917, + "learning_rate": 0.00010385202135774219, + "loss": 0.6783, + "mean_token_accuracy": 0.7934011518955231, + "num_tokens": 163375923.0, + "step": 47900 + }, + { + "epoch": 0.4808502950740696, + "learning_rate": 0.00010383194829178208, + "loss": 0.6754, + "mean_token_accuracy": 0.7942137479782104, + "num_tokens": 163410955.0, + "step": 47910 + }, + { + "epoch": 0.4809506604038701, + "learning_rate": 0.00010381187522582199, + "loss": 0.6776, + "mean_token_accuracy": 0.7968982100486756, + "num_tokens": 163445528.0, + "step": 47920 + }, + { + "epoch": 0.48105102573367053, + "learning_rate": 0.0001037918021598619, + "loss": 0.6751, + "mean_token_accuracy": 0.7926284074783325, + "num_tokens": 163481903.0, + "step": 47930 + }, + { + "epoch": 0.48115139106347105, + "learning_rate": 0.00010377172909390181, + "loss": 0.6576, + "mean_token_accuracy": 0.7997497975826263, + "num_tokens": 163518436.0, + "step": 47940 + }, + { + "epoch": 0.4812517563932715, + "learning_rate": 0.00010375165602794172, + "loss": 0.7369, + "mean_token_accuracy": 0.7813829720020294, + "num_tokens": 163554326.0, + "step": 47950 + }, + { + "epoch": 0.48135212172307196, + "learning_rate": 0.00010373158296198163, + "loss": 0.7072, + "mean_token_accuracy": 0.7888287842273712, + "num_tokens": 163590652.0, + "step": 47960 + }, + { + "epoch": 0.48145248705287247, + "learning_rate": 0.00010371150989602152, + "loss": 0.6511, + "mean_token_accuracy": 0.7944359362125397, + "num_tokens": 163626494.0, + "step": 47970 + }, + { + "epoch": 0.4815528523826729, + "learning_rate": 0.00010369143683006144, + "loss": 0.6718, + "mean_token_accuracy": 0.7970012128353119, + "num_tokens": 163661563.0, + "step": 47980 + }, + { + "epoch": 0.4816532177124734, + "learning_rate": 0.00010367136376410134, + "loss": 0.6784, + "mean_token_accuracy": 0.7969679594039917, + "num_tokens": 163697040.0, + "step": 47990 + }, + { + "epoch": 0.4817535830422739, + "learning_rate": 0.00010365129069814123, + "loss": 0.681, + "mean_token_accuracy": 0.7943235516548157, + "num_tokens": 163732537.0, + "step": 48000 + }, + { + "epoch": 0.48185394837207435, + "learning_rate": 0.00010363121763218115, + "loss": 0.6951, + "mean_token_accuracy": 0.7890613734722137, + "num_tokens": 163768361.0, + "step": 48010 + }, + { + "epoch": 0.4819543137018748, + "learning_rate": 0.00010361114456622105, + "loss": 0.7016, + "mean_token_accuracy": 0.7916137874126434, + "num_tokens": 163803475.0, + "step": 48020 + }, + { + "epoch": 0.4820546790316753, + "learning_rate": 0.00010359107150026094, + "loss": 0.6598, + "mean_token_accuracy": 0.8004237949848175, + "num_tokens": 163839338.0, + "step": 48030 + }, + { + "epoch": 0.48215504436147577, + "learning_rate": 0.00010357099843430087, + "loss": 0.6912, + "mean_token_accuracy": 0.7930728733539582, + "num_tokens": 163874577.0, + "step": 48040 + }, + { + "epoch": 0.4822554096912762, + "learning_rate": 0.00010355092536834076, + "loss": 0.7043, + "mean_token_accuracy": 0.789654529094696, + "num_tokens": 163910646.0, + "step": 48050 + }, + { + "epoch": 0.48235577502107674, + "learning_rate": 0.00010353085230238067, + "loss": 0.6644, + "mean_token_accuracy": 0.7975339889526367, + "num_tokens": 163946744.0, + "step": 48060 + }, + { + "epoch": 0.4824561403508772, + "learning_rate": 0.00010351077923642059, + "loss": 0.6915, + "mean_token_accuracy": 0.789144366979599, + "num_tokens": 163982922.0, + "step": 48070 + }, + { + "epoch": 0.48255650568067765, + "learning_rate": 0.00010349070617046049, + "loss": 0.6586, + "mean_token_accuracy": 0.8003958880901336, + "num_tokens": 164018490.0, + "step": 48080 + }, + { + "epoch": 0.48265687101047816, + "learning_rate": 0.00010347063310450038, + "loss": 0.6936, + "mean_token_accuracy": 0.7923797130584717, + "num_tokens": 164053312.0, + "step": 48090 + }, + { + "epoch": 0.4827572363402786, + "learning_rate": 0.0001034505600385403, + "loss": 0.7184, + "mean_token_accuracy": 0.7866088509559631, + "num_tokens": 164088516.0, + "step": 48100 + }, + { + "epoch": 0.4828576016700791, + "learning_rate": 0.0001034304869725802, + "loss": 0.6624, + "mean_token_accuracy": 0.7987448096275329, + "num_tokens": 164125498.0, + "step": 48110 + }, + { + "epoch": 0.4829579669998796, + "learning_rate": 0.00010341041390662009, + "loss": 0.6403, + "mean_token_accuracy": 0.804091477394104, + "num_tokens": 164161279.0, + "step": 48120 + }, + { + "epoch": 0.48305833232968004, + "learning_rate": 0.00010339034084066001, + "loss": 0.727, + "mean_token_accuracy": 0.781208735704422, + "num_tokens": 164196114.0, + "step": 48130 + }, + { + "epoch": 0.4831586976594805, + "learning_rate": 0.00010337026777469991, + "loss": 0.722, + "mean_token_accuracy": 0.7808577239513397, + "num_tokens": 164231733.0, + "step": 48140 + }, + { + "epoch": 0.483259062989281, + "learning_rate": 0.00010335019470873982, + "loss": 0.673, + "mean_token_accuracy": 0.7946267187595367, + "num_tokens": 164267460.0, + "step": 48150 + }, + { + "epoch": 0.48335942831908146, + "learning_rate": 0.00010333012164277973, + "loss": 0.679, + "mean_token_accuracy": 0.795447838306427, + "num_tokens": 164302051.0, + "step": 48160 + }, + { + "epoch": 0.4834597936488819, + "learning_rate": 0.00010331004857681964, + "loss": 0.6521, + "mean_token_accuracy": 0.7975180566310882, + "num_tokens": 164337925.0, + "step": 48170 + }, + { + "epoch": 0.48356015897868243, + "learning_rate": 0.00010328997551085953, + "loss": 0.6621, + "mean_token_accuracy": 0.8010074675083161, + "num_tokens": 164373647.0, + "step": 48180 + }, + { + "epoch": 0.4836605243084829, + "learning_rate": 0.00010326990244489945, + "loss": 0.6718, + "mean_token_accuracy": 0.7939490079879761, + "num_tokens": 164409199.0, + "step": 48190 + }, + { + "epoch": 0.48376088963828334, + "learning_rate": 0.00010324982937893935, + "loss": 0.6579, + "mean_token_accuracy": 0.7961607813835144, + "num_tokens": 164445741.0, + "step": 48200 + }, + { + "epoch": 0.4838612549680838, + "learning_rate": 0.00010322975631297924, + "loss": 0.6565, + "mean_token_accuracy": 0.7984263598918915, + "num_tokens": 164482421.0, + "step": 48210 + }, + { + "epoch": 0.4839616202978843, + "learning_rate": 0.00010320968324701916, + "loss": 0.6909, + "mean_token_accuracy": 0.7874985694885254, + "num_tokens": 164517951.0, + "step": 48220 + }, + { + "epoch": 0.48406198562768477, + "learning_rate": 0.00010318961018105906, + "loss": 0.6705, + "mean_token_accuracy": 0.797230851650238, + "num_tokens": 164554573.0, + "step": 48230 + }, + { + "epoch": 0.4841623509574852, + "learning_rate": 0.00010316953711509895, + "loss": 0.6821, + "mean_token_accuracy": 0.795600700378418, + "num_tokens": 164590873.0, + "step": 48240 + }, + { + "epoch": 0.48426271628728573, + "learning_rate": 0.00010314946404913888, + "loss": 0.7072, + "mean_token_accuracy": 0.7906558811664581, + "num_tokens": 164627073.0, + "step": 48250 + }, + { + "epoch": 0.4843630816170862, + "learning_rate": 0.00010312939098317877, + "loss": 0.6872, + "mean_token_accuracy": 0.7920962035655975, + "num_tokens": 164662493.0, + "step": 48260 + }, + { + "epoch": 0.48446344694688664, + "learning_rate": 0.00010310931791721868, + "loss": 0.6774, + "mean_token_accuracy": 0.7944299578666687, + "num_tokens": 164698299.0, + "step": 48270 + }, + { + "epoch": 0.48456381227668716, + "learning_rate": 0.00010308924485125859, + "loss": 0.7223, + "mean_token_accuracy": 0.7846730351448059, + "num_tokens": 164734390.0, + "step": 48280 + }, + { + "epoch": 0.4846641776064876, + "learning_rate": 0.0001030691717852985, + "loss": 0.6414, + "mean_token_accuracy": 0.8061159372329711, + "num_tokens": 164770787.0, + "step": 48290 + }, + { + "epoch": 0.48476454293628807, + "learning_rate": 0.00010304909871933839, + "loss": 0.664, + "mean_token_accuracy": 0.7991957008838654, + "num_tokens": 164806877.0, + "step": 48300 + }, + { + "epoch": 0.4848649082660886, + "learning_rate": 0.00010302902565337831, + "loss": 0.6992, + "mean_token_accuracy": 0.7914974689483643, + "num_tokens": 164842674.0, + "step": 48310 + }, + { + "epoch": 0.48496527359588903, + "learning_rate": 0.00010300895258741821, + "loss": 0.6354, + "mean_token_accuracy": 0.806444126367569, + "num_tokens": 164878725.0, + "step": 48320 + }, + { + "epoch": 0.4850656389256895, + "learning_rate": 0.0001029888795214581, + "loss": 0.7072, + "mean_token_accuracy": 0.7881014108657837, + "num_tokens": 164914354.0, + "step": 48330 + }, + { + "epoch": 0.48516600425549, + "learning_rate": 0.00010296880645549802, + "loss": 0.6931, + "mean_token_accuracy": 0.7914582073688508, + "num_tokens": 164951175.0, + "step": 48340 + }, + { + "epoch": 0.48526636958529046, + "learning_rate": 0.00010294873338953792, + "loss": 0.6771, + "mean_token_accuracy": 0.7916079461574554, + "num_tokens": 164988217.0, + "step": 48350 + }, + { + "epoch": 0.4853667349150909, + "learning_rate": 0.00010292866032357781, + "loss": 0.6617, + "mean_token_accuracy": 0.7961135387420655, + "num_tokens": 165023908.0, + "step": 48360 + }, + { + "epoch": 0.4854671002448914, + "learning_rate": 0.00010290858725761774, + "loss": 0.6929, + "mean_token_accuracy": 0.7928700387477875, + "num_tokens": 165059954.0, + "step": 48370 + }, + { + "epoch": 0.4855674655746919, + "learning_rate": 0.00010288851419165763, + "loss": 0.6912, + "mean_token_accuracy": 0.7901743710041046, + "num_tokens": 165096806.0, + "step": 48380 + }, + { + "epoch": 0.48566783090449234, + "learning_rate": 0.00010286844112569754, + "loss": 0.694, + "mean_token_accuracy": 0.7921668708324432, + "num_tokens": 165132310.0, + "step": 48390 + }, + { + "epoch": 0.48576819623429285, + "learning_rate": 0.00010284836805973745, + "loss": 0.6701, + "mean_token_accuracy": 0.7965425670146942, + "num_tokens": 165168260.0, + "step": 48400 + }, + { + "epoch": 0.4858685615640933, + "learning_rate": 0.00010282829499377736, + "loss": 0.6903, + "mean_token_accuracy": 0.793122661113739, + "num_tokens": 165204508.0, + "step": 48410 + }, + { + "epoch": 0.48596892689389376, + "learning_rate": 0.00010280822192781725, + "loss": 0.6573, + "mean_token_accuracy": 0.800396591424942, + "num_tokens": 165240999.0, + "step": 48420 + }, + { + "epoch": 0.48606929222369427, + "learning_rate": 0.00010278814886185717, + "loss": 0.6445, + "mean_token_accuracy": 0.800655859708786, + "num_tokens": 165277706.0, + "step": 48430 + }, + { + "epoch": 0.4861696575534947, + "learning_rate": 0.00010276807579589707, + "loss": 0.6958, + "mean_token_accuracy": 0.7916760146617889, + "num_tokens": 165312787.0, + "step": 48440 + }, + { + "epoch": 0.4862700228832952, + "learning_rate": 0.00010274800272993696, + "loss": 0.6804, + "mean_token_accuracy": 0.7930470466613769, + "num_tokens": 165348317.0, + "step": 48450 + }, + { + "epoch": 0.4863703882130957, + "learning_rate": 0.00010272792966397688, + "loss": 0.6506, + "mean_token_accuracy": 0.8018568575382232, + "num_tokens": 165385040.0, + "step": 48460 + }, + { + "epoch": 0.48647075354289615, + "learning_rate": 0.00010270785659801678, + "loss": 0.6931, + "mean_token_accuracy": 0.783112621307373, + "num_tokens": 165421786.0, + "step": 48470 + }, + { + "epoch": 0.4865711188726966, + "learning_rate": 0.00010268778353205667, + "loss": 0.6831, + "mean_token_accuracy": 0.7922792792320251, + "num_tokens": 165457647.0, + "step": 48480 + }, + { + "epoch": 0.48667148420249706, + "learning_rate": 0.0001026677104660966, + "loss": 0.6987, + "mean_token_accuracy": 0.7867967963218689, + "num_tokens": 165493599.0, + "step": 48490 + }, + { + "epoch": 0.4867718495322976, + "learning_rate": 0.00010264763740013649, + "loss": 0.6617, + "mean_token_accuracy": 0.7973835945129395, + "num_tokens": 165529231.0, + "step": 48500 + }, + { + "epoch": 0.48687221486209803, + "learning_rate": 0.0001026275643341764, + "loss": 0.6587, + "mean_token_accuracy": 0.7987306237220764, + "num_tokens": 165566117.0, + "step": 48510 + }, + { + "epoch": 0.4869725801918985, + "learning_rate": 0.00010260749126821632, + "loss": 0.6776, + "mean_token_accuracy": 0.7935501039028168, + "num_tokens": 165602360.0, + "step": 48520 + }, + { + "epoch": 0.487072945521699, + "learning_rate": 0.00010258741820225622, + "loss": 0.6813, + "mean_token_accuracy": 0.7961971998214722, + "num_tokens": 165639131.0, + "step": 48530 + }, + { + "epoch": 0.48717331085149945, + "learning_rate": 0.00010256734513629614, + "loss": 0.6497, + "mean_token_accuracy": 0.8006950974464416, + "num_tokens": 165676654.0, + "step": 48540 + }, + { + "epoch": 0.4872736761812999, + "learning_rate": 0.00010254727207033603, + "loss": 0.6629, + "mean_token_accuracy": 0.7984619259834289, + "num_tokens": 165713192.0, + "step": 48550 + }, + { + "epoch": 0.4873740415111004, + "learning_rate": 0.00010252719900437593, + "loss": 0.647, + "mean_token_accuracy": 0.8039807558059693, + "num_tokens": 165749737.0, + "step": 48560 + }, + { + "epoch": 0.4874744068409009, + "learning_rate": 0.00010250712593841585, + "loss": 0.6746, + "mean_token_accuracy": 0.7973509192466736, + "num_tokens": 165785171.0, + "step": 48570 + }, + { + "epoch": 0.48757477217070133, + "learning_rate": 0.00010248705287245575, + "loss": 0.6998, + "mean_token_accuracy": 0.7900561451911926, + "num_tokens": 165821362.0, + "step": 48580 + }, + { + "epoch": 0.48767513750050184, + "learning_rate": 0.00010246697980649564, + "loss": 0.6383, + "mean_token_accuracy": 0.8029297113418579, + "num_tokens": 165858520.0, + "step": 48590 + }, + { + "epoch": 0.4877755028303023, + "learning_rate": 0.00010244690674053556, + "loss": 0.6647, + "mean_token_accuracy": 0.7972795307636261, + "num_tokens": 165895360.0, + "step": 48600 + }, + { + "epoch": 0.48787586816010275, + "learning_rate": 0.00010242683367457546, + "loss": 0.6649, + "mean_token_accuracy": 0.7969582557678223, + "num_tokens": 165932580.0, + "step": 48610 + }, + { + "epoch": 0.48797623348990327, + "learning_rate": 0.00010240676060861537, + "loss": 0.6778, + "mean_token_accuracy": 0.7921225070953369, + "num_tokens": 165968971.0, + "step": 48620 + }, + { + "epoch": 0.4880765988197037, + "learning_rate": 0.00010238668754265527, + "loss": 0.6896, + "mean_token_accuracy": 0.7959330201148986, + "num_tokens": 166004902.0, + "step": 48630 + }, + { + "epoch": 0.4881769641495042, + "learning_rate": 0.00010236661447669518, + "loss": 0.692, + "mean_token_accuracy": 0.7915273070335388, + "num_tokens": 166040884.0, + "step": 48640 + }, + { + "epoch": 0.4882773294793047, + "learning_rate": 0.00010234654141073508, + "loss": 0.6529, + "mean_token_accuracy": 0.8000566363334656, + "num_tokens": 166077731.0, + "step": 48650 + }, + { + "epoch": 0.48837769480910515, + "learning_rate": 0.000102326468344775, + "loss": 0.6744, + "mean_token_accuracy": 0.7959813833236694, + "num_tokens": 166114314.0, + "step": 48660 + }, + { + "epoch": 0.4884780601389056, + "learning_rate": 0.0001023063952788149, + "loss": 0.6817, + "mean_token_accuracy": 0.7944016873836517, + "num_tokens": 166149915.0, + "step": 48670 + }, + { + "epoch": 0.4885784254687061, + "learning_rate": 0.00010228632221285479, + "loss": 0.6778, + "mean_token_accuracy": 0.7906705737113953, + "num_tokens": 166184851.0, + "step": 48680 + }, + { + "epoch": 0.48867879079850657, + "learning_rate": 0.00010226624914689471, + "loss": 0.7067, + "mean_token_accuracy": 0.7922101736068725, + "num_tokens": 166220345.0, + "step": 48690 + }, + { + "epoch": 0.488779156128307, + "learning_rate": 0.0001022461760809346, + "loss": 0.662, + "mean_token_accuracy": 0.8018300950527191, + "num_tokens": 166256077.0, + "step": 48700 + }, + { + "epoch": 0.48887952145810754, + "learning_rate": 0.0001022261030149745, + "loss": 0.6916, + "mean_token_accuracy": 0.7912471473217011, + "num_tokens": 166292475.0, + "step": 48710 + }, + { + "epoch": 0.488979886787908, + "learning_rate": 0.00010220602994901442, + "loss": 0.6423, + "mean_token_accuracy": 0.7997991442680359, + "num_tokens": 166329031.0, + "step": 48720 + }, + { + "epoch": 0.48908025211770845, + "learning_rate": 0.00010218595688305432, + "loss": 0.6528, + "mean_token_accuracy": 0.7999334573745728, + "num_tokens": 166363954.0, + "step": 48730 + }, + { + "epoch": 0.48918061744750896, + "learning_rate": 0.00010216588381709423, + "loss": 0.674, + "mean_token_accuracy": 0.7921888053417205, + "num_tokens": 166400684.0, + "step": 48740 + }, + { + "epoch": 0.4892809827773094, + "learning_rate": 0.00010214581075113413, + "loss": 0.666, + "mean_token_accuracy": 0.7992009162902832, + "num_tokens": 166436290.0, + "step": 48750 + }, + { + "epoch": 0.48938134810710987, + "learning_rate": 0.00010212573768517404, + "loss": 0.6451, + "mean_token_accuracy": 0.8084811270236969, + "num_tokens": 166472149.0, + "step": 48760 + }, + { + "epoch": 0.4894817134369103, + "learning_rate": 0.00010210566461921394, + "loss": 0.6563, + "mean_token_accuracy": 0.8018660724163056, + "num_tokens": 166508884.0, + "step": 48770 + }, + { + "epoch": 0.48958207876671084, + "learning_rate": 0.00010208559155325386, + "loss": 0.6501, + "mean_token_accuracy": 0.8009030163288117, + "num_tokens": 166545244.0, + "step": 48780 + }, + { + "epoch": 0.4896824440965113, + "learning_rate": 0.00010206551848729375, + "loss": 0.678, + "mean_token_accuracy": 0.7926466882228851, + "num_tokens": 166581823.0, + "step": 48790 + }, + { + "epoch": 0.48978280942631175, + "learning_rate": 0.00010204544542133365, + "loss": 0.6618, + "mean_token_accuracy": 0.8020177721977234, + "num_tokens": 166618826.0, + "step": 48800 + }, + { + "epoch": 0.48988317475611226, + "learning_rate": 0.00010202537235537357, + "loss": 0.6815, + "mean_token_accuracy": 0.7936260044574738, + "num_tokens": 166654734.0, + "step": 48810 + }, + { + "epoch": 0.4899835400859127, + "learning_rate": 0.00010200529928941347, + "loss": 0.6418, + "mean_token_accuracy": 0.8066985130310058, + "num_tokens": 166691645.0, + "step": 48820 + }, + { + "epoch": 0.4900839054157132, + "learning_rate": 0.00010198522622345336, + "loss": 0.6597, + "mean_token_accuracy": 0.7996945679187775, + "num_tokens": 166727650.0, + "step": 48830 + }, + { + "epoch": 0.4901842707455137, + "learning_rate": 0.00010196515315749328, + "loss": 0.6809, + "mean_token_accuracy": 0.792582529783249, + "num_tokens": 166763886.0, + "step": 48840 + }, + { + "epoch": 0.49028463607531414, + "learning_rate": 0.00010194508009153318, + "loss": 0.7033, + "mean_token_accuracy": 0.786809754371643, + "num_tokens": 166799672.0, + "step": 48850 + }, + { + "epoch": 0.4903850014051146, + "learning_rate": 0.00010192500702557309, + "loss": 0.6783, + "mean_token_accuracy": 0.7955593287944793, + "num_tokens": 166834849.0, + "step": 48860 + }, + { + "epoch": 0.4904853667349151, + "learning_rate": 0.00010190493395961301, + "loss": 0.647, + "mean_token_accuracy": 0.8022721767425537, + "num_tokens": 166870259.0, + "step": 48870 + }, + { + "epoch": 0.49058573206471556, + "learning_rate": 0.0001018848608936529, + "loss": 0.6751, + "mean_token_accuracy": 0.8003849744796753, + "num_tokens": 166906060.0, + "step": 48880 + }, + { + "epoch": 0.490686097394516, + "learning_rate": 0.0001018647878276928, + "loss": 0.6758, + "mean_token_accuracy": 0.7969516217708588, + "num_tokens": 166942371.0, + "step": 48890 + }, + { + "epoch": 0.49078646272431653, + "learning_rate": 0.00010184471476173272, + "loss": 0.6725, + "mean_token_accuracy": 0.7958665549755096, + "num_tokens": 166978893.0, + "step": 48900 + }, + { + "epoch": 0.490886828054117, + "learning_rate": 0.00010182464169577262, + "loss": 0.6459, + "mean_token_accuracy": 0.8034192264080048, + "num_tokens": 167015286.0, + "step": 48910 + }, + { + "epoch": 0.49098719338391744, + "learning_rate": 0.00010180456862981251, + "loss": 0.648, + "mean_token_accuracy": 0.802105039358139, + "num_tokens": 167051732.0, + "step": 48920 + }, + { + "epoch": 0.49108755871371795, + "learning_rate": 0.00010178449556385243, + "loss": 0.682, + "mean_token_accuracy": 0.7966529786586761, + "num_tokens": 167086827.0, + "step": 48930 + }, + { + "epoch": 0.4911879240435184, + "learning_rate": 0.00010176442249789233, + "loss": 0.6815, + "mean_token_accuracy": 0.7956272065639496, + "num_tokens": 167122570.0, + "step": 48940 + }, + { + "epoch": 0.49128828937331886, + "learning_rate": 0.00010174434943193224, + "loss": 0.6448, + "mean_token_accuracy": 0.8040194809436798, + "num_tokens": 167158267.0, + "step": 48950 + }, + { + "epoch": 0.4913886547031194, + "learning_rate": 0.00010172427636597214, + "loss": 0.6736, + "mean_token_accuracy": 0.791230309009552, + "num_tokens": 167194290.0, + "step": 48960 + }, + { + "epoch": 0.49148902003291983, + "learning_rate": 0.00010170420330001205, + "loss": 0.6891, + "mean_token_accuracy": 0.7936301529407501, + "num_tokens": 167229898.0, + "step": 48970 + }, + { + "epoch": 0.4915893853627203, + "learning_rate": 0.00010168413023405195, + "loss": 0.6653, + "mean_token_accuracy": 0.8004696249961853, + "num_tokens": 167266071.0, + "step": 48980 + }, + { + "epoch": 0.4916897506925208, + "learning_rate": 0.00010166405716809187, + "loss": 0.6598, + "mean_token_accuracy": 0.7968671381473541, + "num_tokens": 167303234.0, + "step": 48990 + }, + { + "epoch": 0.49179011602232126, + "learning_rate": 0.00010164398410213176, + "loss": 0.6603, + "mean_token_accuracy": 0.8036011934280396, + "num_tokens": 167339447.0, + "step": 49000 + }, + { + "epoch": 0.4918904813521217, + "learning_rate": 0.00010162391103617166, + "loss": 0.661, + "mean_token_accuracy": 0.7965591430664063, + "num_tokens": 167375969.0, + "step": 49010 + }, + { + "epoch": 0.4919908466819222, + "learning_rate": 0.00010160383797021158, + "loss": 0.6534, + "mean_token_accuracy": 0.795904415845871, + "num_tokens": 167412465.0, + "step": 49020 + }, + { + "epoch": 0.4920912120117227, + "learning_rate": 0.00010158376490425148, + "loss": 0.6913, + "mean_token_accuracy": 0.7899755477905274, + "num_tokens": 167448800.0, + "step": 49030 + }, + { + "epoch": 0.49219157734152313, + "learning_rate": 0.00010156369183829137, + "loss": 0.658, + "mean_token_accuracy": 0.7980289340019227, + "num_tokens": 167485083.0, + "step": 49040 + }, + { + "epoch": 0.49229194267132365, + "learning_rate": 0.00010154361877233129, + "loss": 0.6702, + "mean_token_accuracy": 0.7956407785415649, + "num_tokens": 167522992.0, + "step": 49050 + }, + { + "epoch": 0.4923923080011241, + "learning_rate": 0.00010152354570637119, + "loss": 0.6795, + "mean_token_accuracy": 0.7919821202754974, + "num_tokens": 167559245.0, + "step": 49060 + }, + { + "epoch": 0.49249267333092456, + "learning_rate": 0.0001015034726404111, + "loss": 0.7002, + "mean_token_accuracy": 0.788819408416748, + "num_tokens": 167596616.0, + "step": 49070 + }, + { + "epoch": 0.492593038660725, + "learning_rate": 0.000101483399574451, + "loss": 0.6537, + "mean_token_accuracy": 0.7997047662734985, + "num_tokens": 167631223.0, + "step": 49080 + }, + { + "epoch": 0.4926934039905255, + "learning_rate": 0.00010146332650849091, + "loss": 0.6921, + "mean_token_accuracy": 0.7928080320358276, + "num_tokens": 167667315.0, + "step": 49090 + }, + { + "epoch": 0.492793769320326, + "learning_rate": 0.00010144325344253082, + "loss": 0.633, + "mean_token_accuracy": 0.8074764609336853, + "num_tokens": 167702728.0, + "step": 49100 + }, + { + "epoch": 0.49289413465012644, + "learning_rate": 0.00010142318037657073, + "loss": 0.6803, + "mean_token_accuracy": 0.7898491978645324, + "num_tokens": 167738498.0, + "step": 49110 + }, + { + "epoch": 0.49299449997992695, + "learning_rate": 0.00010140310731061062, + "loss": 0.667, + "mean_token_accuracy": 0.799743378162384, + "num_tokens": 167774600.0, + "step": 49120 + }, + { + "epoch": 0.4930948653097274, + "learning_rate": 0.00010138303424465055, + "loss": 0.6774, + "mean_token_accuracy": 0.7991834044456482, + "num_tokens": 167810392.0, + "step": 49130 + }, + { + "epoch": 0.49319523063952786, + "learning_rate": 0.00010136296117869044, + "loss": 0.6419, + "mean_token_accuracy": 0.80216743350029, + "num_tokens": 167846423.0, + "step": 49140 + }, + { + "epoch": 0.49329559596932837, + "learning_rate": 0.00010134288811273034, + "loss": 0.6904, + "mean_token_accuracy": 0.7967431306838989, + "num_tokens": 167882764.0, + "step": 49150 + }, + { + "epoch": 0.4933959612991288, + "learning_rate": 0.00010132281504677026, + "loss": 0.6737, + "mean_token_accuracy": 0.7951765596866608, + "num_tokens": 167918193.0, + "step": 49160 + }, + { + "epoch": 0.4934963266289293, + "learning_rate": 0.00010130274198081015, + "loss": 0.6455, + "mean_token_accuracy": 0.8014727294445038, + "num_tokens": 167953522.0, + "step": 49170 + }, + { + "epoch": 0.4935966919587298, + "learning_rate": 0.00010128266891485005, + "loss": 0.6846, + "mean_token_accuracy": 0.7900352478027344, + "num_tokens": 167989788.0, + "step": 49180 + }, + { + "epoch": 0.49369705728853025, + "learning_rate": 0.00010126259584888997, + "loss": 0.653, + "mean_token_accuracy": 0.8036088228225708, + "num_tokens": 168026492.0, + "step": 49190 + }, + { + "epoch": 0.4937974226183307, + "learning_rate": 0.00010124252278292987, + "loss": 0.6212, + "mean_token_accuracy": 0.8075027704238892, + "num_tokens": 168063125.0, + "step": 49200 + }, + { + "epoch": 0.4938977879481312, + "learning_rate": 0.00010122244971696977, + "loss": 0.6641, + "mean_token_accuracy": 0.8012927532196045, + "num_tokens": 168100114.0, + "step": 49210 + }, + { + "epoch": 0.4939981532779317, + "learning_rate": 0.0001012023766510097, + "loss": 0.6206, + "mean_token_accuracy": 0.8106712639331818, + "num_tokens": 168137049.0, + "step": 49220 + }, + { + "epoch": 0.49409851860773213, + "learning_rate": 0.00010118230358504959, + "loss": 0.6676, + "mean_token_accuracy": 0.8016164481639863, + "num_tokens": 168173489.0, + "step": 49230 + }, + { + "epoch": 0.49419888393753264, + "learning_rate": 0.00010116223051908949, + "loss": 0.6707, + "mean_token_accuracy": 0.7990468502044678, + "num_tokens": 168210405.0, + "step": 49240 + }, + { + "epoch": 0.4942992492673331, + "learning_rate": 0.00010114215745312941, + "loss": 0.6819, + "mean_token_accuracy": 0.7885425746440887, + "num_tokens": 168246121.0, + "step": 49250 + }, + { + "epoch": 0.49439961459713355, + "learning_rate": 0.0001011220843871693, + "loss": 0.6384, + "mean_token_accuracy": 0.8060955345630646, + "num_tokens": 168282885.0, + "step": 49260 + }, + { + "epoch": 0.49449997992693406, + "learning_rate": 0.0001011020113212092, + "loss": 0.6329, + "mean_token_accuracy": 0.8048595309257507, + "num_tokens": 168320252.0, + "step": 49270 + }, + { + "epoch": 0.4946003452567345, + "learning_rate": 0.00010108193825524912, + "loss": 0.6712, + "mean_token_accuracy": 0.7946819722652435, + "num_tokens": 168356206.0, + "step": 49280 + }, + { + "epoch": 0.494700710586535, + "learning_rate": 0.00010106186518928901, + "loss": 0.6733, + "mean_token_accuracy": 0.7937299966812134, + "num_tokens": 168391953.0, + "step": 49290 + }, + { + "epoch": 0.4948010759163355, + "learning_rate": 0.00010104179212332891, + "loss": 0.6366, + "mean_token_accuracy": 0.8032675206661224, + "num_tokens": 168428933.0, + "step": 49300 + }, + { + "epoch": 0.49490144124613594, + "learning_rate": 0.00010102171905736883, + "loss": 0.6546, + "mean_token_accuracy": 0.8021373987197876, + "num_tokens": 168465598.0, + "step": 49310 + }, + { + "epoch": 0.4950018065759364, + "learning_rate": 0.00010100164599140874, + "loss": 0.6679, + "mean_token_accuracy": 0.7983918905258178, + "num_tokens": 168501674.0, + "step": 49320 + }, + { + "epoch": 0.4951021719057369, + "learning_rate": 0.00010098157292544863, + "loss": 0.6692, + "mean_token_accuracy": 0.7963124752044678, + "num_tokens": 168538275.0, + "step": 49330 + }, + { + "epoch": 0.49520253723553737, + "learning_rate": 0.00010096149985948856, + "loss": 0.6484, + "mean_token_accuracy": 0.8078245878219604, + "num_tokens": 168574324.0, + "step": 49340 + }, + { + "epoch": 0.4953029025653378, + "learning_rate": 0.00010094142679352845, + "loss": 0.6205, + "mean_token_accuracy": 0.8130067169666291, + "num_tokens": 168612080.0, + "step": 49350 + }, + { + "epoch": 0.4954032678951383, + "learning_rate": 0.00010092135372756835, + "loss": 0.6383, + "mean_token_accuracy": 0.8053999781608582, + "num_tokens": 168647904.0, + "step": 49360 + }, + { + "epoch": 0.4955036332249388, + "learning_rate": 0.00010090128066160827, + "loss": 0.6892, + "mean_token_accuracy": 0.792946869134903, + "num_tokens": 168684673.0, + "step": 49370 + }, + { + "epoch": 0.49560399855473924, + "learning_rate": 0.00010088120759564816, + "loss": 0.6418, + "mean_token_accuracy": 0.8067975401878357, + "num_tokens": 168721319.0, + "step": 49380 + }, + { + "epoch": 0.4957043638845397, + "learning_rate": 0.00010086113452968806, + "loss": 0.6532, + "mean_token_accuracy": 0.8007255733013153, + "num_tokens": 168756977.0, + "step": 49390 + }, + { + "epoch": 0.4958047292143402, + "learning_rate": 0.00010084106146372798, + "loss": 0.6465, + "mean_token_accuracy": 0.8025450706481934, + "num_tokens": 168793421.0, + "step": 49400 + }, + { + "epoch": 0.49590509454414067, + "learning_rate": 0.00010082098839776787, + "loss": 0.6299, + "mean_token_accuracy": 0.8060990929603576, + "num_tokens": 168830890.0, + "step": 49410 + }, + { + "epoch": 0.4960054598739411, + "learning_rate": 0.00010080091533180778, + "loss": 0.6706, + "mean_token_accuracy": 0.8004979431629181, + "num_tokens": 168867582.0, + "step": 49420 + }, + { + "epoch": 0.49610582520374163, + "learning_rate": 0.00010078084226584769, + "loss": 0.6628, + "mean_token_accuracy": 0.8030794143676758, + "num_tokens": 168904001.0, + "step": 49430 + }, + { + "epoch": 0.4962061905335421, + "learning_rate": 0.0001007607691998876, + "loss": 0.6462, + "mean_token_accuracy": 0.8015866696834564, + "num_tokens": 168940290.0, + "step": 49440 + }, + { + "epoch": 0.49630655586334255, + "learning_rate": 0.0001007406961339275, + "loss": 0.6191, + "mean_token_accuracy": 0.8119408249855041, + "num_tokens": 168976309.0, + "step": 49450 + }, + { + "epoch": 0.49640692119314306, + "learning_rate": 0.00010072062306796742, + "loss": 0.6673, + "mean_token_accuracy": 0.8010443806648254, + "num_tokens": 169012558.0, + "step": 49460 + }, + { + "epoch": 0.4965072865229435, + "learning_rate": 0.00010070055000200731, + "loss": 0.6195, + "mean_token_accuracy": 0.8097262918949127, + "num_tokens": 169049535.0, + "step": 49470 + }, + { + "epoch": 0.49660765185274397, + "learning_rate": 0.0001006804769360472, + "loss": 0.6852, + "mean_token_accuracy": 0.7921403408050537, + "num_tokens": 169085900.0, + "step": 49480 + }, + { + "epoch": 0.4967080171825445, + "learning_rate": 0.00010066040387008713, + "loss": 0.6463, + "mean_token_accuracy": 0.803951519727707, + "num_tokens": 169122709.0, + "step": 49490 + }, + { + "epoch": 0.49680838251234494, + "learning_rate": 0.00010064033080412702, + "loss": 0.6329, + "mean_token_accuracy": 0.8065069198608399, + "num_tokens": 169159716.0, + "step": 49500 + }, + { + "epoch": 0.4969087478421454, + "learning_rate": 0.00010062025773816692, + "loss": 0.6487, + "mean_token_accuracy": 0.805515992641449, + "num_tokens": 169196873.0, + "step": 49510 + }, + { + "epoch": 0.4970091131719459, + "learning_rate": 0.00010060018467220684, + "loss": 0.6463, + "mean_token_accuracy": 0.8037728667259216, + "num_tokens": 169233220.0, + "step": 49520 + }, + { + "epoch": 0.49710947850174636, + "learning_rate": 0.00010058011160624674, + "loss": 0.6525, + "mean_token_accuracy": 0.8033924281597138, + "num_tokens": 169268598.0, + "step": 49530 + }, + { + "epoch": 0.4972098438315468, + "learning_rate": 0.00010056003854028664, + "loss": 0.6387, + "mean_token_accuracy": 0.8102546036243439, + "num_tokens": 169305958.0, + "step": 49540 + }, + { + "epoch": 0.4973102091613473, + "learning_rate": 0.00010053996547432655, + "loss": 0.6351, + "mean_token_accuracy": 0.8053695142269135, + "num_tokens": 169343030.0, + "step": 49550 + }, + { + "epoch": 0.4974105744911478, + "learning_rate": 0.00010051989240836646, + "loss": 0.6684, + "mean_token_accuracy": 0.7995011508464813, + "num_tokens": 169379356.0, + "step": 49560 + }, + { + "epoch": 0.49751093982094824, + "learning_rate": 0.00010049981934240636, + "loss": 0.6539, + "mean_token_accuracy": 0.8013176560401917, + "num_tokens": 169416109.0, + "step": 49570 + }, + { + "epoch": 0.49761130515074875, + "learning_rate": 0.00010047974627644628, + "loss": 0.6802, + "mean_token_accuracy": 0.7919177412986755, + "num_tokens": 169451622.0, + "step": 49580 + }, + { + "epoch": 0.4977116704805492, + "learning_rate": 0.00010045967321048617, + "loss": 0.6383, + "mean_token_accuracy": 0.8054239809513092, + "num_tokens": 169488330.0, + "step": 49590 + }, + { + "epoch": 0.49781203581034966, + "learning_rate": 0.00010043960014452607, + "loss": 0.6481, + "mean_token_accuracy": 0.802841168642044, + "num_tokens": 169525885.0, + "step": 49600 + }, + { + "epoch": 0.4979124011401502, + "learning_rate": 0.00010041952707856599, + "loss": 0.6379, + "mean_token_accuracy": 0.8047163426876068, + "num_tokens": 169562296.0, + "step": 49610 + }, + { + "epoch": 0.49801276646995063, + "learning_rate": 0.00010039945401260588, + "loss": 0.6268, + "mean_token_accuracy": 0.8083502173423767, + "num_tokens": 169599402.0, + "step": 49620 + }, + { + "epoch": 0.4981131317997511, + "learning_rate": 0.00010037938094664578, + "loss": 0.6333, + "mean_token_accuracy": 0.803332257270813, + "num_tokens": 169636381.0, + "step": 49630 + }, + { + "epoch": 0.49821349712955154, + "learning_rate": 0.0001003593078806857, + "loss": 0.6426, + "mean_token_accuracy": 0.8038518130779266, + "num_tokens": 169672825.0, + "step": 49640 + }, + { + "epoch": 0.49831386245935205, + "learning_rate": 0.0001003392348147256, + "loss": 0.6638, + "mean_token_accuracy": 0.8027487874031067, + "num_tokens": 169709047.0, + "step": 49650 + }, + { + "epoch": 0.4984142277891525, + "learning_rate": 0.00010031916174876552, + "loss": 0.6689, + "mean_token_accuracy": 0.8009410977363587, + "num_tokens": 169745629.0, + "step": 49660 + }, + { + "epoch": 0.49851459311895296, + "learning_rate": 0.00010029908868280543, + "loss": 0.6241, + "mean_token_accuracy": 0.8074738621711731, + "num_tokens": 169782734.0, + "step": 49670 + }, + { + "epoch": 0.4986149584487535, + "learning_rate": 0.00010027901561684532, + "loss": 0.6336, + "mean_token_accuracy": 0.8067907512187957, + "num_tokens": 169818752.0, + "step": 49680 + }, + { + "epoch": 0.49871532377855393, + "learning_rate": 0.00010025894255088524, + "loss": 0.6743, + "mean_token_accuracy": 0.7934290409088135, + "num_tokens": 169855523.0, + "step": 49690 + }, + { + "epoch": 0.4988156891083544, + "learning_rate": 0.00010023886948492514, + "loss": 0.6636, + "mean_token_accuracy": 0.7973025441169739, + "num_tokens": 169891446.0, + "step": 49700 + }, + { + "epoch": 0.4989160544381549, + "learning_rate": 0.00010021879641896503, + "loss": 0.6419, + "mean_token_accuracy": 0.803942346572876, + "num_tokens": 169928179.0, + "step": 49710 + }, + { + "epoch": 0.49901641976795535, + "learning_rate": 0.00010019872335300495, + "loss": 0.6543, + "mean_token_accuracy": 0.8052600800991059, + "num_tokens": 169965747.0, + "step": 49720 + }, + { + "epoch": 0.4991167850977558, + "learning_rate": 0.00010017865028704485, + "loss": 0.6674, + "mean_token_accuracy": 0.7950818300247192, + "num_tokens": 170002866.0, + "step": 49730 + }, + { + "epoch": 0.4992171504275563, + "learning_rate": 0.00010015857722108474, + "loss": 0.6541, + "mean_token_accuracy": 0.8007044196128845, + "num_tokens": 170038593.0, + "step": 49740 + }, + { + "epoch": 0.4993175157573568, + "learning_rate": 0.00010013850415512467, + "loss": 0.6492, + "mean_token_accuracy": 0.7999036848545075, + "num_tokens": 170074815.0, + "step": 49750 + }, + { + "epoch": 0.49941788108715723, + "learning_rate": 0.00010011843108916456, + "loss": 0.6641, + "mean_token_accuracy": 0.8008026003837585, + "num_tokens": 170111348.0, + "step": 49760 + }, + { + "epoch": 0.49951824641695775, + "learning_rate": 0.00010009835802320447, + "loss": 0.6804, + "mean_token_accuracy": 0.7891123533248902, + "num_tokens": 170148266.0, + "step": 49770 + }, + { + "epoch": 0.4996186117467582, + "learning_rate": 0.00010007828495724438, + "loss": 0.6088, + "mean_token_accuracy": 0.8154561638832092, + "num_tokens": 170185136.0, + "step": 49780 + }, + { + "epoch": 0.49971897707655866, + "learning_rate": 0.00010005821189128429, + "loss": 0.6328, + "mean_token_accuracy": 0.8048878014087677, + "num_tokens": 170221700.0, + "step": 49790 + }, + { + "epoch": 0.49981934240635917, + "learning_rate": 0.00010003813882532418, + "loss": 0.6362, + "mean_token_accuracy": 0.8061830341815949, + "num_tokens": 170257157.0, + "step": 49800 + }, + { + "epoch": 0.4999197077361596, + "learning_rate": 0.0001000180657593641, + "loss": 0.6683, + "mean_token_accuracy": 0.8000795781612396, + "num_tokens": 170294589.0, + "step": 49810 + } + ], + "logging_steps": 10, + "max_steps": 99636, + "num_input_tokens_seen": 0, + "num_train_epochs": 9223372036854775807, + "save_steps": 6227, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 1.0383456402076877e+19, + "train_batch_size": 8, + "trial_name": null, + "trial_params": null +}