{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 0.14933296000093332, "eval_steps": 500, "global_step": 1600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.013994489397321397, "completions/max_length": 4096.0, "completions/max_terminated_length": 4089.0, "completions/mean_length": 602.2059326171875, "completions/mean_terminated_length": 552.6181030273438, "completions/min_length": 2.0, "completions/min_terminated_length": 2.0, "epoch": 9.333310000058333e-05, "grad_norm": 0.13759930431842804, "learning_rate": 2e-07, "loss": -0.0068, "num_tokens": 80487871.0, "reward": 0.4955357313156128, "reward_std": 0.2621634304523468, "rewards/simpleverify_reward/mean": 0.4955357015132904, "rewards/simpleverify_reward/std": 0.49998223781585693, "step": 1 }, { "clip_ratio/high_max": 0.0022065689372539055, "clip_ratio/high_mean": 0.0009625226794014452, "clip_ratio/low_mean": 0.0005663340789396898, "clip_ratio/low_min": 4.5972034968144726e-05, "clip_ratio/region_mean": 0.0015288567119569052, "epoch": 0.00018666620000116666, "grad_norm": 0.14593245089054108, "learning_rate": 2e-07, "loss": 0.0385, "step": 2 }, { "clip_ratio/high_max": 0.0023433368041878566, "clip_ratio/high_mean": 0.0010155166455660947, "clip_ratio/low_mean": 0.0007225574772746768, "clip_ratio/low_min": 8.648486345919082e-05, "clip_ratio/region_mean": 0.0017380741555825807, "epoch": 0.00027999930000175, "grad_norm": 0.16658517718315125, "learning_rate": 2e-07, "loss": 0.014, "step": 3 }, { "clip_ratio/high_max": 0.0024255002208519727, "clip_ratio/high_mean": 0.00110565867726109, "clip_ratio/low_mean": 0.0005728674550482538, "clip_ratio/low_min": 6.876951829326572e-05, "clip_ratio/region_mean": 0.0016785261141194496, "epoch": 0.0003733324000023333, "grad_norm": 0.1453002244234085, "learning_rate": 2e-07, "loss": 0.0007, "step": 4 }, { "clip_ratio/high_max": 0.002428713138215244, "clip_ratio/high_mean": 0.0009994842312153196, "clip_ratio/low_mean": 0.0005600511813099729, "clip_ratio/low_min": 1.4038634617463686e-05, "clip_ratio/region_mean": 0.001559535459819017, "epoch": 0.0004666655000029167, "grad_norm": 0.15716636180877686, "learning_rate": 2e-07, "loss": 0.0044, "step": 5 }, { "clip_ratio/high_max": 0.0023563221766380593, "clip_ratio/high_mean": 0.0009962689400708769, "clip_ratio/low_mean": 0.0006411945159925381, "clip_ratio/low_min": 9.113018040807219e-05, "clip_ratio/region_mean": 0.0016374634578824043, "epoch": 0.0005599986000035, "grad_norm": 0.15626825392246246, "learning_rate": 2e-07, "loss": 0.0617, "step": 6 }, { "clip_ratio/high_max": 0.002178309681767132, "clip_ratio/high_mean": 0.001017291702737566, "clip_ratio/low_mean": 0.0005438413527372177, "clip_ratio/low_min": 3.59353189196554e-05, "clip_ratio/region_mean": 0.0015611330200044904, "epoch": 0.0006533317000040833, "grad_norm": 0.14875125885009766, "learning_rate": 2e-07, "loss": -0.0333, "step": 7 }, { "clip_ratio/high_max": 0.0020686753632617183, "clip_ratio/high_mean": 0.0009919455715134973, "clip_ratio/low_mean": 0.0007107318015187047, "clip_ratio/low_min": 8.877150139596779e-05, "clip_ratio/region_mean": 0.001702677363937255, "epoch": 0.0007466648000046666, "grad_norm": 0.13935565948486328, "learning_rate": 2e-07, "loss": 0.0417, "step": 8 }, { "clip_ratio/high_max": 0.002448531100526452, "clip_ratio/high_mean": 0.001032476775435498, "clip_ratio/low_mean": 0.0006827364650234813, "clip_ratio/low_min": 5.694810579370824e-05, "clip_ratio/region_mean": 0.001715213235002011, "epoch": 0.00083999790000525, "grad_norm": 0.13871818780899048, "learning_rate": 2e-07, "loss": 0.052, "step": 9 }, { "clip_ratio/high_max": 0.002254709688713774, "clip_ratio/high_mean": 0.0009634299531171564, "clip_ratio/low_mean": 0.0006807682948419824, "clip_ratio/low_min": 9.688676891528303e-05, "clip_ratio/region_mean": 0.0016441982152173296, "epoch": 0.0009333310000058334, "grad_norm": 0.11543914675712585, "learning_rate": 2e-07, "loss": 0.0401, "step": 10 }, { "clip_ratio/high_max": 0.002200855604314711, "clip_ratio/high_mean": 0.000960339792072773, "clip_ratio/low_mean": 0.0006979637983022258, "clip_ratio/low_min": 7.159902634157334e-05, "clip_ratio/region_mean": 0.0016583035539952107, "epoch": 0.0010266641000064166, "grad_norm": 0.12318608164787292, "learning_rate": 2e-07, "loss": 0.032, "step": 11 }, { "clip_ratio/high_max": 0.002388564680586569, "clip_ratio/high_mean": 0.0010493910122022498, "clip_ratio/low_mean": 0.0007610994052811293, "clip_ratio/low_min": 4.3404000280133914e-05, "clip_ratio/region_mean": 0.0018104904374922626, "epoch": 0.001119997200007, "grad_norm": 0.1322244256734848, "learning_rate": 2e-07, "loss": 0.054, "step": 12 }, { "clip_ratio/high_max": 0.0021475492685567588, "clip_ratio/high_mean": 0.0010192736262979452, "clip_ratio/low_mean": 0.0007309346656256821, "clip_ratio/low_min": 0.00011046460804209346, "clip_ratio/region_mean": 0.0017502082919236273, "epoch": 0.0012133303000075833, "grad_norm": 0.12162082642316818, "learning_rate": 2e-07, "loss": 0.0253, "step": 13 }, { "clip_ratio/high_max": 0.002686457461095415, "clip_ratio/high_mean": 0.0011275794568064157, "clip_ratio/low_mean": 0.000709394373188843, "clip_ratio/low_min": 9.19399926715414e-05, "clip_ratio/region_mean": 0.0018369737517787144, "epoch": 0.0013066634000081666, "grad_norm": 0.13558144867420197, "learning_rate": 2e-07, "loss": -0.0071, "step": 14 }, { "clip_ratio/high_max": 0.0023075636563589796, "clip_ratio/high_mean": 0.0010349815183872124, "clip_ratio/low_mean": 0.000776863449573284, "clip_ratio/low_min": 7.838475630705943e-05, "clip_ratio/region_mean": 0.001811845002521295, "epoch": 0.00139999650000875, "grad_norm": 0.12378548085689545, "learning_rate": 2e-07, "loss": 0.0035, "step": 15 }, { "clip_ratio/high_max": 0.0020779223086719867, "clip_ratio/high_mean": 0.0009064354762813309, "clip_ratio/low_mean": 0.000857465904118726, "clip_ratio/low_min": 0.00012368221723590977, "clip_ratio/region_mean": 0.0017639013822190464, "epoch": 0.0014933296000093333, "grad_norm": 0.13121728599071503, "learning_rate": 2e-07, "loss": 0.0395, "step": 16 }, { "clip_ratio/high_max": 0.002105526415107306, "clip_ratio/high_mean": 0.0008541039060219191, "clip_ratio/low_mean": 0.000901067291124491, "clip_ratio/low_min": 0.00012885413616459118, "clip_ratio/region_mean": 0.0017551711935084313, "epoch": 0.0015866627000099165, "grad_norm": 0.13397668302059174, "learning_rate": 2e-07, "loss": 0.0818, "step": 17 }, { "clip_ratio/high_max": 0.0021584492351394147, "clip_ratio/high_mean": 0.0010009718389483169, "clip_ratio/low_mean": 0.0007376163357548648, "clip_ratio/low_min": 8.004610208445229e-06, "clip_ratio/region_mean": 0.00173858818016015, "epoch": 0.0016799958000105, "grad_norm": 0.12542670965194702, "learning_rate": 2e-07, "loss": 0.0075, "step": 18 }, { "clip_ratio/high_max": 0.0023861460140324198, "clip_ratio/high_mean": 0.0009763397756614722, "clip_ratio/low_mean": 0.0006927458180143731, "clip_ratio/low_min": 5.242733914201381e-05, "clip_ratio/region_mean": 0.001669085628236644, "epoch": 0.0017733289000110833, "grad_norm": 0.11937450617551804, "learning_rate": 2e-07, "loss": 0.0292, "step": 19 }, { "clip_ratio/high_max": 0.002495621891284827, "clip_ratio/high_mean": 0.0011207825918972958, "clip_ratio/low_mean": 0.000782809733209433, "clip_ratio/low_min": 0.00011933081896131625, "clip_ratio/region_mean": 0.0019035923469346017, "epoch": 0.0018666620000116667, "grad_norm": 0.13186220824718475, "learning_rate": 2e-07, "loss": -0.0139, "step": 20 }, { "clip_ratio/high_max": 0.002186767407692969, "clip_ratio/high_mean": 0.0009634944144636393, "clip_ratio/low_mean": 0.000755790622861241, "clip_ratio/low_min": 2.755909736151807e-05, "clip_ratio/region_mean": 0.0017192850427818485, "epoch": 0.00195999510001225, "grad_norm": 0.11095698177814484, "learning_rate": 2e-07, "loss": -0.0212, "step": 21 }, { "clip_ratio/high_max": 0.0024067769627436064, "clip_ratio/high_mean": 0.0010147795474040322, "clip_ratio/low_mean": 0.0008198579434974818, "clip_ratio/low_min": 0.00011022948638128582, "clip_ratio/region_mean": 0.001834637499996461, "epoch": 0.002053328200012833, "grad_norm": 0.11780126392841339, "learning_rate": 2e-07, "loss": 0.0236, "step": 22 }, { "clip_ratio/high_max": 0.002067869958409574, "clip_ratio/high_mean": 0.001010547701298492, "clip_ratio/low_mean": 0.0009143011920969002, "clip_ratio/low_min": 0.00014466201173490845, "clip_ratio/region_mean": 0.0019248489406891167, "epoch": 0.0021466613000134167, "grad_norm": 0.12104950100183487, "learning_rate": 2e-07, "loss": -0.008, "step": 23 }, { "clip_ratio/high_max": 0.002511536680685822, "clip_ratio/high_mean": 0.0011440807102189865, "clip_ratio/low_mean": 0.0009340474935015664, "clip_ratio/low_min": 9.351481185149169e-05, "clip_ratio/region_mean": 0.0020781282073585317, "epoch": 0.002239994400014, "grad_norm": 0.12738487124443054, "learning_rate": 2e-07, "loss": 0.0094, "step": 24 }, { "clip_ratio/high_max": 0.00258793770626653, "clip_ratio/high_mean": 0.0011139254238514695, "clip_ratio/low_mean": 0.0009335441409348277, "clip_ratio/low_min": 0.00019500773305480834, "clip_ratio/region_mean": 0.002047469562967308, "epoch": 0.002333327500014583, "grad_norm": 0.1277008205652237, "learning_rate": 2e-07, "loss": -0.02, "step": 25 }, { "clip_ratio/high_max": 0.002398582386376802, "clip_ratio/high_mean": 0.0011080115582444705, "clip_ratio/low_mean": 0.0010934132551483344, "clip_ratio/low_min": 0.00013346978857953218, "clip_ratio/region_mean": 0.0022014248606865294, "epoch": 0.0024266606000151666, "grad_norm": 0.12345385551452637, "learning_rate": 2e-07, "loss": -0.0036, "step": 26 }, { "clip_ratio/high_max": 0.002720094969845377, "clip_ratio/high_mean": 0.0011887760629178956, "clip_ratio/low_mean": 0.0010345951486669946, "clip_ratio/low_min": 0.00013475633886628202, "clip_ratio/region_mean": 0.0022233712224988267, "epoch": 0.00251999370001575, "grad_norm": 0.13430047035217285, "learning_rate": 2e-07, "loss": 0.0234, "step": 27 }, { "clip_ratio/high_max": 0.002498956186173018, "clip_ratio/high_mean": 0.001244164272065973, "clip_ratio/low_mean": 0.0010510852043807972, "clip_ratio/low_min": 0.00020377309829200385, "clip_ratio/region_mean": 0.0022952494182391092, "epoch": 0.002613326800016333, "grad_norm": 0.12569083273410797, "learning_rate": 2e-07, "loss": -0.0333, "step": 28 }, { "clip_ratio/high_max": 0.003136533014185261, "clip_ratio/high_mean": 0.0013053406073595397, "clip_ratio/low_mean": 0.0009992614723159932, "clip_ratio/low_min": 0.00012081209615644184, "clip_ratio/region_mean": 0.00230460205784766, "epoch": 0.0027066599000169166, "grad_norm": 0.1379885971546173, "learning_rate": 2e-07, "loss": -0.0162, "step": 29 }, { "clip_ratio/high_max": 0.002233131916000275, "clip_ratio/high_mean": 0.0010059003379865317, "clip_ratio/low_mean": 0.0009712669161672238, "clip_ratio/low_min": 0.00011079046635131817, "clip_ratio/region_mean": 0.0019771672086790204, "epoch": 0.0027999930000175, "grad_norm": 0.12021656334400177, "learning_rate": 2e-07, "loss": 0.0035, "step": 30 }, { "clip_ratio/high_max": 0.002493700674676802, "clip_ratio/high_mean": 0.0011914396454812959, "clip_ratio/low_mean": 0.0011226971728319768, "clip_ratio/low_min": 0.0003030256293641287, "clip_ratio/region_mean": 0.002314136851055082, "epoch": 0.002893326100018083, "grad_norm": 0.12451107800006866, "learning_rate": 2e-07, "loss": 0.0446, "step": 31 }, { "clip_ratio/high_max": 0.002848641110176686, "clip_ratio/high_mean": 0.001282274919503834, "clip_ratio/low_mean": 0.0010856482258532196, "clip_ratio/low_min": 0.0001100680374293006, "clip_ratio/region_mean": 0.002367923138081096, "epoch": 0.0029866592000186666, "grad_norm": 0.12093507498502731, "learning_rate": 2e-07, "loss": 0.0189, "step": 32 }, { "clip_ratio/high_max": 0.0026684673321142327, "clip_ratio/high_mean": 0.0013065275743429083, "clip_ratio/low_mean": 0.0010640513010002906, "clip_ratio/low_min": 9.5175262686098e-05, "clip_ratio/region_mean": 0.0023705788407824002, "epoch": 0.00307999230001925, "grad_norm": 0.1341838538646698, "learning_rate": 2e-07, "loss": 0.0055, "step": 33 }, { "clip_ratio/high_max": 0.002769510538200848, "clip_ratio/high_mean": 0.001244209361175308, "clip_ratio/low_mean": 0.0010910430428339168, "clip_ratio/low_min": 0.0001066028157765686, "clip_ratio/region_mean": 0.0023352523712674156, "epoch": 0.003173325400019833, "grad_norm": 0.12575463950634003, "learning_rate": 2e-07, "loss": 0.0033, "step": 34 }, { "clip_ratio/high_max": 0.0024367462610825896, "clip_ratio/high_mean": 0.0011747546486731153, "clip_ratio/low_mean": 0.0010955417164950632, "clip_ratio/low_min": 3.440639738983009e-05, "clip_ratio/region_mean": 0.0022702963105984963, "epoch": 0.0032666585000204165, "grad_norm": 0.12949351966381073, "learning_rate": 2e-07, "loss": -0.0113, "step": 35 }, { "clip_ratio/high_max": 0.002706043560465332, "clip_ratio/high_mean": 0.001173496599221835, "clip_ratio/low_mean": 0.0010954059689538553, "clip_ratio/low_min": 9.105438311962644e-05, "clip_ratio/region_mean": 0.002268902593641542, "epoch": 0.003359991600021, "grad_norm": 0.11561225354671478, "learning_rate": 2e-07, "loss": 0.0003, "step": 36 }, { "clip_ratio/high_max": 0.002640869985043537, "clip_ratio/high_mean": 0.0010825259705598, "clip_ratio/low_mean": 0.0010512191183806863, "clip_ratio/low_min": 0.00014737742640136275, "clip_ratio/region_mean": 0.0021337450671126135, "epoch": 0.0034533247000215835, "grad_norm": 0.12649182975292206, "learning_rate": 2e-07, "loss": -0.0135, "step": 37 }, { "clip_ratio/high_max": 0.0028139656424173154, "clip_ratio/high_mean": 0.0012453914059733506, "clip_ratio/low_mean": 0.0010105448673130013, "clip_ratio/low_min": 0.00016016728750400944, "clip_ratio/region_mean": 0.002255936313304119, "epoch": 0.0035466578000221665, "grad_norm": 0.119010329246521, "learning_rate": 2e-07, "loss": -0.0077, "step": 38 }, { "clip_ratio/high_max": 0.0026386542813270353, "clip_ratio/high_mean": 0.0011948112114623655, "clip_ratio/low_mean": 0.0011335028684698045, "clip_ratio/low_min": 0.00017363267943437677, "clip_ratio/region_mean": 0.002328314039914403, "epoch": 0.00363999090002275, "grad_norm": 0.12449844926595688, "learning_rate": 2e-07, "loss": -0.0109, "step": 39 }, { "clip_ratio/high_max": 0.002565615861385595, "clip_ratio/high_mean": 0.0011511226402944885, "clip_ratio/low_mean": 0.0009204857378790621, "clip_ratio/low_min": 8.271289652839187e-05, "clip_ratio/region_mean": 0.0020716083381557837, "epoch": 0.0037333240000233334, "grad_norm": 0.11791258305311203, "learning_rate": 2e-07, "loss": -0.0073, "step": 40 }, { "clip_ratio/high_max": 0.002406888008408714, "clip_ratio/high_mean": 0.0010053035766759422, "clip_ratio/low_mean": 0.0010807540129462723, "clip_ratio/low_min": 0.00020829499953833874, "clip_ratio/region_mean": 0.0020860576114500873, "epoch": 0.0038266571000239165, "grad_norm": 0.12728513777256012, "learning_rate": 2e-07, "loss": 0.0777, "step": 41 }, { "clip_ratio/high_max": 0.0025397560675628483, "clip_ratio/high_mean": 0.00122109302537865, "clip_ratio/low_mean": 0.0010099066676048096, "clip_ratio/low_min": 0.0002008970968745416, "clip_ratio/region_mean": 0.0022309997293632478, "epoch": 0.0039199902000245, "grad_norm": 0.1368962973356247, "learning_rate": 2e-07, "loss": 0.0095, "step": 42 }, { "clip_ratio/high_max": 0.0023320901600527577, "clip_ratio/high_mean": 0.001088251665350981, "clip_ratio/low_mean": 0.0008656851623527473, "clip_ratio/low_min": 4.923844608129002e-05, "clip_ratio/region_mean": 0.0019539367931429297, "epoch": 0.004013323300025083, "grad_norm": 0.1204458698630333, "learning_rate": 2e-07, "loss": -0.0052, "step": 43 }, { "clip_ratio/high_max": 0.0025958994301618077, "clip_ratio/high_mean": 0.0010896955718635581, "clip_ratio/low_mean": 0.0010444923136674333, "clip_ratio/low_min": 0.00019318930208100937, "clip_ratio/region_mean": 0.002134187838237267, "epoch": 0.004106656400025666, "grad_norm": 0.11986131966114044, "learning_rate": 2e-07, "loss": 0.0231, "step": 44 }, { "clip_ratio/high_max": 0.0024874499431462027, "clip_ratio/high_mean": 0.0011461662506917492, "clip_ratio/low_mean": 0.0009556092281854944, "clip_ratio/low_min": 8.585712748754304e-05, "clip_ratio/region_mean": 0.0021017754916101694, "epoch": 0.00419998950002625, "grad_norm": 0.11773476004600525, "learning_rate": 2e-07, "loss": 0.0058, "step": 45 }, { "clip_ratio/high_max": 0.0024630759507999755, "clip_ratio/high_mean": 0.0010726907930802554, "clip_ratio/low_mean": 0.0009227466362062842, "clip_ratio/low_min": 0.00011095819900219794, "clip_ratio/region_mean": 0.0019954374147346243, "epoch": 0.004293322600026833, "grad_norm": 0.1204761192202568, "learning_rate": 2e-07, "loss": 0.0259, "step": 46 }, { "clip_ratio/high_max": 0.002413340269413311, "clip_ratio/high_mean": 0.0010251000931020826, "clip_ratio/low_mean": 0.0010457343742018566, "clip_ratio/low_min": 0.0001564217691338854, "clip_ratio/region_mean": 0.0020708344382001087, "epoch": 0.004386655700027417, "grad_norm": 0.12802086770534515, "learning_rate": 2e-07, "loss": 0.014, "step": 47 }, { "clip_ratio/high_max": 0.002588268253020942, "clip_ratio/high_mean": 0.0010833831474883482, "clip_ratio/low_mean": 0.0009809893563215155, "clip_ratio/low_min": 0.00017070886860892642, "clip_ratio/region_mean": 0.0020643725219997577, "epoch": 0.004479988800028, "grad_norm": 0.1164955422282219, "learning_rate": 2e-07, "loss": 0.0191, "step": 48 }, { "clip_ratio/high_max": 0.002303596593264956, "clip_ratio/high_mean": 0.00103465188658447, "clip_ratio/low_mean": 0.001013257020531455, "clip_ratio/low_min": 0.00013841588042851072, "clip_ratio/region_mean": 0.00204790889256401, "epoch": 0.004573321900028583, "grad_norm": 0.12419898808002472, "learning_rate": 2e-07, "loss": 0.0213, "step": 49 }, { "clip_ratio/high_max": 0.0022159460859256797, "clip_ratio/high_mean": 0.0009582727507222444, "clip_ratio/low_mean": 0.0008815987021080218, "clip_ratio/low_min": 0.0001522265965832048, "clip_ratio/region_mean": 0.0018398714528302662, "epoch": 0.004666655000029166, "grad_norm": 0.1171102523803711, "learning_rate": 2e-07, "loss": 0.0138, "step": 50 }, { "clip_ratio/high_max": 0.0023076578800100833, "clip_ratio/high_mean": 0.0010390221359557472, "clip_ratio/low_mean": 0.0009462763209739933, "clip_ratio/low_min": 0.0001251860048796516, "clip_ratio/region_mean": 0.0019852984114550054, "epoch": 0.00475998810002975, "grad_norm": 0.11780759692192078, "learning_rate": 2e-07, "loss": -0.0109, "step": 51 }, { "clip_ratio/high_max": 0.0024243152220151387, "clip_ratio/high_mean": 0.0011258704216743354, "clip_ratio/low_mean": 0.0010017458153015468, "clip_ratio/low_min": 9.4264531526278e-05, "clip_ratio/region_mean": 0.002127616258803755, "epoch": 0.004853321200030333, "grad_norm": 0.1206725686788559, "learning_rate": 2e-07, "loss": -0.0063, "step": 52 }, { "clip_ratio/high_max": 0.002432298511848785, "clip_ratio/high_mean": 0.0010811018401000183, "clip_ratio/low_mean": 0.0010167405926040374, "clip_ratio/low_min": 0.00022763140168535756, "clip_ratio/region_mean": 0.0020978424217901193, "epoch": 0.004946654300030917, "grad_norm": 0.12259439378976822, "learning_rate": 2e-07, "loss": 0.0325, "step": 53 }, { "clip_ratio/high_max": 0.002412291396467481, "clip_ratio/high_mean": 0.001037335683577112, "clip_ratio/low_mean": 0.0009035905022756197, "clip_ratio/low_min": 0.00010732095506682526, "clip_ratio/region_mean": 0.0019409262094995938, "epoch": 0.0050399874000315, "grad_norm": 0.1314329355955124, "learning_rate": 2e-07, "loss": 0.0118, "step": 54 }, { "clip_ratio/high_max": 0.0019421509277890436, "clip_ratio/high_mean": 0.0009373329194204416, "clip_ratio/low_mean": 0.0009320156805188162, "clip_ratio/low_min": 0.0001615060737094609, "clip_ratio/region_mean": 0.001869348605396226, "epoch": 0.005133320500032083, "grad_norm": 0.12206357717514038, "learning_rate": 2e-07, "loss": 0.0421, "step": 55 }, { "clip_ratio/high_max": 0.002275485239806585, "clip_ratio/high_mean": 0.0009570264955982566, "clip_ratio/low_mean": 0.0010482631223567296, "clip_ratio/low_min": 0.0002368123568885494, "clip_ratio/region_mean": 0.0020052896070410497, "epoch": 0.005226653600032666, "grad_norm": 0.1227516457438469, "learning_rate": 2e-07, "loss": 0.0403, "step": 56 }, { "clip_ratio/high_max": 0.002850349628715776, "clip_ratio/high_mean": 0.0011409435865061823, "clip_ratio/low_mean": 0.0010455916599312332, "clip_ratio/low_min": 0.00015849582632654347, "clip_ratio/region_mean": 0.0021865351882297546, "epoch": 0.00531998670003325, "grad_norm": 0.12860107421875, "learning_rate": 2e-07, "loss": 0.0561, "step": 57 }, { "clip_ratio/high_max": 0.002556306804763153, "clip_ratio/high_mean": 0.0012527340149972588, "clip_ratio/low_mean": 0.0008978071728051873, "clip_ratio/low_min": 7.28205914128921e-05, "clip_ratio/region_mean": 0.002150541215087287, "epoch": 0.005413319800033833, "grad_norm": 0.14245173335075378, "learning_rate": 2e-07, "loss": -0.0159, "step": 58 }, { "clip_ratio/high_max": 0.0024526212000637315, "clip_ratio/high_mean": 0.0011366845283191651, "clip_ratio/low_mean": 0.0010550674196565524, "clip_ratio/low_min": 0.00019996703304059338, "clip_ratio/region_mean": 0.0021917519698035903, "epoch": 0.005506652900034417, "grad_norm": 0.11834948509931564, "learning_rate": 2e-07, "loss": 0.0011, "step": 59 }, { "clip_ratio/high_max": 0.0025687809466035105, "clip_ratio/high_mean": 0.001065177140844753, "clip_ratio/low_mean": 0.0009816348192543956, "clip_ratio/low_min": 0.00016122754732350586, "clip_ratio/region_mean": 0.002046811983746011, "epoch": 0.005599986000035, "grad_norm": 0.12353020906448364, "learning_rate": 2e-07, "loss": 0.0392, "step": 60 }, { "clip_ratio/high_max": 0.0024015321432671044, "clip_ratio/high_mean": 0.0011070701530115912, "clip_ratio/low_mean": 0.0009576883185218321, "clip_ratio/low_min": 0.00024875444069039077, "clip_ratio/region_mean": 0.002064758460619487, "epoch": 0.005693319100035584, "grad_norm": 0.12785834074020386, "learning_rate": 2e-07, "loss": -0.0037, "step": 61 }, { "clip_ratio/high_max": 0.002829837794706691, "clip_ratio/high_mean": 0.0012178211654827464, "clip_ratio/low_mean": 0.0010184730381297413, "clip_ratio/low_min": 0.00011663909299386432, "clip_ratio/region_mean": 0.0022362941526807845, "epoch": 0.005786652200036166, "grad_norm": 0.12496073544025421, "learning_rate": 2e-07, "loss": 0.0039, "step": 62 }, { "clip_ratio/high_max": 0.0025347245900775306, "clip_ratio/high_mean": 0.0011178080385434441, "clip_ratio/low_mean": 0.0009502239408902824, "clip_ratio/low_min": 0.00016332157247234136, "clip_ratio/region_mean": 0.0020680319576058537, "epoch": 0.00587998530003675, "grad_norm": 0.11821945011615753, "learning_rate": 2e-07, "loss": 0.0117, "step": 63 }, { "clip_ratio/high_max": 0.0023334631114266813, "clip_ratio/high_mean": 0.0011029594425053801, "clip_ratio/low_mean": 0.001021804189804243, "clip_ratio/low_min": 7.583933984278701e-05, "clip_ratio/region_mean": 0.0021247636614134535, "epoch": 0.005973318400037333, "grad_norm": 0.12680988013744354, "learning_rate": 2e-07, "loss": -0.0123, "step": 64 }, { "clip_ratio/high_max": 0.0023923879089124966, "clip_ratio/high_mean": 0.0010150034868274815, "clip_ratio/low_mean": 0.001049237140250625, "clip_ratio/low_min": 9.225586654793005e-05, "clip_ratio/region_mean": 0.002064240637992043, "epoch": 0.006066651500037917, "grad_norm": 0.11140301078557968, "learning_rate": 2e-07, "loss": 0.0243, "step": 65 }, { "clip_ratio/high_max": 0.0024977811190183274, "clip_ratio/high_mean": 0.001150256806795369, "clip_ratio/low_mean": 0.0010544906981522217, "clip_ratio/low_min": 0.00019430756219662726, "clip_ratio/region_mean": 0.002204747484938707, "epoch": 0.0061599846000385, "grad_norm": 0.12916722893714905, "learning_rate": 2e-07, "loss": 0.0185, "step": 66 }, { "clip_ratio/high_max": 0.0025959548584069125, "clip_ratio/high_mean": 0.001167371137853479, "clip_ratio/low_mean": 0.0010923495319730137, "clip_ratio/low_min": 0.0001944821551660425, "clip_ratio/region_mean": 0.002259720698930323, "epoch": 0.0062533177000390835, "grad_norm": 0.12627947330474854, "learning_rate": 2e-07, "loss": 0.0355, "step": 67 }, { "clip_ratio/high_max": 0.002560061167969252, "clip_ratio/high_mean": 0.0010423159728816245, "clip_ratio/low_mean": 0.001075398762623081, "clip_ratio/low_min": 0.0001800854970497312, "clip_ratio/region_mean": 0.002117714684573002, "epoch": 0.006346650800039666, "grad_norm": 0.12196554243564606, "learning_rate": 2e-07, "loss": 0.044, "step": 68 }, { "clip_ratio/high_max": 0.002183907854487188, "clip_ratio/high_mean": 0.001033797969284933, "clip_ratio/low_mean": 0.0009016285021061776, "clip_ratio/low_min": 9.236746063834289e-05, "clip_ratio/region_mean": 0.0019354264732101, "epoch": 0.00643998390004025, "grad_norm": 0.11326209455728531, "learning_rate": 2e-07, "loss": -0.018, "step": 69 }, { "clip_ratio/high_max": 0.00226112810196355, "clip_ratio/high_mean": 0.0010268794794683345, "clip_ratio/low_mean": 0.00116620509288623, "clip_ratio/low_min": 0.00018076651394949295, "clip_ratio/region_mean": 0.0021930846050963737, "epoch": 0.006533317000040833, "grad_norm": 0.1239795833826065, "learning_rate": 2e-07, "loss": 0.001, "step": 70 }, { "clip_ratio/high_max": 0.002383978986472357, "clip_ratio/high_mean": 0.0010442595266795252, "clip_ratio/low_mean": 0.0010725457850639941, "clip_ratio/low_min": 0.000289766438982042, "clip_ratio/region_mean": 0.0021168053572182544, "epoch": 0.0066266501000414165, "grad_norm": 0.12646859884262085, "learning_rate": 2e-07, "loss": 0.0482, "step": 71 }, { "clip_ratio/high_max": 0.0021316590427886695, "clip_ratio/high_mean": 0.001035705838148715, "clip_ratio/low_mean": 0.0009940873133018613, "clip_ratio/low_min": 0.00015565583544230321, "clip_ratio/region_mean": 0.00202979314053664, "epoch": 0.006719983200042, "grad_norm": 0.1169920563697815, "learning_rate": 2e-07, "loss": -0.0145, "step": 72 }, { "clip_ratio/high_max": 0.0025822133757174015, "clip_ratio/high_mean": 0.0011686998295772355, "clip_ratio/low_mean": 0.0010936918588413391, "clip_ratio/low_min": 0.0001518342505733017, "clip_ratio/region_mean": 0.002262391659314744, "epoch": 0.0068133163000425835, "grad_norm": 0.12037884443998337, "learning_rate": 2e-07, "loss": 0.0198, "step": 73 }, { "clip_ratio/high_max": 0.0023944088025018573, "clip_ratio/high_mean": 0.001014676319755381, "clip_ratio/low_mean": 0.0010029844579548808, "clip_ratio/low_min": 0.00015791595251357649, "clip_ratio/region_mean": 0.002017660837736912, "epoch": 0.006906649400043167, "grad_norm": 0.11627409607172012, "learning_rate": 2e-07, "loss": 0.014, "step": 74 }, { "clip_ratio/high_max": 0.002566905299318023, "clip_ratio/high_mean": 0.0010877121276280377, "clip_ratio/low_mean": 0.0010018059547292069, "clip_ratio/low_min": 9.08300103219517e-05, "clip_ratio/region_mean": 0.002089518093271181, "epoch": 0.0069999825000437495, "grad_norm": 0.11353359371423721, "learning_rate": 2e-07, "loss": -0.0076, "step": 75 }, { "clip_ratio/high_max": 0.002526150274206884, "clip_ratio/high_mean": 0.0010816377834999003, "clip_ratio/low_mean": 0.0010003346942539793, "clip_ratio/low_min": 9.497723112872336e-05, "clip_ratio/region_mean": 0.002081972488667816, "epoch": 0.007093315600044333, "grad_norm": 0.13528339564800262, "learning_rate": 2e-07, "loss": 0.0146, "step": 76 }, { "clip_ratio/high_max": 0.0023559087348985486, "clip_ratio/high_mean": 0.0009873982016870286, "clip_ratio/low_mean": 0.000992194331047358, "clip_ratio/low_min": 0.0001231843475579808, "clip_ratio/region_mean": 0.0019795924818026833, "epoch": 0.0071866487000449165, "grad_norm": 0.12325123697519302, "learning_rate": 2e-07, "loss": 0.0539, "step": 77 }, { "clip_ratio/high_max": 0.0024407586024608463, "clip_ratio/high_mean": 0.0010995592892868444, "clip_ratio/low_mean": 0.0009877428547042655, "clip_ratio/low_min": 0.0001845628157752799, "clip_ratio/region_mean": 0.0020873021239822265, "epoch": 0.0072799818000455, "grad_norm": 0.12408103048801422, "learning_rate": 2e-07, "loss": -0.0092, "step": 78 }, { "clip_ratio/high_max": 0.002455210189509671, "clip_ratio/high_mean": 0.001221607471961761, "clip_ratio/low_mean": 0.0010295740103174467, "clip_ratio/low_min": 0.0001738988285069354, "clip_ratio/region_mean": 0.002251181489555165, "epoch": 0.007373314900046083, "grad_norm": 0.12384219467639923, "learning_rate": 2e-07, "loss": -0.0278, "step": 79 }, { "clip_ratio/high_max": 0.002472327949362807, "clip_ratio/high_mean": 0.0010085265930683818, "clip_ratio/low_mean": 0.001022365533572156, "clip_ratio/low_min": 0.00011979383361904183, "clip_ratio/region_mean": 0.0020308921157266013, "epoch": 0.007466648000046667, "grad_norm": 0.11716713756322861, "learning_rate": 2e-07, "loss": 0.0058, "step": 80 }, { "clip_ratio/high_max": 0.0026414465173729695, "clip_ratio/high_mean": 0.0011580698592297267, "clip_ratio/low_mean": 0.0010016011256084312, "clip_ratio/low_min": 0.00011491430086607579, "clip_ratio/region_mean": 0.002159670984838158, "epoch": 0.0075599811000472495, "grad_norm": 0.12005658447742462, "learning_rate": 2e-07, "loss": -0.011, "step": 81 }, { "clip_ratio/high_max": 0.0023819441121304408, "clip_ratio/high_mean": 0.0009984525095205754, "clip_ratio/low_mean": 0.0011438190049375407, "clip_ratio/low_min": 0.00016325494561897358, "clip_ratio/region_mean": 0.0021422715290100314, "epoch": 0.007653314200047833, "grad_norm": 0.13109754025936127, "learning_rate": 2e-07, "loss": 0.0606, "step": 82 }, { "clip_ratio/high_max": 0.00229565099652973, "clip_ratio/high_mean": 0.0010132619972864632, "clip_ratio/low_mean": 0.0009851778740994632, "clip_ratio/low_min": 0.00011706572968250839, "clip_ratio/region_mean": 0.00199843986047199, "epoch": 0.007746647300048416, "grad_norm": 0.12174177169799805, "learning_rate": 2e-07, "loss": 0.0045, "step": 83 }, { "clip_ratio/high_max": 0.0024214958248194307, "clip_ratio/high_mean": 0.0010194134210905759, "clip_ratio/low_mean": 0.0009943436853063758, "clip_ratio/low_min": 0.00011279054706392344, "clip_ratio/region_mean": 0.0020137571191298775, "epoch": 0.007839980400049, "grad_norm": 0.11000645905733109, "learning_rate": 2e-07, "loss": 0.0346, "step": 84 }, { "clip_ratio/high_max": 0.0024294516260852106, "clip_ratio/high_mean": 0.0010958889488392742, "clip_ratio/low_mean": 0.000996136248431867, "clip_ratio/low_min": 0.00011430255835875869, "clip_ratio/region_mean": 0.002092025155434385, "epoch": 0.007933313500049582, "grad_norm": 0.11078117787837982, "learning_rate": 2e-07, "loss": -0.0005, "step": 85 }, { "clip_ratio/high_max": 0.0020795044329133816, "clip_ratio/high_mean": 0.0010098625753016677, "clip_ratio/low_mean": 0.0009847307010204531, "clip_ratio/low_min": 0.0001200552878799499, "clip_ratio/region_mean": 0.0019945932217524387, "epoch": 0.008026646600050166, "grad_norm": 0.13004706799983978, "learning_rate": 2e-07, "loss": 0.0506, "step": 86 }, { "clip_ratio/high_max": 0.0023037327482597902, "clip_ratio/high_mean": 0.0009644545898481738, "clip_ratio/low_mean": 0.0010997420649800915, "clip_ratio/low_min": 0.0002121145516866818, "clip_ratio/region_mean": 0.0020641966330003925, "epoch": 0.00811997970005075, "grad_norm": 0.11882181465625763, "learning_rate": 2e-07, "loss": 0.0475, "step": 87 }, { "clip_ratio/high_max": 0.0021188969258219004, "clip_ratio/high_mean": 0.0009328400810773019, "clip_ratio/low_mean": 0.0010141383063455578, "clip_ratio/low_min": 0.00018170668226957787, "clip_ratio/region_mean": 0.0019469783510430716, "epoch": 0.008213312800051333, "grad_norm": 0.10904403775930405, "learning_rate": 2e-07, "loss": 0.0436, "step": 88 }, { "clip_ratio/high_max": 0.0022453466372098774, "clip_ratio/high_mean": 0.0011324450533720665, "clip_ratio/low_mean": 0.0010070324315165635, "clip_ratio/low_min": 7.470083437510766e-05, "clip_ratio/region_mean": 0.002139477481250651, "epoch": 0.008306645900051916, "grad_norm": 0.119810089468956, "learning_rate": 2e-07, "loss": 0.0159, "step": 89 }, { "clip_ratio/high_max": 0.002243947372335242, "clip_ratio/high_mean": 0.0009060739503183868, "clip_ratio/low_mean": 0.0009464389586355537, "clip_ratio/low_min": 0.00012365468001007685, "clip_ratio/region_mean": 0.0018525129416957498, "epoch": 0.0083999790000525, "grad_norm": 0.12912625074386597, "learning_rate": 2e-07, "loss": 0.0583, "step": 90 }, { "clip_ratio/high_max": 0.0027310406221658923, "clip_ratio/high_mean": 0.0012210035019961651, "clip_ratio/low_mean": 0.0010018622306233738, "clip_ratio/low_min": 0.00013228166972112376, "clip_ratio/region_mean": 0.0022228657398954965, "epoch": 0.008493312100053083, "grad_norm": 0.12694548070430756, "learning_rate": 2e-07, "loss": -0.0062, "step": 91 }, { "clip_ratio/high_max": 0.0025176576746162027, "clip_ratio/high_mean": 0.0010547294295975007, "clip_ratio/low_mean": 0.001119173779443372, "clip_ratio/low_min": 0.00016456622051919112, "clip_ratio/region_mean": 0.0021739032526966184, "epoch": 0.008586645200053667, "grad_norm": 0.12151345610618591, "learning_rate": 2e-07, "loss": 0.0272, "step": 92 }, { "clip_ratio/high_max": 0.002156324975658208, "clip_ratio/high_mean": 0.0010037311440100893, "clip_ratio/low_mean": 0.001022699161694618, "clip_ratio/low_min": 0.00021622756867145654, "clip_ratio/region_mean": 0.0020264303166186437, "epoch": 0.00867997830005425, "grad_norm": 0.12105920165777206, "learning_rate": 2e-07, "loss": 0.0384, "step": 93 }, { "clip_ratio/high_max": 0.00222276975546265, "clip_ratio/high_mean": 0.0010122564999619499, "clip_ratio/low_mean": 0.0009835495220613666, "clip_ratio/low_min": 0.00014661465775134275, "clip_ratio/region_mean": 0.001995805956539698, "epoch": 0.008773311400054834, "grad_norm": 0.11528412252664566, "learning_rate": 2e-07, "loss": 0.0233, "step": 94 }, { "clip_ratio/high_max": 0.002193732259911485, "clip_ratio/high_mean": 0.0010109655395353911, "clip_ratio/low_mean": 0.0010105909095727839, "clip_ratio/low_min": 0.00013143275282345712, "clip_ratio/region_mean": 0.0020215564290992916, "epoch": 0.008866644500055417, "grad_norm": 0.13224723935127258, "learning_rate": 2e-07, "loss": 0.0249, "step": 95 }, { "clip_ratio/high_max": 0.002265732779051177, "clip_ratio/high_mean": 0.0010632648336468264, "clip_ratio/low_mean": 0.0008662667805765523, "clip_ratio/low_min": 0.00011939525484194746, "clip_ratio/region_mean": 0.0019295316160423681, "epoch": 0.008959977600056, "grad_norm": 0.1173136830329895, "learning_rate": 2e-07, "loss": -0.0199, "step": 96 }, { "clip_ratio/high_max": 0.002467413080012193, "clip_ratio/high_mean": 0.0011397613561712205, "clip_ratio/low_mean": 0.0010071933284052648, "clip_ratio/low_min": 0.0001621500305191148, "clip_ratio/region_mean": 0.0021469547136803158, "epoch": 0.009053310700056582, "grad_norm": 0.11718394607305527, "learning_rate": 2e-07, "loss": 0.0203, "step": 97 }, { "clip_ratio/high_max": 0.002432377641525818, "clip_ratio/high_mean": 0.0009835719247348607, "clip_ratio/low_mean": 0.0010314748578821309, "clip_ratio/low_min": 0.00012290663289604709, "clip_ratio/region_mean": 0.0020150468189967796, "epoch": 0.009146643800057166, "grad_norm": 0.1221708208322525, "learning_rate": 2e-07, "loss": 0.0461, "step": 98 }, { "clip_ratio/high_max": 0.0020005115657113492, "clip_ratio/high_mean": 0.0010057074468932115, "clip_ratio/low_mean": 0.0010036065668828087, "clip_ratio/low_min": 0.00011503671430546092, "clip_ratio/region_mean": 0.002009314026508946, "epoch": 0.00923997690005775, "grad_norm": 0.12201784551143646, "learning_rate": 2e-07, "loss": 0.0083, "step": 99 }, { "clip_ratio/high_max": 0.0025391852686880156, "clip_ratio/high_mean": 0.0011396261470508762, "clip_ratio/low_mean": 0.0010271278661093675, "clip_ratio/low_min": 8.206730399251683e-05, "clip_ratio/region_mean": 0.002166754005884286, "epoch": 0.009333310000058333, "grad_norm": 0.1262112408876419, "learning_rate": 2e-07, "loss": -0.0029, "step": 100 }, { "clip_ratio/high_max": 0.0024612022534711286, "clip_ratio/high_mean": 0.0010904588416451588, "clip_ratio/low_mean": 0.0010210126583842793, "clip_ratio/low_min": 0.00016702443826943636, "clip_ratio/region_mean": 0.0021114715200383216, "epoch": 0.009426643100058916, "grad_norm": 0.11717819422483444, "learning_rate": 2e-07, "loss": 0.0071, "step": 101 }, { "clip_ratio/high_max": 0.0021987882573739626, "clip_ratio/high_mean": 0.0010625940121826716, "clip_ratio/low_mean": 0.0009707744065963197, "clip_ratio/low_min": 0.00013208571908762679, "clip_ratio/region_mean": 0.0020333684151410125, "epoch": 0.0095199762000595, "grad_norm": 0.11552350968122482, "learning_rate": 2e-07, "loss": 0.0224, "step": 102 }, { "clip_ratio/high_max": 0.0024559906305512413, "clip_ratio/high_mean": 0.0011159146124555264, "clip_ratio/low_mean": 0.0009331657183793141, "clip_ratio/low_min": 4.919136245007394e-05, "clip_ratio/region_mean": 0.0020490803362918086, "epoch": 0.009613309300060083, "grad_norm": 0.11701920628547668, "learning_rate": 2e-07, "loss": -0.0258, "step": 103 }, { "clip_ratio/high_max": 0.0023816749671823345, "clip_ratio/high_mean": 0.001012193530186778, "clip_ratio/low_mean": 0.0009461851859668968, "clip_ratio/low_min": 0.00010549517264735186, "clip_ratio/region_mean": 0.0019583787507144734, "epoch": 0.009706642400060667, "grad_norm": 0.11259889602661133, "learning_rate": 2e-07, "loss": 0.0251, "step": 104 }, { "clip_ratio/high_max": 0.00212989590363577, "clip_ratio/high_mean": 0.0009342385528725572, "clip_ratio/low_mean": 0.0009668715902080294, "clip_ratio/low_min": 0.00010830151722984738, "clip_ratio/region_mean": 0.0019011101830983534, "epoch": 0.00979997550006125, "grad_norm": 0.12469930946826935, "learning_rate": 2e-07, "loss": 0.0533, "step": 105 }, { "clip_ratio/high_max": 0.002451618667691946, "clip_ratio/high_mean": 0.0011513749886944424, "clip_ratio/low_mean": 0.0010595429776003584, "clip_ratio/low_min": 0.00022127971715235617, "clip_ratio/region_mean": 0.002210917926277034, "epoch": 0.009893308600061834, "grad_norm": 0.11920561641454697, "learning_rate": 2e-07, "loss": -0.0019, "step": 106 }, { "clip_ratio/high_max": 0.0025042207271326333, "clip_ratio/high_mean": 0.0011723431707650889, "clip_ratio/low_mean": 0.0009398496458743466, "clip_ratio/low_min": 0.00010294335697835777, "clip_ratio/region_mean": 0.00211219289485598, "epoch": 0.009986641700062417, "grad_norm": 0.1202285960316658, "learning_rate": 2e-07, "loss": -0.0136, "step": 107 }, { "clip_ratio/high_max": 0.002313672528543975, "clip_ratio/high_mean": 0.0010140827907889616, "clip_ratio/low_mean": 0.0009474849794059992, "clip_ratio/low_min": 9.074427362065762e-05, "clip_ratio/region_mean": 0.0019615677738329396, "epoch": 0.010079974800063, "grad_norm": 0.10966669023036957, "learning_rate": 2e-07, "loss": 0.0368, "step": 108 }, { "clip_ratio/high_max": 0.0023918012739159167, "clip_ratio/high_mean": 0.0010347984916734276, "clip_ratio/low_mean": 0.00109369298479578, "clip_ratio/low_min": 0.0001953406954271486, "clip_ratio/region_mean": 0.002128491483745165, "epoch": 0.010173307900063584, "grad_norm": 0.11710379272699356, "learning_rate": 2e-07, "loss": 0.0152, "step": 109 }, { "clip_ratio/high_max": 0.0027658634789986536, "clip_ratio/high_mean": 0.0011351373177603818, "clip_ratio/low_mean": 0.0012089416195522062, "clip_ratio/low_min": 0.0002850216296792496, "clip_ratio/region_mean": 0.0023440789664164186, "epoch": 0.010266641000064166, "grad_norm": 0.11934376507997513, "learning_rate": 2e-07, "loss": 0.056, "step": 110 }, { "clip_ratio/high_max": 0.002852796300430782, "clip_ratio/high_mean": 0.0011598841665545478, "clip_ratio/low_mean": 0.001075643111107638, "clip_ratio/low_min": 0.00011548764632607345, "clip_ratio/region_mean": 0.0022355272667482495, "epoch": 0.010359974100064749, "grad_norm": 0.12586535513401031, "learning_rate": 2e-07, "loss": 0.0103, "step": 111 }, { "clip_ratio/high_max": 0.0026857995180762373, "clip_ratio/high_mean": 0.0011435229353082832, "clip_ratio/low_mean": 0.000963541697274195, "clip_ratio/low_min": 2.432853216305375e-05, "clip_ratio/region_mean": 0.002107064654410351, "epoch": 0.010453307200065333, "grad_norm": 0.11803115159273148, "learning_rate": 2e-07, "loss": -0.0018, "step": 112 }, { "clip_ratio/high_max": 0.002378153170866426, "clip_ratio/high_mean": 0.0011447355609561782, "clip_ratio/low_mean": 0.0010742325212049764, "clip_ratio/low_min": 0.00016662020789226517, "clip_ratio/region_mean": 0.0022189680312294513, "epoch": 0.010546640300065916, "grad_norm": 0.1251862347126007, "learning_rate": 2e-07, "loss": 0.0357, "step": 113 }, { "clip_ratio/high_max": 0.0026185399838141166, "clip_ratio/high_mean": 0.0010829621423908975, "clip_ratio/low_mean": 0.001015963982354151, "clip_ratio/low_min": 0.0001398567055730382, "clip_ratio/region_mean": 0.002098926095641218, "epoch": 0.0106399734000665, "grad_norm": 0.12317952513694763, "learning_rate": 2e-07, "loss": 0.0521, "step": 114 }, { "clip_ratio/high_max": 0.0021184968427405693, "clip_ratio/high_mean": 0.0009378883842146024, "clip_ratio/low_mean": 0.0010725193696998758, "clip_ratio/low_min": 8.47551305014349e-05, "clip_ratio/region_mean": 0.0020104077557334676, "epoch": 0.010733306500067083, "grad_norm": 0.11267170310020447, "learning_rate": 2e-07, "loss": 0.0513, "step": 115 }, { "clip_ratio/high_max": 0.0025126855543931015, "clip_ratio/high_mean": 0.0010404367785668, "clip_ratio/low_mean": 0.0011350272052368382, "clip_ratio/low_min": 0.00015253056062647374, "clip_ratio/region_mean": 0.002175463981984649, "epoch": 0.010826639600067666, "grad_norm": 0.11584781855344772, "learning_rate": 2e-07, "loss": 0.0269, "step": 116 }, { "clip_ratio/high_max": 0.002355060656554997, "clip_ratio/high_mean": 0.0011476631516416091, "clip_ratio/low_mean": 0.0009783512996364152, "clip_ratio/low_min": 0.00014119092520559207, "clip_ratio/region_mean": 0.00212601446401095, "epoch": 0.01091997270006825, "grad_norm": 0.12706851959228516, "learning_rate": 2e-07, "loss": -0.0213, "step": 117 }, { "clip_ratio/high_max": 0.002446399499604013, "clip_ratio/high_mean": 0.0011725875046977308, "clip_ratio/low_mean": 0.0010147828197659692, "clip_ratio/low_min": 0.0001541780011393712, "clip_ratio/region_mean": 0.00218737029354088, "epoch": 0.011013305800068833, "grad_norm": 0.1259663850069046, "learning_rate": 2e-07, "loss": -0.0408, "step": 118 }, { "clip_ratio/high_max": 0.002223934541689232, "clip_ratio/high_mean": 0.0009736770844028797, "clip_ratio/low_mean": 0.0009884823630272876, "clip_ratio/low_min": 0.00015057997279654955, "clip_ratio/region_mean": 0.0019621594983618706, "epoch": 0.011106638900069417, "grad_norm": 0.11884410679340363, "learning_rate": 2e-07, "loss": 0.0311, "step": 119 }, { "clip_ratio/high_max": 0.002796456406940706, "clip_ratio/high_mean": 0.0011866843269672245, "clip_ratio/low_mean": 0.0010362978973716963, "clip_ratio/low_min": 4.235373671690468e-05, "clip_ratio/region_mean": 0.0022229822134249844, "epoch": 0.01119997200007, "grad_norm": 0.11630505323410034, "learning_rate": 2e-07, "loss": 0.026, "step": 120 }, { "clip_ratio/high_max": 0.0025063391512958333, "clip_ratio/high_mean": 0.0010551042378210695, "clip_ratio/low_mean": 0.001064993270119885, "clip_ratio/low_min": 0.00017890606522996677, "clip_ratio/region_mean": 0.002120097487932071, "epoch": 0.011293305100070584, "grad_norm": 0.11852765828371048, "learning_rate": 2e-07, "loss": 0.0004, "step": 121 }, { "clip_ratio/high_max": 0.0022325711106532253, "clip_ratio/high_mean": 0.0011019281300832517, "clip_ratio/low_mean": 0.0010778661835502135, "clip_ratio/low_min": 0.00022602467743126908, "clip_ratio/region_mean": 0.0021797943336423486, "epoch": 0.011386638200071167, "grad_norm": 0.12814253568649292, "learning_rate": 2e-07, "loss": 0.026, "step": 122 }, { "clip_ratio/high_max": 0.0021846044510311913, "clip_ratio/high_mean": 0.0010939260846498655, "clip_ratio/low_mean": 0.0010973173193633556, "clip_ratio/low_min": 0.00018606262528919615, "clip_ratio/region_mean": 0.0021912433512625284, "epoch": 0.011479971300071749, "grad_norm": 0.12078071385622025, "learning_rate": 2e-07, "loss": 0.0264, "step": 123 }, { "clip_ratio/high_max": 0.002277482344652526, "clip_ratio/high_mean": 0.001035465222230414, "clip_ratio/low_mean": 0.0011094832807430066, "clip_ratio/low_min": 0.00019225356118113268, "clip_ratio/region_mean": 0.00214494853571523, "epoch": 0.011573304400072332, "grad_norm": 0.12044785916805267, "learning_rate": 2e-07, "loss": 0.0533, "step": 124 }, { "clip_ratio/high_max": 0.002055894408840686, "clip_ratio/high_mean": 0.0009552461688144831, "clip_ratio/low_mean": 0.0011814787358161993, "clip_ratio/low_min": 0.00018279723190062214, "clip_ratio/region_mean": 0.0021367249355535023, "epoch": 0.011666637500072916, "grad_norm": 0.11136198788881302, "learning_rate": 2e-07, "loss": 0.0256, "step": 125 }, { "clip_ratio/high_max": 0.0021344584347389173, "clip_ratio/high_mean": 0.0009915252703649458, "clip_ratio/low_mean": 0.0010342523928557057, "clip_ratio/low_min": 8.750762754061725e-05, "clip_ratio/region_mean": 0.0020257776486687362, "epoch": 0.0117599706000735, "grad_norm": 0.11416833102703094, "learning_rate": 2e-07, "loss": 0.0178, "step": 126 }, { "clip_ratio/high_max": 0.0023940432074596174, "clip_ratio/high_mean": 0.0010396204561402556, "clip_ratio/low_mean": 0.0010296534455846995, "clip_ratio/low_min": 0.00014903274586686166, "clip_ratio/region_mean": 0.002069273861707188, "epoch": 0.011853303700074083, "grad_norm": 0.11465053260326385, "learning_rate": 2e-07, "loss": -0.0009, "step": 127 }, { "clip_ratio/high_max": 0.0026578558317851275, "clip_ratio/high_mean": 0.0012486195446399506, "clip_ratio/low_mean": 0.0012774387905665208, "clip_ratio/low_min": 0.00030210926070139976, "clip_ratio/region_mean": 0.002526058306102641, "epoch": 0.011946636800074666, "grad_norm": 0.1288243681192398, "learning_rate": 2e-07, "loss": 0.0361, "step": 128 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.014474051339285698, "completions/max_length": 4096.0, "completions/max_terminated_length": 4094.0, "completions/mean_length": 610.05322265625, "completions/mean_terminated_length": 558.8564453125, "completions/min_length": 2.0, "completions/min_terminated_length": 2.0, "epoch": 0.01203996990007525, "grad_norm": 0.1481635570526123, "learning_rate": 2e-07, "loss": 0.0137, "num_tokens": 161917157.0, "reward": 0.5136893391609192, "reward_std": 0.24727264046669006, "rewards/simpleverify_reward/mean": 0.5136893391609192, "rewards/simpleverify_reward/std": 0.4998147487640381, "step": 129 }, { "clip_ratio/high_max": 0.002211647341027856, "clip_ratio/high_mean": 0.000984449598036008, "clip_ratio/low_mean": 0.0006245471195143182, "clip_ratio/low_min": 3.37695755661116e-05, "clip_ratio/region_mean": 0.0016089966957224533, "epoch": 0.012133303000075833, "grad_norm": 0.15445207059383392, "learning_rate": 2e-07, "loss": 0.0037, "step": 130 }, { "clip_ratio/high_max": 0.00216038481448777, "clip_ratio/high_mean": 0.000923966563277645, "clip_ratio/low_mean": 0.0006574549606739311, "clip_ratio/low_min": 4.991430296286126e-05, "clip_ratio/region_mean": 0.0015814215439604595, "epoch": 0.012226636100076417, "grad_norm": 0.13598668575286865, "learning_rate": 2e-07, "loss": 0.0691, "step": 131 }, { "clip_ratio/high_max": 0.002012094970268663, "clip_ratio/high_mean": 0.0008784737201494863, "clip_ratio/low_mean": 0.0006145324923636508, "clip_ratio/low_min": 2.2145901311887428e-05, "clip_ratio/region_mean": 0.0014930061879567802, "epoch": 0.012319969200077, "grad_norm": 0.12511757016181946, "learning_rate": 2e-07, "loss": 0.0448, "step": 132 }, { "clip_ratio/high_max": 0.0023118868994060904, "clip_ratio/high_mean": 0.0009706778546387795, "clip_ratio/low_mean": 0.0005756515620305436, "clip_ratio/low_min": 6.218823000381235e-05, "clip_ratio/region_mean": 0.0015463294039363973, "epoch": 0.012413302300077584, "grad_norm": 0.15425211191177368, "learning_rate": 2e-07, "loss": -0.007, "step": 133 }, { "clip_ratio/high_max": 0.0018785969077725895, "clip_ratio/high_mean": 0.0009155198531516362, "clip_ratio/low_mean": 0.0006921184613020159, "clip_ratio/low_min": 4.8694160796003416e-05, "clip_ratio/region_mean": 0.0016076382889878005, "epoch": 0.012506635400078167, "grad_norm": 0.13897864520549774, "learning_rate": 2e-07, "loss": -0.0316, "step": 134 }, { "clip_ratio/high_max": 0.002373968221945688, "clip_ratio/high_mean": 0.0009355184920423198, "clip_ratio/low_mean": 0.0006981673650443554, "clip_ratio/low_min": 5.6507944464101456e-05, "clip_ratio/region_mean": 0.0016336858716385905, "epoch": 0.01259996850007875, "grad_norm": 0.1365860253572464, "learning_rate": 2e-07, "loss": 0.061, "step": 135 }, { "clip_ratio/high_max": 0.002057610938209109, "clip_ratio/high_mean": 0.0008843443738442147, "clip_ratio/low_mean": 0.0006922691063664388, "clip_ratio/low_min": 7.425179410347482e-05, "clip_ratio/region_mean": 0.0015766134893056005, "epoch": 0.012693301600079332, "grad_norm": 0.1134004071354866, "learning_rate": 2e-07, "loss": -0.0163, "step": 136 }, { "clip_ratio/high_max": 0.00218633831536863, "clip_ratio/high_mean": 0.0009235689030901995, "clip_ratio/low_mean": 0.0006719948432873935, "clip_ratio/low_min": 2.8179449145682156e-05, "clip_ratio/region_mean": 0.0015955637500155717, "epoch": 0.012786634700079916, "grad_norm": 0.12747465074062347, "learning_rate": 2e-07, "loss": -0.0312, "step": 137 }, { "clip_ratio/high_max": 0.002430728869512677, "clip_ratio/high_mean": 0.0010949140796583379, "clip_ratio/low_mean": 0.0007029299140413059, "clip_ratio/low_min": 4.506847562879557e-05, "clip_ratio/region_mean": 0.0017978440009756014, "epoch": 0.0128799678000805, "grad_norm": 0.12068028748035431, "learning_rate": 2e-07, "loss": -0.0171, "step": 138 }, { "clip_ratio/high_max": 0.002370481764955912, "clip_ratio/high_mean": 0.0010152555114473216, "clip_ratio/low_mean": 0.0008535381530236918, "clip_ratio/low_min": 0.00013393160861596698, "clip_ratio/region_mean": 0.0018687936317292042, "epoch": 0.012973300900081083, "grad_norm": 0.11235835403203964, "learning_rate": 2e-07, "loss": 0.0459, "step": 139 }, { "clip_ratio/high_max": 0.0022311235952656716, "clip_ratio/high_mean": 0.0009908980537147727, "clip_ratio/low_mean": 0.0007660091373509204, "clip_ratio/low_min": 7.527978232246824e-05, "clip_ratio/region_mean": 0.001756907171511557, "epoch": 0.013066634000081666, "grad_norm": 0.12476195394992828, "learning_rate": 2e-07, "loss": 0.0339, "step": 140 }, { "clip_ratio/high_max": 0.0022383901305147447, "clip_ratio/high_mean": 0.0010416057630209252, "clip_ratio/low_mean": 0.0008024508297239663, "clip_ratio/low_min": 5.7943819228967186e-05, "clip_ratio/region_mean": 0.0018440565909259021, "epoch": 0.01315996710008225, "grad_norm": 0.109299436211586, "learning_rate": 2e-07, "loss": 0.0152, "step": 141 }, { "clip_ratio/high_max": 0.0025618308791308664, "clip_ratio/high_mean": 0.0011667920807667542, "clip_ratio/low_mean": 0.0008302256574097555, "clip_ratio/low_min": 0.00021148962741790456, "clip_ratio/region_mean": 0.001997017730900552, "epoch": 0.013253300200082833, "grad_norm": 0.12275847792625427, "learning_rate": 2e-07, "loss": -0.0001, "step": 142 }, { "clip_ratio/high_max": 0.002405607134278398, "clip_ratio/high_mean": 0.0010996874152624514, "clip_ratio/low_mean": 0.0008707080196472816, "clip_ratio/low_min": 0.00011949604868277675, "clip_ratio/region_mean": 0.0019703954822034575, "epoch": 0.013346633300083417, "grad_norm": 0.12709520757198334, "learning_rate": 2e-07, "loss": 0.0058, "step": 143 }, { "clip_ratio/high_max": 0.0023418017954099923, "clip_ratio/high_mean": 0.001025439654767979, "clip_ratio/low_mean": 0.0008895361261238577, "clip_ratio/low_min": 0.0001655283231229987, "clip_ratio/region_mean": 0.0019149758300045505, "epoch": 0.013439966400084, "grad_norm": 0.11988680064678192, "learning_rate": 2e-07, "loss": -0.0056, "step": 144 }, { "clip_ratio/high_max": 0.002276813036587555, "clip_ratio/high_mean": 0.0011238606202823576, "clip_ratio/low_mean": 0.000917119574296521, "clip_ratio/low_min": 0.0001440282931071124, "clip_ratio/region_mean": 0.0020409802382346243, "epoch": 0.013533299500084583, "grad_norm": 0.12003538757562637, "learning_rate": 2e-07, "loss": -0.0342, "step": 145 }, { "clip_ratio/high_max": 0.0027001834896509536, "clip_ratio/high_mean": 0.0010937901697616326, "clip_ratio/low_mean": 0.000816682566437521, "clip_ratio/low_min": 6.690785448881797e-05, "clip_ratio/region_mean": 0.0019104727180092596, "epoch": 0.013626632600085167, "grad_norm": 0.11384635418653488, "learning_rate": 2e-07, "loss": -0.01, "step": 146 }, { "clip_ratio/high_max": 0.0025461251570959575, "clip_ratio/high_mean": 0.0010602314396237489, "clip_ratio/low_mean": 0.0009832671112235403, "clip_ratio/low_min": 0.00013367325300350785, "clip_ratio/region_mean": 0.0020434985563042574, "epoch": 0.01371996570008575, "grad_norm": 0.12295091897249222, "learning_rate": 2e-07, "loss": -0.016, "step": 147 }, { "clip_ratio/high_max": 0.0021047491318313405, "clip_ratio/high_mean": 0.0009729219982546056, "clip_ratio/low_mean": 0.0009922916942741722, "clip_ratio/low_min": 7.056615731926286e-05, "clip_ratio/region_mean": 0.0019652137489174493, "epoch": 0.013813298800086334, "grad_norm": 0.11358130723237991, "learning_rate": 2e-07, "loss": 0.0156, "step": 148 }, { "clip_ratio/high_max": 0.0022650709724985063, "clip_ratio/high_mean": 0.000914602027478395, "clip_ratio/low_mean": 0.0009901806697598659, "clip_ratio/low_min": 5.657449037244078e-05, "clip_ratio/region_mean": 0.0019047827299800701, "epoch": 0.013906631900086916, "grad_norm": 0.10851912200450897, "learning_rate": 2e-07, "loss": 0.0372, "step": 149 }, { "clip_ratio/high_max": 0.002455469271808397, "clip_ratio/high_mean": 0.0010375056244811276, "clip_ratio/low_mean": 0.0009754002276167739, "clip_ratio/low_min": 0.00015446253928530496, "clip_ratio/region_mean": 0.00201290579570923, "epoch": 0.013999965000087499, "grad_norm": 0.11816101521253586, "learning_rate": 2e-07, "loss": 0.0281, "step": 150 }, { "clip_ratio/high_max": 0.0020574581212713383, "clip_ratio/high_mean": 0.0009042886067618383, "clip_ratio/low_mean": 0.0011247423099121079, "clip_ratio/low_min": 0.00023100295948097482, "clip_ratio/region_mean": 0.002029030911216978, "epoch": 0.014093298100088083, "grad_norm": 0.11871708929538727, "learning_rate": 2e-07, "loss": 0.0726, "step": 151 }, { "clip_ratio/high_max": 0.0023412091395584866, "clip_ratio/high_mean": 0.0010717992008721922, "clip_ratio/low_mean": 0.0009969192469725385, "clip_ratio/low_min": 8.999525653052842e-05, "clip_ratio/region_mean": 0.0020687184296548367, "epoch": 0.014186631200088666, "grad_norm": 0.11756947636604309, "learning_rate": 2e-07, "loss": 0.0149, "step": 152 }, { "clip_ratio/high_max": 0.0022104529416537844, "clip_ratio/high_mean": 0.001048275862558512, "clip_ratio/low_mean": 0.00096182550987578, "clip_ratio/low_min": 0.0001271830760742887, "clip_ratio/region_mean": 0.002010101394262165, "epoch": 0.01427996430008925, "grad_norm": 0.11331942677497864, "learning_rate": 2e-07, "loss": 0.0148, "step": 153 }, { "clip_ratio/high_max": 0.0025152997841360047, "clip_ratio/high_mean": 0.0010446363376104273, "clip_ratio/low_mean": 0.0010225364967482165, "clip_ratio/low_min": 2.0619086171791423e-05, "clip_ratio/region_mean": 0.0020671728780143894, "epoch": 0.014373297400089833, "grad_norm": 0.1262289136648178, "learning_rate": 2e-07, "loss": -0.0138, "step": 154 }, { "clip_ratio/high_max": 0.0023504127057094593, "clip_ratio/high_mean": 0.0010495629649085458, "clip_ratio/low_mean": 0.001205289489007555, "clip_ratio/low_min": 0.00017996442056755768, "clip_ratio/region_mean": 0.002254852428450249, "epoch": 0.014466630500090416, "grad_norm": 0.12503443658351898, "learning_rate": 2e-07, "loss": 0.0316, "step": 155 }, { "clip_ratio/high_max": 0.0020614491986634675, "clip_ratio/high_mean": 0.0009952435721061192, "clip_ratio/low_mean": 0.0009899511169351172, "clip_ratio/low_min": 9.162593323708279e-05, "clip_ratio/region_mean": 0.001985194699955173, "epoch": 0.014559963600091, "grad_norm": 0.1194966584444046, "learning_rate": 2e-07, "loss": 0.0245, "step": 156 }, { "clip_ratio/high_max": 0.0024101724702632055, "clip_ratio/high_mean": 0.000988665888144169, "clip_ratio/low_mean": 0.0010312882568541681, "clip_ratio/low_min": 7.801058018230833e-05, "clip_ratio/region_mean": 0.002019954139541369, "epoch": 0.014653296700091583, "grad_norm": 0.11390312761068344, "learning_rate": 2e-07, "loss": 0.0614, "step": 157 }, { "clip_ratio/high_max": 0.002043804110144265, "clip_ratio/high_mean": 0.0009360972471768036, "clip_ratio/low_mean": 0.0010851766710402444, "clip_ratio/low_min": 0.00013144642889528768, "clip_ratio/region_mean": 0.0020212739291309845, "epoch": 0.014746629800092167, "grad_norm": 0.11520647257566452, "learning_rate": 2e-07, "loss": 0.0465, "step": 158 }, { "clip_ratio/high_max": 0.0024747769930399954, "clip_ratio/high_mean": 0.0010577441644272767, "clip_ratio/low_mean": 0.0009229692714143312, "clip_ratio/low_min": 0.00012402843276504427, "clip_ratio/region_mean": 0.0019807134740403853, "epoch": 0.01483996290009275, "grad_norm": 0.11063252389431, "learning_rate": 2e-07, "loss": 0.0003, "step": 159 }, { "clip_ratio/high_max": 0.002349348447751254, "clip_ratio/high_mean": 0.0010158413497265428, "clip_ratio/low_mean": 0.00109984969276411, "clip_ratio/low_min": 0.00011386273354219156, "clip_ratio/region_mean": 0.002115691044309642, "epoch": 0.014933296000093334, "grad_norm": 0.11516238749027252, "learning_rate": 2e-07, "loss": 0.036, "step": 160 }, { "clip_ratio/high_max": 0.0021381953338277526, "clip_ratio/high_mean": 0.0009600074699847028, "clip_ratio/low_mean": 0.0011274931894149631, "clip_ratio/low_min": 0.00012667724695347715, "clip_ratio/region_mean": 0.002087500601192005, "epoch": 0.015026629100093917, "grad_norm": 0.12140358239412308, "learning_rate": 2e-07, "loss": 0.0356, "step": 161 }, { "clip_ratio/high_max": 0.0024240844504674897, "clip_ratio/high_mean": 0.0010787419669213705, "clip_ratio/low_mean": 0.0010024136918218574, "clip_ratio/low_min": 3.684022158267908e-05, "clip_ratio/region_mean": 0.002081155624182429, "epoch": 0.015119962200094499, "grad_norm": 0.1216551661491394, "learning_rate": 2e-07, "loss": 0.0194, "step": 162 }, { "clip_ratio/high_max": 0.0021285293623805046, "clip_ratio/high_mean": 0.001008749941320275, "clip_ratio/low_mean": 0.0009402789983141702, "clip_ratio/low_min": 0.00021992080655763857, "clip_ratio/region_mean": 0.0019490289632813074, "epoch": 0.015213295300095082, "grad_norm": 0.11626891046762466, "learning_rate": 2e-07, "loss": 0.0414, "step": 163 }, { "clip_ratio/high_max": 0.002621370651468169, "clip_ratio/high_mean": 0.0010795422658702591, "clip_ratio/low_mean": 0.0009695547432784224, "clip_ratio/low_min": 0.00010124448635906447, "clip_ratio/region_mean": 0.0020490969691309147, "epoch": 0.015306628400095666, "grad_norm": 0.12608931958675385, "learning_rate": 2e-07, "loss": -0.0066, "step": 164 }, { "clip_ratio/high_max": 0.002125522260030266, "clip_ratio/high_mean": 0.0009154718645731919, "clip_ratio/low_mean": 0.0009758792111824732, "clip_ratio/low_min": 9.051103006640915e-05, "clip_ratio/region_mean": 0.0018913510721176863, "epoch": 0.01539996150009625, "grad_norm": 0.12320546805858612, "learning_rate": 2e-07, "loss": 0.0485, "step": 165 }, { "clip_ratio/high_max": 0.002591632422991097, "clip_ratio/high_mean": 0.0011395890251151286, "clip_ratio/low_mean": 0.0009301047139160801, "clip_ratio/low_min": 0.00015941577294142917, "clip_ratio/region_mean": 0.0020696936844615266, "epoch": 0.015493294600096833, "grad_norm": 0.11828868836164474, "learning_rate": 2e-07, "loss": -0.0049, "step": 166 }, { "clip_ratio/high_max": 0.0023275501807802357, "clip_ratio/high_mean": 0.0009904717753670411, "clip_ratio/low_mean": 0.0011094271612819284, "clip_ratio/low_min": 0.00019971528763562674, "clip_ratio/region_mean": 0.0020998989421059377, "epoch": 0.015586627700097416, "grad_norm": 26.616317749023438, "learning_rate": 2e-07, "loss": 0.061, "step": 167 }, { "clip_ratio/high_max": 0.002314448243851075, "clip_ratio/high_mean": 0.0010348311570851365, "clip_ratio/low_mean": 0.001010514792142203, "clip_ratio/low_min": 0.00020920293354720343, "clip_ratio/region_mean": 0.002045345929218456, "epoch": 0.015679960800098, "grad_norm": 0.1182899922132492, "learning_rate": 2e-07, "loss": -0.015, "step": 168 }, { "clip_ratio/high_max": 0.002457881251757499, "clip_ratio/high_mean": 0.0011290573802398285, "clip_ratio/low_mean": 0.0009525034201942617, "clip_ratio/low_min": 0.00021894963902013842, "clip_ratio/region_mean": 0.0020815607931581326, "epoch": 0.015773293900098583, "grad_norm": 0.12637564539909363, "learning_rate": 2e-07, "loss": 0.0121, "step": 169 }, { "clip_ratio/high_max": 0.002503236442862544, "clip_ratio/high_mean": 0.0010618162123137154, "clip_ratio/low_mean": 0.0007971939776325598, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.001859010139014572, "epoch": 0.015866627000099165, "grad_norm": 0.12379348278045654, "learning_rate": 2e-07, "loss": -0.0098, "step": 170 }, { "clip_ratio/high_max": 0.002317321741429623, "clip_ratio/high_mean": 0.0010113195057783742, "clip_ratio/low_mean": 0.0010328230782761239, "clip_ratio/low_min": 0.00014360537443280919, "clip_ratio/region_mean": 0.0020441426313482225, "epoch": 0.01595996010009975, "grad_norm": 0.14188984036445618, "learning_rate": 2e-07, "loss": 0.0372, "step": 171 }, { "clip_ratio/high_max": 0.001951427952008089, "clip_ratio/high_mean": 0.0009279394980694633, "clip_ratio/low_mean": 0.001060795122612035, "clip_ratio/low_min": 0.0001960510862772935, "clip_ratio/region_mean": 0.0019887346352334134, "epoch": 0.016053293200100332, "grad_norm": 0.1133657693862915, "learning_rate": 2e-07, "loss": 0.0343, "step": 172 }, { "clip_ratio/high_max": 0.002071236329356907, "clip_ratio/high_mean": 0.000905365513972356, "clip_ratio/low_mean": 0.0009156375090242364, "clip_ratio/low_min": 0.00011612400248850463, "clip_ratio/region_mean": 0.0018210030102636665, "epoch": 0.016146626300100917, "grad_norm": 0.11113794147968292, "learning_rate": 2e-07, "loss": -0.0031, "step": 173 }, { "clip_ratio/high_max": 0.0023085512439138256, "clip_ratio/high_mean": 0.0009839642880251631, "clip_ratio/low_mean": 0.000998424240606255, "clip_ratio/low_min": 0.00012565961151267402, "clip_ratio/region_mean": 0.0019823884722427465, "epoch": 0.0162399594001015, "grad_norm": 0.11962849646806717, "learning_rate": 2e-07, "loss": 0.0587, "step": 174 }, { "clip_ratio/high_max": 0.0018068092103931122, "clip_ratio/high_mean": 0.0008250220453192014, "clip_ratio/low_mean": 0.001107988635340007, "clip_ratio/low_min": 0.00012506831626524217, "clip_ratio/region_mean": 0.0019330106661072932, "epoch": 0.016333292500102084, "grad_norm": 0.1193937361240387, "learning_rate": 2e-07, "loss": 0.0626, "step": 175 }, { "clip_ratio/high_max": 0.0025243309937650338, "clip_ratio/high_mean": 0.0010203607744188048, "clip_ratio/low_mean": 0.0009396533350809477, "clip_ratio/low_min": 0.0001321702693530824, "clip_ratio/region_mean": 0.001960014153155498, "epoch": 0.016426625600102666, "grad_norm": 0.1215694397687912, "learning_rate": 2e-07, "loss": 0.026, "step": 176 }, { "clip_ratio/high_max": 0.0024269349487440195, "clip_ratio/high_mean": 0.0011048557553294813, "clip_ratio/low_mean": 0.0011205751325178426, "clip_ratio/low_min": 0.0002564700844231993, "clip_ratio/region_mean": 0.0022254309078562073, "epoch": 0.01651995870010325, "grad_norm": 0.12163890898227692, "learning_rate": 2e-07, "loss": -0.0012, "step": 177 }, { "clip_ratio/high_max": 0.0022752477016183548, "clip_ratio/high_mean": 0.0010906550851359498, "clip_ratio/low_mean": 0.0010165875683014747, "clip_ratio/low_min": 7.854106570448494e-05, "clip_ratio/region_mean": 0.0021072426534374245, "epoch": 0.016613291800103833, "grad_norm": 0.12175972014665604, "learning_rate": 2e-07, "loss": 0.0184, "step": 178 }, { "clip_ratio/high_max": 0.0021467865735758096, "clip_ratio/high_mean": 0.0009431789585505612, "clip_ratio/low_mean": 0.0009188300209643785, "clip_ratio/low_min": 9.024345399666345e-05, "clip_ratio/region_mean": 0.0018620089904288761, "epoch": 0.016706624900104418, "grad_norm": 0.12836070358753204, "learning_rate": 2e-07, "loss": 0.015, "step": 179 }, { "clip_ratio/high_max": 0.0024928435959736817, "clip_ratio/high_mean": 0.0010335963088436984, "clip_ratio/low_mean": 0.0010255315428366885, "clip_ratio/low_min": 8.911354143492645e-05, "clip_ratio/region_mean": 0.0020591278153005987, "epoch": 0.016799958000105, "grad_norm": 0.12374837696552277, "learning_rate": 2e-07, "loss": 0.0512, "step": 180 }, { "clip_ratio/high_max": 0.0023851870355429128, "clip_ratio/high_mean": 0.0009113808991969563, "clip_ratio/low_mean": 0.000996776658212184, "clip_ratio/low_min": 0.0001440137775716721, "clip_ratio/region_mean": 0.0019081575228483416, "epoch": 0.016893291100105585, "grad_norm": 0.1123925969004631, "learning_rate": 2e-07, "loss": 0.0162, "step": 181 }, { "clip_ratio/high_max": 0.0022945046875975095, "clip_ratio/high_mean": 0.0010496930699446239, "clip_ratio/low_mean": 0.0008662598120281473, "clip_ratio/low_min": 4.1981134927482344e-05, "clip_ratio/region_mean": 0.001915952940180432, "epoch": 0.016986624200106167, "grad_norm": 0.12222085893154144, "learning_rate": 2e-07, "loss": -0.058, "step": 182 }, { "clip_ratio/high_max": 0.0022298770236375276, "clip_ratio/high_mean": 0.0009727602373459376, "clip_ratio/low_mean": 0.0009580133792042034, "clip_ratio/low_min": 6.394952015398303e-05, "clip_ratio/region_mean": 0.0019307736511109397, "epoch": 0.017079957300106748, "grad_norm": 0.11742282658815384, "learning_rate": 2e-07, "loss": 0.0055, "step": 183 }, { "clip_ratio/high_max": 0.002245485899038613, "clip_ratio/high_mean": 0.0010460002049512696, "clip_ratio/low_mean": 0.0009827064241108019, "clip_ratio/low_min": 5.408273364082561e-05, "clip_ratio/region_mean": 0.0020287066072341986, "epoch": 0.017173290400107333, "grad_norm": 0.12085293233394623, "learning_rate": 2e-07, "loss": 0.0351, "step": 184 }, { "clip_ratio/high_max": 0.0023337375423579942, "clip_ratio/high_mean": 0.0010509970325074391, "clip_ratio/low_mean": 0.0010217202652711421, "clip_ratio/low_min": 0.00017886338719108608, "clip_ratio/region_mean": 0.0020727173032355495, "epoch": 0.017266623500107915, "grad_norm": 0.12703543901443481, "learning_rate": 2e-07, "loss": 0.0327, "step": 185 }, { "clip_ratio/high_max": 0.0024703241360839456, "clip_ratio/high_mean": 0.0008734534421819262, "clip_ratio/low_mean": 0.0010401628678664565, "clip_ratio/low_min": 0.00013215726448834175, "clip_ratio/region_mean": 0.0019136163755320013, "epoch": 0.0173599566001085, "grad_norm": 0.11987452208995819, "learning_rate": 2e-07, "loss": 0.0667, "step": 186 }, { "clip_ratio/high_max": 0.0020327953243395314, "clip_ratio/high_mean": 0.0008904622427508002, "clip_ratio/low_mean": 0.0009205971837218385, "clip_ratio/low_min": 0.00022528671524923993, "clip_ratio/region_mean": 0.001811059410101734, "epoch": 0.017453289700109082, "grad_norm": 0.11871036142110825, "learning_rate": 2e-07, "loss": 0.031, "step": 187 }, { "clip_ratio/high_max": 0.0022935889901418705, "clip_ratio/high_mean": 0.0010236940397589933, "clip_ratio/low_mean": 0.0007941564472275786, "clip_ratio/low_min": 4.008818905276712e-05, "clip_ratio/region_mean": 0.0018178504760726355, "epoch": 0.017546622800109667, "grad_norm": 0.11217762529850006, "learning_rate": 2e-07, "loss": 0.004, "step": 188 }, { "clip_ratio/high_max": 0.0021854220394743606, "clip_ratio/high_mean": 0.000961354582614149, "clip_ratio/low_mean": 0.0010703402767830994, "clip_ratio/low_min": 0.0001440718720004952, "clip_ratio/region_mean": 0.0020316948284744285, "epoch": 0.01763995590011025, "grad_norm": 0.11416805535554886, "learning_rate": 2e-07, "loss": 0.0253, "step": 189 }, { "clip_ratio/high_max": 0.002504703472368419, "clip_ratio/high_mean": 0.0011125294968223898, "clip_ratio/low_mean": 0.0009059971325768856, "clip_ratio/low_min": 0.00011228650600969559, "clip_ratio/region_mean": 0.0020185265748295933, "epoch": 0.017733289000110834, "grad_norm": 0.10930581390857697, "learning_rate": 2e-07, "loss": 0.0109, "step": 190 }, { "clip_ratio/high_max": 0.002368031200603582, "clip_ratio/high_mean": 0.0009744305825734045, "clip_ratio/low_mean": 0.0011222791654290631, "clip_ratio/low_min": 0.0002622912943479605, "clip_ratio/region_mean": 0.0020967097152606584, "epoch": 0.017826622100111416, "grad_norm": 0.11341755092144012, "learning_rate": 2e-07, "loss": 0.0318, "step": 191 }, { "clip_ratio/high_max": 0.0021244492745609023, "clip_ratio/high_mean": 0.0009373769808007637, "clip_ratio/low_mean": 0.0009621774916013237, "clip_ratio/low_min": 0.00020242235223122407, "clip_ratio/region_mean": 0.0018995545251527801, "epoch": 0.017919955200112, "grad_norm": 0.1153130829334259, "learning_rate": 2e-07, "loss": 0.0231, "step": 192 }, { "clip_ratio/high_max": 0.002168262071791105, "clip_ratio/high_mean": 0.0009975659413612448, "clip_ratio/low_mean": 0.0008994193176476983, "clip_ratio/low_min": 8.752061330596916e-05, "clip_ratio/region_mean": 0.0018969852390000597, "epoch": 0.018013288300112583, "grad_norm": 0.10475920885801315, "learning_rate": 2e-07, "loss": 0.0083, "step": 193 }, { "clip_ratio/high_max": 0.002539620894822292, "clip_ratio/high_mean": 0.001091326796085923, "clip_ratio/low_mean": 0.0009693101674201898, "clip_ratio/low_min": 2.9162461487430846e-05, "clip_ratio/region_mean": 0.0020606369580491446, "epoch": 0.018106621400113165, "grad_norm": 0.13054399192333221, "learning_rate": 2e-07, "loss": -0.0372, "step": 194 }, { "clip_ratio/high_max": 0.0020667135031544603, "clip_ratio/high_mean": 0.0009356023474538233, "clip_ratio/low_mean": 0.0009706382006697822, "clip_ratio/low_min": 7.61611308917054e-05, "clip_ratio/region_mean": 0.0019062405262957327, "epoch": 0.01819995450011375, "grad_norm": 0.12089604139328003, "learning_rate": 2e-07, "loss": 0.0481, "step": 195 }, { "clip_ratio/high_max": 0.00249840543983737, "clip_ratio/high_mean": 0.0011213863763259724, "clip_ratio/low_mean": 0.0009371234700665809, "clip_ratio/low_min": 0.00013465874963003444, "clip_ratio/region_mean": 0.0020585098463925533, "epoch": 0.01829328760011433, "grad_norm": 0.11723543703556061, "learning_rate": 2e-07, "loss": -0.0023, "step": 196 }, { "clip_ratio/high_max": 0.002285553127876483, "clip_ratio/high_mean": 0.0010164995819650358, "clip_ratio/low_mean": 0.0008974989505077247, "clip_ratio/low_min": 9.983821018977324e-05, "clip_ratio/region_mean": 0.001913998567033559, "epoch": 0.018386620700114917, "grad_norm": 0.10722363740205765, "learning_rate": 2e-07, "loss": 0.0064, "step": 197 }, { "clip_ratio/high_max": 0.002358752812142484, "clip_ratio/high_mean": 0.0010754599643405527, "clip_ratio/low_mean": 0.0008644656236356241, "clip_ratio/low_min": 0.00010313741677236976, "clip_ratio/region_mean": 0.001939925568876788, "epoch": 0.0184799538001155, "grad_norm": 0.12058883160352707, "learning_rate": 2e-07, "loss": 0.0256, "step": 198 }, { "clip_ratio/high_max": 0.0022769173374399543, "clip_ratio/high_mean": 0.0009310306304541882, "clip_ratio/low_mean": 0.0010359112602600362, "clip_ratio/low_min": 0.00012900576439278666, "clip_ratio/region_mean": 0.0019669418470584787, "epoch": 0.018573286900116084, "grad_norm": 0.11266931891441345, "learning_rate": 2e-07, "loss": 0.0357, "step": 199 }, { "clip_ratio/high_max": 0.0024134731356753036, "clip_ratio/high_mean": 0.001065897067746846, "clip_ratio/low_mean": 0.001018772556562908, "clip_ratio/low_min": 0.00012236155362188583, "clip_ratio/region_mean": 0.002084669627947733, "epoch": 0.018666620000116665, "grad_norm": 0.11524151265621185, "learning_rate": 2e-07, "loss": 0.026, "step": 200 }, { "clip_ratio/high_max": 0.002161034703021869, "clip_ratio/high_mean": 0.0009650331085140351, "clip_ratio/low_mean": 0.0010395104091003304, "clip_ratio/low_min": 0.00010112834752362687, "clip_ratio/region_mean": 0.002004543537623249, "epoch": 0.01875995310011725, "grad_norm": 0.1180180087685585, "learning_rate": 2e-07, "loss": 0.0455, "step": 201 }, { "clip_ratio/high_max": 0.00255183684930671, "clip_ratio/high_mean": 0.0010952425218420103, "clip_ratio/low_mean": 0.00108179212838877, "clip_ratio/low_min": 0.00020108850549149793, "clip_ratio/region_mean": 0.002177034693886526, "epoch": 0.018853286200117832, "grad_norm": 0.11948747932910919, "learning_rate": 2e-07, "loss": -0.0062, "step": 202 }, { "clip_ratio/high_max": 0.002260613200633088, "clip_ratio/high_mean": 0.0009473042173340218, "clip_ratio/low_mean": 0.0010732630307757063, "clip_ratio/low_min": 5.881974175281357e-05, "clip_ratio/region_mean": 0.002020567269937601, "epoch": 0.018946619300118418, "grad_norm": 0.12715503573417664, "learning_rate": 2e-07, "loss": 0.003, "step": 203 }, { "clip_ratio/high_max": 0.002355942371650599, "clip_ratio/high_mean": 0.001142281253123656, "clip_ratio/low_mean": 0.0008978219375421759, "clip_ratio/low_min": 8.514210821886081e-05, "clip_ratio/region_mean": 0.002040103245235514, "epoch": 0.019039952400119, "grad_norm": 0.11864128708839417, "learning_rate": 2e-07, "loss": -0.0015, "step": 204 }, { "clip_ratio/high_max": 0.0021187963138800114, "clip_ratio/high_mean": 0.0010283407500537578, "clip_ratio/low_mean": 0.0008666067442391068, "clip_ratio/low_min": 8.137011809594696e-05, "clip_ratio/region_mean": 0.0018949474906548858, "epoch": 0.019133285500119585, "grad_norm": 0.11928252130746841, "learning_rate": 2e-07, "loss": -0.0255, "step": 205 }, { "clip_ratio/high_max": 0.002110798974172212, "clip_ratio/high_mean": 0.000859755045894417, "clip_ratio/low_mean": 0.0010846321783901658, "clip_ratio/low_min": 0.0001521317917649867, "clip_ratio/region_mean": 0.0019443871569819748, "epoch": 0.019226618600120166, "grad_norm": 0.1112714484333992, "learning_rate": 2e-07, "loss": 0.0495, "step": 206 }, { "clip_ratio/high_max": 0.0022201028041308746, "clip_ratio/high_mean": 0.00093288711286732, "clip_ratio/low_mean": 0.0011367415281711146, "clip_ratio/low_min": 0.00018341206032346236, "clip_ratio/region_mean": 0.0020696286374004558, "epoch": 0.019319951700120748, "grad_norm": 0.1132681742310524, "learning_rate": 2e-07, "loss": 0.073, "step": 207 }, { "clip_ratio/high_max": 0.002229861624073237, "clip_ratio/high_mean": 0.001018268692860147, "clip_ratio/low_mean": 0.001004857349471422, "clip_ratio/low_min": 0.0001362255543426727, "clip_ratio/region_mean": 0.002023126093263272, "epoch": 0.019413284800121333, "grad_norm": 0.1113051176071167, "learning_rate": 2e-07, "loss": 0.0132, "step": 208 }, { "clip_ratio/high_max": 0.002318780247151153, "clip_ratio/high_mean": 0.0010097257709276164, "clip_ratio/low_mean": 0.0008776120557740796, "clip_ratio/low_min": 5.9538079767662566e-05, "clip_ratio/region_mean": 0.0018873378503485583, "epoch": 0.019506617900121915, "grad_norm": 0.10417304188013077, "learning_rate": 2e-07, "loss": 0.016, "step": 209 }, { "clip_ratio/high_max": 0.002996490919031203, "clip_ratio/high_mean": 0.0012716445489786565, "clip_ratio/low_mean": 0.0009494213045400102, "clip_ratio/low_min": 6.743644826201489e-05, "clip_ratio/region_mean": 0.0022210659153643064, "epoch": 0.0195999510001225, "grad_norm": 0.11338069289922714, "learning_rate": 2e-07, "loss": -0.0243, "step": 210 }, { "clip_ratio/high_max": 0.0025774256500881165, "clip_ratio/high_mean": 0.0010369898518547416, "clip_ratio/low_mean": 0.0010244952027278487, "clip_ratio/low_min": 0.00014959456711949315, "clip_ratio/region_mean": 0.0020614850145648234, "epoch": 0.019693284100123082, "grad_norm": 0.12622614204883575, "learning_rate": 2e-07, "loss": -0.0094, "step": 211 }, { "clip_ratio/high_max": 0.0023311748445848934, "clip_ratio/high_mean": 0.0009884692735795397, "clip_ratio/low_mean": 0.0009892283978842897, "clip_ratio/low_min": 5.883603989786934e-05, "clip_ratio/region_mean": 0.00197769766964484, "epoch": 0.019786617200123667, "grad_norm": 0.12311524897813797, "learning_rate": 2e-07, "loss": -0.0059, "step": 212 }, { "clip_ratio/high_max": 0.0025248883321182802, "clip_ratio/high_mean": 0.0009915803930198308, "clip_ratio/low_mean": 0.0011458990193204954, "clip_ratio/low_min": 0.0001764216231094906, "clip_ratio/region_mean": 0.0021374794596340507, "epoch": 0.01987995030012425, "grad_norm": 0.12415769696235657, "learning_rate": 2e-07, "loss": 0.1037, "step": 213 }, { "clip_ratio/high_max": 0.002180897536163684, "clip_ratio/high_mean": 0.0010145774394914042, "clip_ratio/low_mean": 0.000985586979368236, "clip_ratio/low_min": 8.580048870499013e-05, "clip_ratio/region_mean": 0.002000164386117831, "epoch": 0.019973283400124834, "grad_norm": 0.12184584885835648, "learning_rate": 2e-07, "loss": -0.0246, "step": 214 }, { "clip_ratio/high_max": 0.002384544364758767, "clip_ratio/high_mean": 0.0010087002701766323, "clip_ratio/low_mean": 0.0009045074220921379, "clip_ratio/low_min": 0.00017159206254291348, "clip_ratio/region_mean": 0.0019132077359245159, "epoch": 0.020066616500125416, "grad_norm": 0.10947056114673615, "learning_rate": 2e-07, "loss": 0.0258, "step": 215 }, { "clip_ratio/high_max": 0.0020853797541349195, "clip_ratio/high_mean": 0.0010148351957468549, "clip_ratio/low_mean": 0.0009736819411045872, "clip_ratio/low_min": 0.00014323201776278438, "clip_ratio/region_mean": 0.0019885171423084103, "epoch": 0.020159949600126, "grad_norm": 0.12318925559520721, "learning_rate": 2e-07, "loss": 0.0121, "step": 216 }, { "clip_ratio/high_max": 0.0020862270466750488, "clip_ratio/high_mean": 0.0009347709383291658, "clip_ratio/low_mean": 0.0010414562311780173, "clip_ratio/low_min": 9.906464219966438e-05, "clip_ratio/region_mean": 0.001976227154955268, "epoch": 0.020253282700126583, "grad_norm": 0.12481623142957687, "learning_rate": 2e-07, "loss": 0.0214, "step": 217 }, { "clip_ratio/high_max": 0.002196132787503302, "clip_ratio/high_mean": 0.0010729603309300728, "clip_ratio/low_mean": 0.0010633969541231636, "clip_ratio/low_min": 0.00012807946495740907, "clip_ratio/region_mean": 0.002136357310519088, "epoch": 0.020346615800127168, "grad_norm": 0.11990834772586823, "learning_rate": 2e-07, "loss": -0.03, "step": 218 }, { "clip_ratio/high_max": 0.0020590653548424598, "clip_ratio/high_mean": 0.000909521164430771, "clip_ratio/low_mean": 0.0009942918331944384, "clip_ratio/low_min": 0.00014961503893573536, "clip_ratio/region_mean": 0.0019038130121771246, "epoch": 0.02043994890012775, "grad_norm": 0.11991198360919952, "learning_rate": 2e-07, "loss": 0.0575, "step": 219 }, { "clip_ratio/high_max": 0.0027112673415103927, "clip_ratio/high_mean": 0.0012782540179614443, "clip_ratio/low_mean": 0.0009644220663176384, "clip_ratio/low_min": 4.135953895456623e-05, "clip_ratio/region_mean": 0.0022426760915550403, "epoch": 0.02053328200012833, "grad_norm": 0.12295389175415039, "learning_rate": 2e-07, "loss": -0.0266, "step": 220 }, { "clip_ratio/high_max": 0.0021552505713771097, "clip_ratio/high_mean": 0.0010718936937337276, "clip_ratio/low_mean": 0.0010291908329236321, "clip_ratio/low_min": 9.528353848509141e-05, "clip_ratio/region_mean": 0.0021010845885029994, "epoch": 0.020626615100128916, "grad_norm": 0.1294092983007431, "learning_rate": 2e-07, "loss": 0.0231, "step": 221 }, { "clip_ratio/high_max": 0.002308184586581774, "clip_ratio/high_mean": 0.0010044728787761414, "clip_ratio/low_mean": 0.0010992129755322821, "clip_ratio/low_min": 0.00018198173165728804, "clip_ratio/region_mean": 0.0021036858670413494, "epoch": 0.020719948200129498, "grad_norm": 0.12739701569080353, "learning_rate": 2e-07, "loss": 0.0295, "step": 222 }, { "clip_ratio/high_max": 0.002260941699205432, "clip_ratio/high_mean": 0.0009770545566425426, "clip_ratio/low_mean": 0.0009768445033842, "clip_ratio/low_min": 5.354059157980373e-05, "clip_ratio/region_mean": 0.0019538990964065306, "epoch": 0.020813281300130083, "grad_norm": 0.11412958055734634, "learning_rate": 2e-07, "loss": -0.0172, "step": 223 }, { "clip_ratio/high_max": 0.0019823621842078865, "clip_ratio/high_mean": 0.000906308499907027, "clip_ratio/low_mean": 0.001121312248869799, "clip_ratio/low_min": 0.00021074059714010218, "clip_ratio/region_mean": 0.0020276207869756036, "epoch": 0.020906614400130665, "grad_norm": 0.11903505027294159, "learning_rate": 2e-07, "loss": 0.0698, "step": 224 }, { "clip_ratio/high_max": 0.002104424493154511, "clip_ratio/high_mean": 0.0009235612815245986, "clip_ratio/low_mean": 0.00116866276221117, "clip_ratio/low_min": 0.0002979233295263839, "clip_ratio/region_mean": 0.0020922240437357686, "epoch": 0.02099994750013125, "grad_norm": 0.11688167601823807, "learning_rate": 2e-07, "loss": 0.0566, "step": 225 }, { "clip_ratio/high_max": 0.002227864442829741, "clip_ratio/high_mean": 0.0009482075529376743, "clip_ratio/low_mean": 0.0009780536784091964, "clip_ratio/low_min": 0.00012159468224126613, "clip_ratio/region_mean": 0.001926261218613945, "epoch": 0.021093280600131832, "grad_norm": 0.11947978287935257, "learning_rate": 2e-07, "loss": 0.0114, "step": 226 }, { "clip_ratio/high_max": 0.001948991386598209, "clip_ratio/high_mean": 0.0008729245600989088, "clip_ratio/low_mean": 0.0009982839910662733, "clip_ratio/low_min": 0.00015985702430043602, "clip_ratio/region_mean": 0.0018712086020968854, "epoch": 0.021186613700132417, "grad_norm": 0.1249566376209259, "learning_rate": 2e-07, "loss": 0.0195, "step": 227 }, { "clip_ratio/high_max": 0.002049351969617419, "clip_ratio/high_mean": 0.0009398530128237326, "clip_ratio/low_mean": 0.0009291364985983819, "clip_ratio/low_min": 0.00016469120055262465, "clip_ratio/region_mean": 0.001868989536887966, "epoch": 0.021279946800133, "grad_norm": 0.12076229602098465, "learning_rate": 2e-07, "loss": 0.0021, "step": 228 }, { "clip_ratio/high_max": 0.002549138975155074, "clip_ratio/high_mean": 0.001093319930077996, "clip_ratio/low_mean": 0.0011890636524185538, "clip_ratio/low_min": 0.00018018401806330075, "clip_ratio/region_mean": 0.0022823835679446347, "epoch": 0.021373279900133584, "grad_norm": 0.12609221041202545, "learning_rate": 2e-07, "loss": 0.0074, "step": 229 }, { "clip_ratio/high_max": 0.0024281287915073335, "clip_ratio/high_mean": 0.0010586231146589853, "clip_ratio/low_mean": 0.0010031884157797322, "clip_ratio/low_min": 7.778579310979694e-05, "clip_ratio/region_mean": 0.0020618114722310565, "epoch": 0.021466613000134166, "grad_norm": 0.11311987787485123, "learning_rate": 2e-07, "loss": 0.0286, "step": 230 }, { "clip_ratio/high_max": 0.002668012228241423, "clip_ratio/high_mean": 0.0010768062820716295, "clip_ratio/low_mean": 0.00095422606318607, "clip_ratio/low_min": 0.00017068327997549204, "clip_ratio/region_mean": 0.0020310323452576995, "epoch": 0.02155994610013475, "grad_norm": 0.10470303148031235, "learning_rate": 2e-07, "loss": 0.0344, "step": 231 }, { "clip_ratio/high_max": 0.0026121108094230294, "clip_ratio/high_mean": 0.0012060398294124752, "clip_ratio/low_mean": 0.0008945050813053967, "clip_ratio/low_min": 0.00011111664571217261, "clip_ratio/region_mean": 0.0021005449088988826, "epoch": 0.021653279200135333, "grad_norm": 0.11880531162023544, "learning_rate": 2e-07, "loss": -0.0172, "step": 232 }, { "clip_ratio/high_max": 0.002362415885727387, "clip_ratio/high_mean": 0.0010069034724438097, "clip_ratio/low_mean": 0.0010285539829055779, "clip_ratio/low_min": 8.50454007377266e-05, "clip_ratio/region_mean": 0.002035457466263324, "epoch": 0.021746612300135915, "grad_norm": 0.12247668951749802, "learning_rate": 2e-07, "loss": 0.0489, "step": 233 }, { "clip_ratio/high_max": 0.0023830264690332115, "clip_ratio/high_mean": 0.001078729226719588, "clip_ratio/low_mean": 0.0010804843295773026, "clip_ratio/low_min": 0.0002266194478579564, "clip_ratio/region_mean": 0.0021592135890387, "epoch": 0.0218399454001365, "grad_norm": 0.13124889135360718, "learning_rate": 2e-07, "loss": 0.0137, "step": 234 }, { "clip_ratio/high_max": 0.0021872690122108907, "clip_ratio/high_mean": 0.0009655877947807312, "clip_ratio/low_mean": 0.0010845890938071534, "clip_ratio/low_min": 0.00011390192958060652, "clip_ratio/region_mean": 0.0020501769031398, "epoch": 0.02193327850013708, "grad_norm": 0.10769148170948029, "learning_rate": 2e-07, "loss": -0.0009, "step": 235 }, { "clip_ratio/high_max": 0.001958989741979167, "clip_ratio/high_mean": 0.0009361365682707401, "clip_ratio/low_mean": 0.0010283784213243052, "clip_ratio/low_min": 8.252856696344679e-05, "clip_ratio/region_mean": 0.001964514987776056, "epoch": 0.022026611600137667, "grad_norm": 0.11504022032022476, "learning_rate": 2e-07, "loss": 0.0283, "step": 236 }, { "clip_ratio/high_max": 0.002026233749347739, "clip_ratio/high_mean": 0.000888086045961245, "clip_ratio/low_mean": 0.0009965724748326465, "clip_ratio/low_min": 8.903238267521374e-05, "clip_ratio/region_mean": 0.0018846585298888385, "epoch": 0.02211994470013825, "grad_norm": 0.10749346017837524, "learning_rate": 2e-07, "loss": 0.0166, "step": 237 }, { "clip_ratio/high_max": 0.0021355157223297283, "clip_ratio/high_mean": 0.0010645104594004806, "clip_ratio/low_mean": 0.0009944661942427047, "clip_ratio/low_min": 0.00020234614066794165, "clip_ratio/region_mean": 0.002058976620901376, "epoch": 0.022213277800138834, "grad_norm": 0.12324319034814835, "learning_rate": 2e-07, "loss": 0.0431, "step": 238 }, { "clip_ratio/high_max": 0.002177867201680783, "clip_ratio/high_mean": 0.0010424470347061288, "clip_ratio/low_mean": 0.0010108734149980592, "clip_ratio/low_min": 0.00018454927158018108, "clip_ratio/region_mean": 0.002053320436971262, "epoch": 0.022306610900139415, "grad_norm": 0.11169817298650742, "learning_rate": 2e-07, "loss": 0.016, "step": 239 }, { "clip_ratio/high_max": 0.0023789930673956405, "clip_ratio/high_mean": 0.0011294886644463986, "clip_ratio/low_mean": 0.0009677143334556604, "clip_ratio/low_min": 9.699025667941896e-05, "clip_ratio/region_mean": 0.0020972029815311544, "epoch": 0.02239994400014, "grad_norm": 0.11959470808506012, "learning_rate": 2e-07, "loss": 0.0, "step": 240 }, { "clip_ratio/high_max": 0.002397028758423403, "clip_ratio/high_mean": 0.0010248331454931758, "clip_ratio/low_mean": 0.001088363460439723, "clip_ratio/low_min": 0.00013388623847276904, "clip_ratio/region_mean": 0.002113196598656941, "epoch": 0.022493277100140582, "grad_norm": 0.1108279898762703, "learning_rate": 2e-07, "loss": 0.0149, "step": 241 }, { "clip_ratio/high_max": 0.001989764721656684, "clip_ratio/high_mean": 0.0009163568774965825, "clip_ratio/low_mean": 0.0009470721197430976, "clip_ratio/low_min": 0.00012800167314708233, "clip_ratio/region_mean": 0.0018634290172485635, "epoch": 0.022586610200141168, "grad_norm": 0.12124069780111313, "learning_rate": 2e-07, "loss": -0.005, "step": 242 }, { "clip_ratio/high_max": 0.0027479513082653284, "clip_ratio/high_mean": 0.0011125606724817771, "clip_ratio/low_mean": 0.0010082282624352956, "clip_ratio/low_min": 0.00024610083255538484, "clip_ratio/region_mean": 0.002120788958563935, "epoch": 0.02267994330014175, "grad_norm": 0.11768393218517303, "learning_rate": 2e-07, "loss": 0.0113, "step": 243 }, { "clip_ratio/high_max": 0.0024072675259958487, "clip_ratio/high_mean": 0.0009915180708048865, "clip_ratio/low_mean": 0.0009702909665065818, "clip_ratio/low_min": 8.324585360242054e-05, "clip_ratio/region_mean": 0.0019618090373114683, "epoch": 0.022773276400142334, "grad_norm": 0.11799103021621704, "learning_rate": 2e-07, "loss": 0.0291, "step": 244 }, { "clip_ratio/high_max": 0.00252033023207332, "clip_ratio/high_mean": 0.0010702432209654944, "clip_ratio/low_mean": 0.0012276227353140712, "clip_ratio/low_min": 0.0003225256768928375, "clip_ratio/region_mean": 0.002297865961736534, "epoch": 0.022866609500142916, "grad_norm": 0.1246575191617012, "learning_rate": 2e-07, "loss": 0.0635, "step": 245 }, { "clip_ratio/high_max": 0.002625590263050981, "clip_ratio/high_mean": 0.0011020396013918798, "clip_ratio/low_mean": 0.0010348295036237687, "clip_ratio/low_min": 0.00014932721114746528, "clip_ratio/region_mean": 0.0021368691232055426, "epoch": 0.022959942600143498, "grad_norm": 0.11939921975135803, "learning_rate": 2e-07, "loss": 0.0138, "step": 246 }, { "clip_ratio/high_max": 0.0021369988025981, "clip_ratio/high_mean": 0.0009930782362062018, "clip_ratio/low_mean": 0.0010368927923991578, "clip_ratio/low_min": 0.00011952939621551195, "clip_ratio/region_mean": 0.0020299710231483914, "epoch": 0.023053275700144083, "grad_norm": 0.11346429586410522, "learning_rate": 2e-07, "loss": 0.0467, "step": 247 }, { "clip_ratio/high_max": 0.0020814463059650734, "clip_ratio/high_mean": 0.000873228624186595, "clip_ratio/low_mean": 0.0010295795800630003, "clip_ratio/low_min": 8.042676199693233e-05, "clip_ratio/region_mean": 0.0019028082097065635, "epoch": 0.023146608800144665, "grad_norm": 0.12038135528564453, "learning_rate": 2e-07, "loss": 0.0307, "step": 248 }, { "clip_ratio/high_max": 0.002471878658980131, "clip_ratio/high_mean": 0.0010739890167315025, "clip_ratio/low_mean": 0.0010896815911110025, "clip_ratio/low_min": 5.190113733988255e-05, "clip_ratio/region_mean": 0.0021636706151184626, "epoch": 0.02323994190014525, "grad_norm": 0.12679967284202576, "learning_rate": 2e-07, "loss": 0.0373, "step": 249 }, { "clip_ratio/high_max": 0.002430623608233873, "clip_ratio/high_mean": 0.0009568185123498552, "clip_ratio/low_mean": 0.001034767981764162, "clip_ratio/low_min": 0.000112822513528954, "clip_ratio/region_mean": 0.0019915864904760383, "epoch": 0.023333275000145832, "grad_norm": 0.11574284732341766, "learning_rate": 2e-07, "loss": 0.0235, "step": 250 }, { "clip_ratio/high_max": 0.002417161493212916, "clip_ratio/high_mean": 0.0010617392908898182, "clip_ratio/low_mean": 0.0009799253948585829, "clip_ratio/low_min": 0.00013937268704466987, "clip_ratio/region_mean": 0.002041664680291433, "epoch": 0.023426608100146417, "grad_norm": 0.11487965285778046, "learning_rate": 2e-07, "loss": 0.032, "step": 251 }, { "clip_ratio/high_max": 0.00220940746658016, "clip_ratio/high_mean": 0.0009383756332681514, "clip_ratio/low_mean": 0.001127868570620194, "clip_ratio/low_min": 0.00012155586455264711, "clip_ratio/region_mean": 0.0020662442257162184, "epoch": 0.023519941200147, "grad_norm": 0.12255435436964035, "learning_rate": 2e-07, "loss": 0.0385, "step": 252 }, { "clip_ratio/high_max": 0.0021277316700434312, "clip_ratio/high_mean": 0.0010045699546026299, "clip_ratio/low_mean": 0.001201266288262559, "clip_ratio/low_min": 0.00017852746259450214, "clip_ratio/region_mean": 0.0022058362228563055, "epoch": 0.023613274300147584, "grad_norm": 0.11734842509031296, "learning_rate": 2e-07, "loss": 0.0751, "step": 253 }, { "clip_ratio/high_max": 0.002427127430564724, "clip_ratio/high_mean": 0.0011397609996492974, "clip_ratio/low_mean": 0.0010511071159271523, "clip_ratio/low_min": 0.00011756186358979903, "clip_ratio/region_mean": 0.0021908681374043226, "epoch": 0.023706607400148166, "grad_norm": 0.11389374732971191, "learning_rate": 2e-07, "loss": 0.0059, "step": 254 }, { "clip_ratio/high_max": 0.0020314825524110347, "clip_ratio/high_mean": 0.0008615152073616628, "clip_ratio/low_mean": 0.001004976158583304, "clip_ratio/low_min": 0.00012333091308391886, "clip_ratio/region_mean": 0.0018664913950487971, "epoch": 0.02379994050014875, "grad_norm": 0.11143703758716583, "learning_rate": 2e-07, "loss": 0.0462, "step": 255 }, { "clip_ratio/high_max": 0.002511016951757483, "clip_ratio/high_mean": 0.0010335400838812348, "clip_ratio/low_mean": 0.0010774949987535365, "clip_ratio/low_min": 6.183370442158775e-05, "clip_ratio/region_mean": 0.002111035028065089, "epoch": 0.023893273600149333, "grad_norm": 0.12570655345916748, "learning_rate": 2e-07, "loss": 0.0109, "step": 256 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.014386858258928603, "completions/max_length": 4096.0, "completions/max_terminated_length": 4096.0, "completions/mean_length": 609.5548706054688, "completions/mean_terminated_length": 558.6636352539062, "completions/min_length": 2.0, "completions/min_terminated_length": 2.0, "epoch": 0.023986606700149918, "grad_norm": 0.12165375798940659, "learning_rate": 2e-07, "loss": 0.0443, "num_tokens": 243161879.0, "reward": 0.5292707681655884, "reward_std": 0.23620083928108215, "rewards/simpleverify_reward/mean": 0.5292707085609436, "rewards/simpleverify_reward/std": 0.49914470314979553, "step": 257 }, { "clip_ratio/high_max": 0.002164937526686117, "clip_ratio/high_mean": 0.0009221315376635175, "clip_ratio/low_mean": 0.0006166441344248597, "clip_ratio/low_min": 8.29185742077243e-05, "clip_ratio/region_mean": 0.0015387756830023136, "epoch": 0.0240799398001505, "grad_norm": 0.13454820215702057, "learning_rate": 2e-07, "loss": 0.0017, "step": 258 }, { "clip_ratio/high_max": 0.0020151903590885922, "clip_ratio/high_mean": 0.0008842802890285384, "clip_ratio/low_mean": 0.0005605472306342563, "clip_ratio/low_min": 2.7355551537766587e-05, "clip_ratio/region_mean": 0.0014448275105678476, "epoch": 0.02417327290015108, "grad_norm": 0.3837902843952179, "learning_rate": 2e-07, "loss": 0.0373, "step": 259 }, { "clip_ratio/high_max": 0.0017220923546119593, "clip_ratio/high_mean": 0.0007624228328495519, "clip_ratio/low_mean": 0.0005955116012046346, "clip_ratio/low_min": 1.252254060091218e-05, "clip_ratio/region_mean": 0.0013579344486061018, "epoch": 0.024266606000151666, "grad_norm": 0.12554658949375153, "learning_rate": 2e-07, "loss": 0.0272, "step": 260 }, { "clip_ratio/high_max": 0.002161966163839679, "clip_ratio/high_mean": 0.0009266916276828852, "clip_ratio/low_mean": 0.0005994087405269966, "clip_ratio/low_min": 1.8312335669179447e-05, "clip_ratio/region_mean": 0.0015261003936757334, "epoch": 0.024359939100152248, "grad_norm": 0.11657988280057907, "learning_rate": 2e-07, "loss": 0.0155, "step": 261 }, { "clip_ratio/high_max": 0.0025087115427595563, "clip_ratio/high_mean": 0.0010005763706431026, "clip_ratio/low_mean": 0.0006305902879830683, "clip_ratio/low_min": 0.0001003253782982938, "clip_ratio/region_mean": 0.0016311666804540437, "epoch": 0.024453272200152833, "grad_norm": 0.12980857491493225, "learning_rate": 2e-07, "loss": -0.0267, "step": 262 }, { "clip_ratio/high_max": 0.002232325787190348, "clip_ratio/high_mean": 0.0009656262500357116, "clip_ratio/low_mean": 0.0006854519324406283, "clip_ratio/low_min": 6.55142248433549e-05, "clip_ratio/region_mean": 0.0016510781752003822, "epoch": 0.024546605300153415, "grad_norm": 0.13097405433654785, "learning_rate": 2e-07, "loss": -0.0248, "step": 263 }, { "clip_ratio/high_max": 0.002277901046909392, "clip_ratio/high_mean": 0.0010229253348370548, "clip_ratio/low_mean": 0.0006064817735023098, "clip_ratio/low_min": 2.9806811653543264e-05, "clip_ratio/region_mean": 0.0016294070883304812, "epoch": 0.024639938400154, "grad_norm": 0.12044909596443176, "learning_rate": 2e-07, "loss": -0.041, "step": 264 }, { "clip_ratio/high_max": 0.0021654551273968536, "clip_ratio/high_mean": 0.000967479711107444, "clip_ratio/low_mean": 0.0006782053933420684, "clip_ratio/low_min": 3.96443911085953e-05, "clip_ratio/region_mean": 0.001645685093535576, "epoch": 0.024733271500154582, "grad_norm": 0.12100070714950562, "learning_rate": 2e-07, "loss": 0.0588, "step": 265 }, { "clip_ratio/high_max": 0.001978774511371739, "clip_ratio/high_mean": 0.0009470828972553136, "clip_ratio/low_mean": 0.0007585859038954368, "clip_ratio/low_min": 8.825229087960906e-05, "clip_ratio/region_mean": 0.0017056688702723477, "epoch": 0.024826604600155167, "grad_norm": 0.125342458486557, "learning_rate": 2e-07, "loss": 0.0604, "step": 266 }, { "clip_ratio/high_max": 0.0019497438916005194, "clip_ratio/high_mean": 0.0008667253987368895, "clip_ratio/low_mean": 0.0007486851518478943, "clip_ratio/low_min": 9.622676134313224e-05, "clip_ratio/region_mean": 0.0016154105760506354, "epoch": 0.02491993770015575, "grad_norm": 0.12119797617197037, "learning_rate": 2e-07, "loss": 0.0566, "step": 267 }, { "clip_ratio/high_max": 0.0020604364181053825, "clip_ratio/high_mean": 0.0008952821808634326, "clip_ratio/low_mean": 0.0007573141538159689, "clip_ratio/low_min": 1.883664845081512e-05, "clip_ratio/region_mean": 0.0016525963801541366, "epoch": 0.025013270800156334, "grad_norm": 0.12163382023572922, "learning_rate": 2e-07, "loss": 0.0417, "step": 268 }, { "clip_ratio/high_max": 0.0022574229442398064, "clip_ratio/high_mean": 0.0009778068233572412, "clip_ratio/low_mean": 0.0008181967023119796, "clip_ratio/low_min": 7.309659031307092e-05, "clip_ratio/region_mean": 0.0017960035547730513, "epoch": 0.025106603900156916, "grad_norm": 0.11943285167217255, "learning_rate": 2e-07, "loss": 0.0055, "step": 269 }, { "clip_ratio/high_max": 0.0023436872143065557, "clip_ratio/high_mean": 0.0009404737938893959, "clip_ratio/low_mean": 0.000776779803345562, "clip_ratio/low_min": 0.00012098028037144104, "clip_ratio/region_mean": 0.001717253566312138, "epoch": 0.0251999370001575, "grad_norm": 0.12395653128623962, "learning_rate": 2e-07, "loss": 0.0014, "step": 270 }, { "clip_ratio/high_max": 0.0019441905824351124, "clip_ratio/high_mean": 0.0008890898661775282, "clip_ratio/low_mean": 0.0006772554388589924, "clip_ratio/low_min": 4.036024256492965e-05, "clip_ratio/region_mean": 0.0015663453050365206, "epoch": 0.025293270100158083, "grad_norm": 0.11219640076160431, "learning_rate": 2e-07, "loss": 0.0129, "step": 271 }, { "clip_ratio/high_max": 0.002455558074871078, "clip_ratio/high_mean": 0.0009394696116942214, "clip_ratio/low_mean": 0.0007969653579493752, "clip_ratio/low_min": 7.751016892143525e-05, "clip_ratio/region_mean": 0.001736434940539766, "epoch": 0.025386603200158665, "grad_norm": 0.11326699703931808, "learning_rate": 2e-07, "loss": 0.0364, "step": 272 }, { "clip_ratio/high_max": 0.002192847663536668, "clip_ratio/high_mean": 0.0010489930864423513, "clip_ratio/low_mean": 0.000755985753130517, "clip_ratio/low_min": 4.09064746236254e-05, "clip_ratio/region_mean": 0.0018049788486678153, "epoch": 0.02547993630015925, "grad_norm": 0.12172611802816391, "learning_rate": 2e-07, "loss": -0.0079, "step": 273 }, { "clip_ratio/high_max": 0.002188600479712477, "clip_ratio/high_mean": 0.0010594942796160467, "clip_ratio/low_mean": 0.0008400919432460796, "clip_ratio/low_min": 8.138159137160983e-05, "clip_ratio/region_mean": 0.0018995862119481899, "epoch": 0.02557326940015983, "grad_norm": 0.11077050119638443, "learning_rate": 2e-07, "loss": 0.0294, "step": 274 }, { "clip_ratio/high_max": 0.002360926053370349, "clip_ratio/high_mean": 0.0009811717236516415, "clip_ratio/low_mean": 0.0007800768962624716, "clip_ratio/low_min": 9.138147561316146e-05, "clip_ratio/region_mean": 0.0017612486408324912, "epoch": 0.025666602500160417, "grad_norm": 0.12436690181493759, "learning_rate": 2e-07, "loss": -0.0077, "step": 275 }, { "clip_ratio/high_max": 0.0020885259145870805, "clip_ratio/high_mean": 0.0010256047353323083, "clip_ratio/low_mean": 0.0007699046036577784, "clip_ratio/low_min": 0.00010014122335633147, "clip_ratio/region_mean": 0.0017955093644559383, "epoch": 0.025759935600161, "grad_norm": 0.1603475958108902, "learning_rate": 2e-07, "loss": -0.015, "step": 276 }, { "clip_ratio/high_max": 0.0025062743297894485, "clip_ratio/high_mean": 0.00100085877784295, "clip_ratio/low_mean": 0.0008639496445539407, "clip_ratio/low_min": 4.556383692033705e-05, "clip_ratio/region_mean": 0.0018648084442247637, "epoch": 0.025853268700161584, "grad_norm": 1.4605671167373657, "learning_rate": 2e-07, "loss": 0.0437, "step": 277 }, { "clip_ratio/high_max": 0.0023231007980939467, "clip_ratio/high_mean": 0.0010188669421040686, "clip_ratio/low_mean": 0.0008580658031860366, "clip_ratio/low_min": 0.00012508647841968923, "clip_ratio/region_mean": 0.0018769327652989887, "epoch": 0.025946601800162165, "grad_norm": 0.10945040732622147, "learning_rate": 2e-07, "loss": 0.0215, "step": 278 }, { "clip_ratio/high_max": 0.0020257338110241108, "clip_ratio/high_mean": 0.0008828582576825283, "clip_ratio/low_mean": 0.0008513730481354287, "clip_ratio/low_min": 0.00015755996264488203, "clip_ratio/region_mean": 0.0017342313003609888, "epoch": 0.02603993490016275, "grad_norm": 0.11126052588224411, "learning_rate": 2e-07, "loss": 0.0294, "step": 279 }, { "clip_ratio/high_max": 0.0020004422913189046, "clip_ratio/high_mean": 0.0008619764757895609, "clip_ratio/low_mean": 0.0009805456393223722, "clip_ratio/low_min": 9.269251222576713e-05, "clip_ratio/region_mean": 0.0018425221205689013, "epoch": 0.026133268000163332, "grad_norm": 0.12135310471057892, "learning_rate": 2e-07, "loss": 0.0277, "step": 280 }, { "clip_ratio/high_max": 0.002389052384387469, "clip_ratio/high_mean": 0.0010145772866962943, "clip_ratio/low_mean": 0.0009208536193909822, "clip_ratio/low_min": 0.00014947042654966936, "clip_ratio/region_mean": 0.0019354309188202024, "epoch": 0.026226601100163918, "grad_norm": 0.11440776288509369, "learning_rate": 2e-07, "loss": 0.0296, "step": 281 }, { "clip_ratio/high_max": 0.0021573334306594916, "clip_ratio/high_mean": 0.0008927443705033511, "clip_ratio/low_mean": 0.0009066752113540133, "clip_ratio/low_min": 8.437047745246673e-05, "clip_ratio/region_mean": 0.0017994195804931223, "epoch": 0.0263199342001645, "grad_norm": 0.11105756461620331, "learning_rate": 2e-07, "loss": 0.02, "step": 282 }, { "clip_ratio/high_max": 0.002387195097981021, "clip_ratio/high_mean": 0.0011055121667595813, "clip_ratio/low_mean": 0.0008902392237359891, "clip_ratio/low_min": 0.00019250412242399761, "clip_ratio/region_mean": 0.001995751379581634, "epoch": 0.026413267300165084, "grad_norm": 0.11866801232099533, "learning_rate": 2e-07, "loss": 0.037, "step": 283 }, { "clip_ratio/high_max": 0.002681473779375665, "clip_ratio/high_mean": 0.0011479227541713044, "clip_ratio/low_mean": 0.0009496065922576236, "clip_ratio/low_min": 0.00016694488112989347, "clip_ratio/region_mean": 0.002097529373713769, "epoch": 0.026506600400165666, "grad_norm": 0.12550069391727448, "learning_rate": 2e-07, "loss": 0.0214, "step": 284 }, { "clip_ratio/high_max": 0.002073765434033703, "clip_ratio/high_mean": 0.0008759493721299805, "clip_ratio/low_mean": 0.0009056493881871575, "clip_ratio/low_min": 0.00011013327548425877, "clip_ratio/region_mean": 0.0017815987666836008, "epoch": 0.026599933500166248, "grad_norm": 0.1108904480934143, "learning_rate": 2e-07, "loss": 0.0198, "step": 285 }, { "clip_ratio/high_max": 0.0020347713652881794, "clip_ratio/high_mean": 0.0009509722749498906, "clip_ratio/low_mean": 0.0008639666739327367, "clip_ratio/low_min": 3.6063363950233907e-05, "clip_ratio/region_mean": 0.0018149389325117227, "epoch": 0.026693266600166833, "grad_norm": 0.10219817608594894, "learning_rate": 2e-07, "loss": -0.0002, "step": 286 }, { "clip_ratio/high_max": 0.002298510749824345, "clip_ratio/high_mean": 0.0010776368108054157, "clip_ratio/low_mean": 0.0008991812610474881, "clip_ratio/low_min": 6.9262033321138e-05, "clip_ratio/region_mean": 0.001976818086404819, "epoch": 0.026786599700167415, "grad_norm": 0.11889860779047012, "learning_rate": 2e-07, "loss": 0.0306, "step": 287 }, { "clip_ratio/high_max": 0.0024199527979362756, "clip_ratio/high_mean": 0.0011237696526222862, "clip_ratio/low_mean": 0.0008424203078902792, "clip_ratio/low_min": 0.00012806228005501907, "clip_ratio/region_mean": 0.00196619000780629, "epoch": 0.026879932800168, "grad_norm": 0.12839743494987488, "learning_rate": 2e-07, "loss": -0.0435, "step": 288 }, { "clip_ratio/high_max": 0.00206505744063179, "clip_ratio/high_mean": 0.0008867223114066292, "clip_ratio/low_mean": 0.0009486557173659094, "clip_ratio/low_min": 7.199846368166618e-05, "clip_ratio/region_mean": 0.0018353781051700935, "epoch": 0.026973265900168582, "grad_norm": 0.13084933161735535, "learning_rate": 2e-07, "loss": -0.0236, "step": 289 }, { "clip_ratio/high_max": 0.001890574516437482, "clip_ratio/high_mean": 0.0009124967236857628, "clip_ratio/low_mean": 0.0009347159684693906, "clip_ratio/low_min": 0.00010004963951359969, "clip_ratio/region_mean": 0.0018472127412678674, "epoch": 0.027066599000169167, "grad_norm": 0.12404333055019379, "learning_rate": 2e-07, "loss": 0.0297, "step": 290 }, { "clip_ratio/high_max": 0.0018461411309544928, "clip_ratio/high_mean": 0.0008956645106081851, "clip_ratio/low_mean": 0.0009861597063718364, "clip_ratio/low_min": 0.00011762832309614168, "clip_ratio/region_mean": 0.0018818242097040638, "epoch": 0.02715993210016975, "grad_norm": 0.11666793376207352, "learning_rate": 2e-07, "loss": 0.0706, "step": 291 }, { "clip_ratio/high_max": 0.0020534715586109087, "clip_ratio/high_mean": 0.0009780338186828885, "clip_ratio/low_mean": 0.0009297630404034862, "clip_ratio/low_min": 0.00020504675194388255, "clip_ratio/region_mean": 0.0019077968609053642, "epoch": 0.027253265200170334, "grad_norm": 0.12766212224960327, "learning_rate": 2e-07, "loss": 0.0581, "step": 292 }, { "clip_ratio/high_max": 0.002441357202769723, "clip_ratio/high_mean": 0.0010469158351043006, "clip_ratio/low_mean": 0.0010778832474898081, "clip_ratio/low_min": 0.00018211327778772102, "clip_ratio/region_mean": 0.002124799088051077, "epoch": 0.027346598300170916, "grad_norm": 0.12381277233362198, "learning_rate": 2e-07, "loss": 0.0278, "step": 293 }, { "clip_ratio/high_max": 0.002451977190503385, "clip_ratio/high_mean": 0.001059636560967192, "clip_ratio/low_mean": 0.0008268145720649045, "clip_ratio/low_min": 7.450916928064544e-05, "clip_ratio/region_mean": 0.001886451107566245, "epoch": 0.0274399314001715, "grad_norm": 0.12609133124351501, "learning_rate": 2e-07, "loss": 0.0104, "step": 294 }, { "clip_ratio/high_max": 0.0022005365099175833, "clip_ratio/high_mean": 0.0009152151433227118, "clip_ratio/low_mean": 0.0007883116541052004, "clip_ratio/low_min": 3.33272755597136e-05, "clip_ratio/region_mean": 0.0017035267956089228, "epoch": 0.027533264500172083, "grad_norm": 0.11083073168992996, "learning_rate": 2e-07, "loss": 0.0011, "step": 295 }, { "clip_ratio/high_max": 0.0019503028452163562, "clip_ratio/high_mean": 0.0008402257390116574, "clip_ratio/low_mean": 0.0009891724148474168, "clip_ratio/low_min": 8.956734109233366e-05, "clip_ratio/region_mean": 0.0018293981920578517, "epoch": 0.027626597600172668, "grad_norm": 0.11930733919143677, "learning_rate": 2e-07, "loss": 0.0548, "step": 296 }, { "clip_ratio/high_max": 0.0021221788992988877, "clip_ratio/high_mean": 0.0008193312642106321, "clip_ratio/low_mean": 0.0009014827519422397, "clip_ratio/low_min": 0.00016800149342088844, "clip_ratio/region_mean": 0.0017208140707225539, "epoch": 0.02771993070017325, "grad_norm": 0.11643857508897781, "learning_rate": 2e-07, "loss": 0.0288, "step": 297 }, { "clip_ratio/high_max": 0.002176887632231228, "clip_ratio/high_mean": 0.0010341411361878272, "clip_ratio/low_mean": 0.0007963407770148478, "clip_ratio/low_min": 0.00010874304189201212, "clip_ratio/region_mean": 0.0018304818368051201, "epoch": 0.02781326380017383, "grad_norm": 0.11364585161209106, "learning_rate": 2e-07, "loss": -0.0177, "step": 298 }, { "clip_ratio/high_max": 0.0024108603211061563, "clip_ratio/high_mean": 0.0009683823518571444, "clip_ratio/low_mean": 0.0009297294382122345, "clip_ratio/low_min": 5.4730689043935854e-05, "clip_ratio/region_mean": 0.0018981118046212941, "epoch": 0.027906596900174416, "grad_norm": 0.11870751529932022, "learning_rate": 2e-07, "loss": 0.0071, "step": 299 }, { "clip_ratio/high_max": 0.0020918308218824677, "clip_ratio/high_mean": 0.0009506221031188034, "clip_ratio/low_mean": 0.0008350742300535785, "clip_ratio/low_min": 9.740659606904956e-05, "clip_ratio/region_mean": 0.0017856963240774348, "epoch": 0.027999930000174998, "grad_norm": 0.10309873521327972, "learning_rate": 2e-07, "loss": 0.0379, "step": 300 }, { "clip_ratio/high_max": 0.002321016727364622, "clip_ratio/high_mean": 0.0009164779494312825, "clip_ratio/low_mean": 0.0008440316132691805, "clip_ratio/low_min": 0.00013976338505017338, "clip_ratio/region_mean": 0.0017605095636099577, "epoch": 0.028093263100175583, "grad_norm": 0.1211768090724945, "learning_rate": 2e-07, "loss": 0.027, "step": 301 }, { "clip_ratio/high_max": 0.0021033888006058987, "clip_ratio/high_mean": 0.0009711488601169549, "clip_ratio/low_mean": 0.001001995744445594, "clip_ratio/low_min": 6.213934648258146e-05, "clip_ratio/region_mean": 0.001973144622752443, "epoch": 0.028186596200176165, "grad_norm": 0.13179805874824524, "learning_rate": 2e-07, "loss": 0.0652, "step": 302 }, { "clip_ratio/high_max": 0.002152578792447457, "clip_ratio/high_mean": 0.0009595325846021296, "clip_ratio/low_mean": 0.0009027436717587989, "clip_ratio/low_min": 6.604561986023327e-05, "clip_ratio/region_mean": 0.001862276199972257, "epoch": 0.02827992930017675, "grad_norm": 0.11733128130435944, "learning_rate": 2e-07, "loss": 0.0242, "step": 303 }, { "clip_ratio/high_max": 0.0024228912152466364, "clip_ratio/high_mean": 0.0009838691075856332, "clip_ratio/low_mean": 0.0008501051197526976, "clip_ratio/low_min": 1.4880952221574262e-05, "clip_ratio/region_mean": 0.0018339742746320553, "epoch": 0.028373262400177332, "grad_norm": 0.1206582561135292, "learning_rate": 2e-07, "loss": -0.0091, "step": 304 }, { "clip_ratio/high_max": 0.0022641316245426424, "clip_ratio/high_mean": 0.0009714315056044143, "clip_ratio/low_mean": 0.0007846896023693262, "clip_ratio/low_min": 0.00010326781193725765, "clip_ratio/region_mean": 0.0017561211134307086, "epoch": 0.028466595500177917, "grad_norm": 0.11145830154418945, "learning_rate": 2e-07, "loss": 0.012, "step": 305 }, { "clip_ratio/high_max": 0.002683011807675939, "clip_ratio/high_mean": 0.0011586245673242956, "clip_ratio/low_mean": 0.0008448558946838602, "clip_ratio/low_min": 5.505580884346273e-05, "clip_ratio/region_mean": 0.002003480440180283, "epoch": 0.0285599286001785, "grad_norm": 0.115868479013443, "learning_rate": 2e-07, "loss": -0.0353, "step": 306 }, { "clip_ratio/high_max": 0.002269501612317981, "clip_ratio/high_mean": 0.0009382805055793142, "clip_ratio/low_mean": 0.0009641588367230725, "clip_ratio/low_min": 0.00015587984398734989, "clip_ratio/region_mean": 0.0019024393404833972, "epoch": 0.028653261700179084, "grad_norm": 0.11247304081916809, "learning_rate": 2e-07, "loss": 0.0495, "step": 307 }, { "clip_ratio/high_max": 0.0021154528949409723, "clip_ratio/high_mean": 0.0009375951904075919, "clip_ratio/low_mean": 0.000934220508497674, "clip_ratio/low_min": 7.013199228822486e-05, "clip_ratio/region_mean": 0.0018718157298280858, "epoch": 0.028746594800179666, "grad_norm": 0.1204587072134018, "learning_rate": 2e-07, "loss": 0.0165, "step": 308 }, { "clip_ratio/high_max": 0.0027527318634383846, "clip_ratio/high_mean": 0.001028481156026828, "clip_ratio/low_mean": 0.0009865338579402305, "clip_ratio/low_min": 8.550395159545587e-05, "clip_ratio/region_mean": 0.0020150150448898785, "epoch": 0.02883992790018025, "grad_norm": 0.1246158629655838, "learning_rate": 2e-07, "loss": 0.0161, "step": 309 }, { "clip_ratio/high_max": 0.0021824009563715663, "clip_ratio/high_mean": 0.000937502421948011, "clip_ratio/low_mean": 0.0008035470018512569, "clip_ratio/low_min": 9.195720667776186e-05, "clip_ratio/region_mean": 0.0017410494474461302, "epoch": 0.028933261000180833, "grad_norm": 0.10335766524076462, "learning_rate": 2e-07, "loss": 0.0052, "step": 310 }, { "clip_ratio/high_max": 0.0019906581583200023, "clip_ratio/high_mean": 0.0008757097493798938, "clip_ratio/low_mean": 0.0010095166107930709, "clip_ratio/low_min": 8.585615159972804e-05, "clip_ratio/region_mean": 0.001885226352897007, "epoch": 0.029026594100181415, "grad_norm": 0.1161288470029831, "learning_rate": 2e-07, "loss": 0.0368, "step": 311 }, { "clip_ratio/high_max": 0.0023287877775146626, "clip_ratio/high_mean": 0.0009187250634568045, "clip_ratio/low_mean": 0.0009033200003614184, "clip_ratio/low_min": 8.034261099965079e-05, "clip_ratio/region_mean": 0.0018220450729131699, "epoch": 0.029119927200182, "grad_norm": 0.11232461780309677, "learning_rate": 2e-07, "loss": 0.0322, "step": 312 }, { "clip_ratio/high_max": 0.0021705131584894843, "clip_ratio/high_mean": 0.0010051166464108974, "clip_ratio/low_mean": 0.0009737189320730977, "clip_ratio/low_min": 6.614569610974286e-05, "clip_ratio/region_mean": 0.0019788355493801646, "epoch": 0.02921326030018258, "grad_norm": 0.12707826495170593, "learning_rate": 2e-07, "loss": -0.0135, "step": 313 }, { "clip_ratio/high_max": 0.002440060743538197, "clip_ratio/high_mean": 0.001016465790598886, "clip_ratio/low_mean": 0.0009140253860095982, "clip_ratio/low_min": 0.00010067885978060076, "clip_ratio/region_mean": 0.0019304911475046538, "epoch": 0.029306593400183167, "grad_norm": 0.6227886080741882, "learning_rate": 2e-07, "loss": -0.0025, "step": 314 }, { "clip_ratio/high_max": 0.0021325663619791158, "clip_ratio/high_mean": 0.0009158251796179684, "clip_ratio/low_mean": 0.0010372724718763493, "clip_ratio/low_min": 0.00019047625391976908, "clip_ratio/region_mean": 0.0019530976205714978, "epoch": 0.02939992650018375, "grad_norm": 0.11513081192970276, "learning_rate": 2e-07, "loss": 0.0481, "step": 315 }, { "clip_ratio/high_max": 0.00207363756999257, "clip_ratio/high_mean": 0.0008522590924258111, "clip_ratio/low_mean": 0.0009451399910176406, "clip_ratio/low_min": 8.020322275115177e-05, "clip_ratio/region_mean": 0.0017973991270991974, "epoch": 0.029493259600184334, "grad_norm": 0.12545005977153778, "learning_rate": 2e-07, "loss": 0.0128, "step": 316 }, { "clip_ratio/high_max": 0.002666181608219631, "clip_ratio/high_mean": 0.0011388375751266722, "clip_ratio/low_mean": 0.0009147858509095386, "clip_ratio/low_min": 4.1807001252891496e-05, "clip_ratio/region_mean": 0.0020536234442261048, "epoch": 0.029586592700184915, "grad_norm": 0.12078186124563217, "learning_rate": 2e-07, "loss": -0.0352, "step": 317 }, { "clip_ratio/high_max": 0.0019574982034100685, "clip_ratio/high_mean": 0.0008096033689071191, "clip_ratio/low_mean": 0.0009732106063893298, "clip_ratio/low_min": 0.00010755479070212459, "clip_ratio/region_mean": 0.0017828139134508092, "epoch": 0.0296799258001855, "grad_norm": 0.1106266975402832, "learning_rate": 2e-07, "loss": 0.0786, "step": 318 }, { "clip_ratio/high_max": 0.0022643398624495603, "clip_ratio/high_mean": 0.0009600351531844353, "clip_ratio/low_mean": 0.000981686305749463, "clip_ratio/low_min": 0.00011713834464899264, "clip_ratio/region_mean": 0.0019417214280110784, "epoch": 0.029773258900186082, "grad_norm": 0.11714010685682297, "learning_rate": 2e-07, "loss": 0.0492, "step": 319 }, { "clip_ratio/high_max": 0.001967811695067212, "clip_ratio/high_mean": 0.0008946573234425159, "clip_ratio/low_mean": 0.0008470306311210152, "clip_ratio/low_min": 5.4232888942351565e-05, "clip_ratio/region_mean": 0.0017416879563825205, "epoch": 0.029866592000186667, "grad_norm": 0.10652794688940048, "learning_rate": 2e-07, "loss": -0.0059, "step": 320 }, { "clip_ratio/high_max": 0.00256614633690333, "clip_ratio/high_mean": 0.0011383980745449662, "clip_ratio/low_mean": 0.0010102205742441583, "clip_ratio/low_min": 0.00011374871519365115, "clip_ratio/region_mean": 0.0021486186524271034, "epoch": 0.02995992510018725, "grad_norm": 0.13538402318954468, "learning_rate": 2e-07, "loss": 0.0063, "step": 321 }, { "clip_ratio/high_max": 0.0023314668142120354, "clip_ratio/high_mean": 0.0010597625841910485, "clip_ratio/low_mean": 0.0009980678896681638, "clip_ratio/low_min": 3.430909964663442e-05, "clip_ratio/region_mean": 0.0020578304611262865, "epoch": 0.030053258200187834, "grad_norm": 0.12654583156108856, "learning_rate": 2e-07, "loss": -0.0071, "step": 322 }, { "clip_ratio/high_max": 0.002808672630635556, "clip_ratio/high_mean": 0.0010987423593178391, "clip_ratio/low_mean": 0.0009043465688591823, "clip_ratio/low_min": 6.213408869371051e-05, "clip_ratio/region_mean": 0.0020030889281770214, "epoch": 0.030146591300188416, "grad_norm": 0.11694788932800293, "learning_rate": 2e-07, "loss": 0.0065, "step": 323 }, { "clip_ratio/high_max": 0.0023038351791910827, "clip_ratio/high_mean": 0.0009616794886824209, "clip_ratio/low_mean": 0.0009897258896671701, "clip_ratio/low_min": 0.00013127831789461197, "clip_ratio/region_mean": 0.001951405341969803, "epoch": 0.030239924400188998, "grad_norm": 0.11417174339294434, "learning_rate": 2e-07, "loss": 0.0469, "step": 324 }, { "clip_ratio/high_max": 0.0021999500058882404, "clip_ratio/high_mean": 0.0010025789397332119, "clip_ratio/low_mean": 0.0010728575234679738, "clip_ratio/low_min": 0.00010481150638952386, "clip_ratio/region_mean": 0.0020754364304593764, "epoch": 0.030333257500189583, "grad_norm": 0.11446146667003632, "learning_rate": 2e-07, "loss": 0.0346, "step": 325 }, { "clip_ratio/high_max": 0.0020088704768568277, "clip_ratio/high_mean": 0.0008960323721112218, "clip_ratio/low_mean": 0.000856843826113618, "clip_ratio/low_min": 7.65571621741401e-05, "clip_ratio/region_mean": 0.0017528761745779775, "epoch": 0.030426590600190165, "grad_norm": 0.11797110736370087, "learning_rate": 2e-07, "loss": 0.016, "step": 326 }, { "clip_ratio/high_max": 0.002201708633947419, "clip_ratio/high_mean": 0.0009216107891916181, "clip_ratio/low_mean": 0.0010378098413639236, "clip_ratio/low_min": 0.00013835148092766758, "clip_ratio/region_mean": 0.0019594206314650364, "epoch": 0.03051992370019075, "grad_norm": 0.12176623195409775, "learning_rate": 2e-07, "loss": 0.0306, "step": 327 }, { "clip_ratio/high_max": 0.002096448999509448, "clip_ratio/high_mean": 0.0008340022545780812, "clip_ratio/low_mean": 0.001091078946046764, "clip_ratio/low_min": 0.00015115215774130775, "clip_ratio/region_mean": 0.0019250812074460555, "epoch": 0.030613256800191332, "grad_norm": 0.11736004799604416, "learning_rate": 2e-07, "loss": 0.066, "step": 328 }, { "clip_ratio/high_max": 0.002302198365214281, "clip_ratio/high_mean": 0.0010027742573583964, "clip_ratio/low_mean": 0.0010144725874852156, "clip_ratio/low_min": 7.721492875134572e-05, "clip_ratio/region_mean": 0.0020172468430246226, "epoch": 0.030706589900191917, "grad_norm": 0.12399604171514511, "learning_rate": 2e-07, "loss": 0.0248, "step": 329 }, { "clip_ratio/high_max": 0.002396772659267299, "clip_ratio/high_mean": 0.0009556856530252844, "clip_ratio/low_mean": 0.0008992257135105319, "clip_ratio/low_min": 7.118371559045045e-05, "clip_ratio/region_mean": 0.001854911373811774, "epoch": 0.0307999230001925, "grad_norm": 0.11492188274860382, "learning_rate": 2e-07, "loss": 0.022, "step": 330 }, { "clip_ratio/high_max": 0.002186256861023139, "clip_ratio/high_mean": 0.0010335826573282247, "clip_ratio/low_mean": 0.0009764205569808837, "clip_ratio/low_min": 7.363861459452892e-05, "clip_ratio/region_mean": 0.0020100032415939495, "epoch": 0.030893256100193084, "grad_norm": 0.11338464915752411, "learning_rate": 2e-07, "loss": 0.0084, "step": 331 }, { "clip_ratio/high_max": 0.0023477216745959595, "clip_ratio/high_mean": 0.0009716838794702198, "clip_ratio/low_mean": 0.0010526366422709543, "clip_ratio/low_min": 0.00018729975454334635, "clip_ratio/region_mean": 0.0020243205144652165, "epoch": 0.030986589200193666, "grad_norm": 0.12447676807641983, "learning_rate": 2e-07, "loss": 0.0335, "step": 332 }, { "clip_ratio/high_max": 0.002680094348761486, "clip_ratio/high_mean": 0.0011621655285125598, "clip_ratio/low_mean": 0.0009916857379721478, "clip_ratio/low_min": 0.00011189456654392416, "clip_ratio/region_mean": 0.002153851295588538, "epoch": 0.03107992230019425, "grad_norm": 0.1169513612985611, "learning_rate": 2e-07, "loss": 0.0016, "step": 333 }, { "clip_ratio/high_max": 0.0023960526814335026, "clip_ratio/high_mean": 0.000980569820967503, "clip_ratio/low_mean": 0.0010936381549981888, "clip_ratio/low_min": 0.00013375626713241218, "clip_ratio/region_mean": 0.0020742080159834586, "epoch": 0.031173255400194833, "grad_norm": 0.131802499294281, "learning_rate": 2e-07, "loss": 0.0892, "step": 334 }, { "clip_ratio/high_max": 0.0020851009903708473, "clip_ratio/high_mean": 0.0008944596920628101, "clip_ratio/low_mean": 0.0010020399931818247, "clip_ratio/low_min": 6.378808029694483e-05, "clip_ratio/region_mean": 0.0018964996925205924, "epoch": 0.03126658850019542, "grad_norm": 0.1128229945898056, "learning_rate": 2e-07, "loss": 0.0539, "step": 335 }, { "clip_ratio/high_max": 0.002273106307256967, "clip_ratio/high_mean": 0.0010320381916244514, "clip_ratio/low_mean": 0.001000911601295229, "clip_ratio/low_min": 0.00013188336470193462, "clip_ratio/region_mean": 0.0020329498074715957, "epoch": 0.031359921600196, "grad_norm": 0.11824652552604675, "learning_rate": 2e-07, "loss": 0.0395, "step": 336 }, { "clip_ratio/high_max": 0.002220172194938641, "clip_ratio/high_mean": 0.0009316638079326367, "clip_ratio/low_mean": 0.0010693099811760476, "clip_ratio/low_min": 0.00012711081399174873, "clip_ratio/region_mean": 0.0020009738072985783, "epoch": 0.03145325470019658, "grad_norm": 0.11748380213975906, "learning_rate": 2e-07, "loss": 0.0251, "step": 337 }, { "clip_ratio/high_max": 0.002139083379006479, "clip_ratio/high_mean": 0.0010679588122002315, "clip_ratio/low_mean": 0.0010761458506749477, "clip_ratio/low_min": 0.0002248327814413642, "clip_ratio/region_mean": 0.0021441046919790097, "epoch": 0.031546587800197166, "grad_norm": 0.1240968406200409, "learning_rate": 2e-07, "loss": 0.0104, "step": 338 }, { "clip_ratio/high_max": 0.0023590052624058444, "clip_ratio/high_mean": 0.0009146658430836396, "clip_ratio/low_mean": 0.0010461594974913169, "clip_ratio/low_min": 0.00017604684217076283, "clip_ratio/region_mean": 0.001960825378773734, "epoch": 0.03163992090019775, "grad_norm": 0.11643088608980179, "learning_rate": 2e-07, "loss": 0.0485, "step": 339 }, { "clip_ratio/high_max": 0.002480952061887365, "clip_ratio/high_mean": 0.0009284691186621785, "clip_ratio/low_mean": 0.0011624251910689054, "clip_ratio/low_min": 0.00016817041978356428, "clip_ratio/region_mean": 0.0020908942751702853, "epoch": 0.03173325400019833, "grad_norm": 0.11981654167175293, "learning_rate": 2e-07, "loss": 0.0555, "step": 340 }, { "clip_ratio/high_max": 0.002171093779907096, "clip_ratio/high_mean": 0.0009637573020881973, "clip_ratio/low_mean": 0.000976807870756602, "clip_ratio/low_min": 4.7221673412423115e-05, "clip_ratio/region_mean": 0.0019405651473789476, "epoch": 0.031826587100198915, "grad_norm": 0.1030951514840126, "learning_rate": 2e-07, "loss": 0.0166, "step": 341 }, { "clip_ratio/high_max": 0.0023250365047715604, "clip_ratio/high_mean": 0.0009597863463568501, "clip_ratio/low_mean": 0.001007146365736844, "clip_ratio/low_min": 0.0001482133870922553, "clip_ratio/region_mean": 0.001966932737559546, "epoch": 0.0319199202001995, "grad_norm": 0.12194515019655228, "learning_rate": 2e-07, "loss": 0.0148, "step": 342 }, { "clip_ratio/high_max": 0.0023266416101250798, "clip_ratio/high_mean": 0.0009423888732271735, "clip_ratio/low_mean": 0.0009500014602963347, "clip_ratio/low_min": 0.00016302731819450855, "clip_ratio/region_mean": 0.0018923903407994658, "epoch": 0.032013253300200085, "grad_norm": 0.15885935723781586, "learning_rate": 2e-07, "loss": 0.024, "step": 343 }, { "clip_ratio/high_max": 0.0023650409493711777, "clip_ratio/high_mean": 0.0010177351632592035, "clip_ratio/low_mean": 0.0010740248726506252, "clip_ratio/low_min": 4.4827003875980154e-05, "clip_ratio/region_mean": 0.002091759961331263, "epoch": 0.032106586400200664, "grad_norm": 0.11424627900123596, "learning_rate": 2e-07, "loss": 0.0258, "step": 344 }, { "clip_ratio/high_max": 0.0020726813636429142, "clip_ratio/high_mean": 0.0009084537705348339, "clip_ratio/low_mean": 0.00098471110140963, "clip_ratio/low_min": 0.00010325823859602679, "clip_ratio/region_mean": 0.001893164895591326, "epoch": 0.03219991950020125, "grad_norm": 0.11793617159128189, "learning_rate": 2e-07, "loss": 0.0092, "step": 345 }, { "clip_ratio/high_max": 0.002211490682384465, "clip_ratio/high_mean": 0.001098279441066552, "clip_ratio/low_mean": 0.0008270462640211917, "clip_ratio/low_min": 0.00010457783719175495, "clip_ratio/region_mean": 0.0019253257050877437, "epoch": 0.032293252600201834, "grad_norm": 0.12200096994638443, "learning_rate": 2e-07, "loss": -0.0205, "step": 346 }, { "clip_ratio/high_max": 0.00233099111210322, "clip_ratio/high_mean": 0.000952059755945811, "clip_ratio/low_mean": 0.0009631025022827089, "clip_ratio/low_min": 0.0001271039236598881, "clip_ratio/region_mean": 0.0019151622618664987, "epoch": 0.03238658570020242, "grad_norm": 0.11682575196027756, "learning_rate": 2e-07, "loss": -0.0068, "step": 347 }, { "clip_ratio/high_max": 0.0023664640393690206, "clip_ratio/high_mean": 0.0009335987579106586, "clip_ratio/low_mean": 0.0010513175802771002, "clip_ratio/low_min": 0.00011428442030592123, "clip_ratio/region_mean": 0.0019849163509206846, "epoch": 0.032479918800203, "grad_norm": 0.11813147366046906, "learning_rate": 2e-07, "loss": 0.0539, "step": 348 }, { "clip_ratio/high_max": 0.002093289811455179, "clip_ratio/high_mean": 0.0008742295394768007, "clip_ratio/low_mean": 0.0009731762547744438, "clip_ratio/low_min": 0.00013083843077765778, "clip_ratio/region_mean": 0.0018474058160791174, "epoch": 0.03257325190020358, "grad_norm": 0.11360342055559158, "learning_rate": 2e-07, "loss": 0.0472, "step": 349 }, { "clip_ratio/high_max": 0.002393559680058388, "clip_ratio/high_mean": 0.0009841141109063756, "clip_ratio/low_mean": 0.0010431089067424182, "clip_ratio/low_min": 0.00016331323968188372, "clip_ratio/region_mean": 0.0020272230831324123, "epoch": 0.03266658500020417, "grad_norm": 0.13561463356018066, "learning_rate": 2e-07, "loss": 0.0382, "step": 350 }, { "clip_ratio/high_max": 0.002164147903386038, "clip_ratio/high_mean": 0.0008933646277000662, "clip_ratio/low_mean": 0.0010264774482493522, "clip_ratio/low_min": 0.00013836673542755307, "clip_ratio/region_mean": 0.0019198420632164925, "epoch": 0.032759918100204746, "grad_norm": 0.11417634785175323, "learning_rate": 2e-07, "loss": 0.044, "step": 351 }, { "clip_ratio/high_max": 0.0022255111907725222, "clip_ratio/high_mean": 0.0009959790295397397, "clip_ratio/low_mean": 0.0009416905886610039, "clip_ratio/low_min": 0.00013209417375037447, "clip_ratio/region_mean": 0.0019376696436665952, "epoch": 0.03285325120020533, "grad_norm": 0.10786327719688416, "learning_rate": 2e-07, "loss": -0.0061, "step": 352 }, { "clip_ratio/high_max": 0.0024176996084861457, "clip_ratio/high_mean": 0.0009324501061200863, "clip_ratio/low_mean": 0.0010348087416787166, "clip_ratio/low_min": 0.00012730852813547244, "clip_ratio/region_mean": 0.00196725879504811, "epoch": 0.03294658430020592, "grad_norm": 0.11818265169858932, "learning_rate": 2e-07, "loss": 0.0509, "step": 353 }, { "clip_ratio/high_max": 0.002107254375005141, "clip_ratio/high_mean": 0.0009269770325772697, "clip_ratio/low_mean": 0.0009891040936054196, "clip_ratio/low_min": 0.00011906828876817599, "clip_ratio/region_mean": 0.0019160810988978483, "epoch": 0.0330399174002065, "grad_norm": 0.12667396664619446, "learning_rate": 2e-07, "loss": 0.0305, "step": 354 }, { "clip_ratio/high_max": 0.001960705045348732, "clip_ratio/high_mean": 0.000833982543554157, "clip_ratio/low_mean": 0.0010087482041853946, "clip_ratio/low_min": 0.00019684484868776053, "clip_ratio/region_mean": 0.0018427307149977423, "epoch": 0.03313325050020708, "grad_norm": 0.12436181306838989, "learning_rate": 2e-07, "loss": 0.045, "step": 355 }, { "clip_ratio/high_max": 0.0020659207948483527, "clip_ratio/high_mean": 0.0008700418384250952, "clip_ratio/low_mean": 0.0011201304077985696, "clip_ratio/low_min": 7.588569405925227e-05, "clip_ratio/region_mean": 0.0019901722407666966, "epoch": 0.033226583600207665, "grad_norm": 0.11962632089853287, "learning_rate": 2e-07, "loss": 0.0543, "step": 356 }, { "clip_ratio/high_max": 0.002466775244101882, "clip_ratio/high_mean": 0.0010720916452555684, "clip_ratio/low_mean": 0.000929301357246004, "clip_ratio/low_min": 8.961488219938474e-05, "clip_ratio/region_mean": 0.002001393018872477, "epoch": 0.03331991670020825, "grad_norm": 0.11339904367923737, "learning_rate": 2e-07, "loss": 0.0168, "step": 357 }, { "clip_ratio/high_max": 0.002149727999494644, "clip_ratio/high_mean": 0.00099827832855226, "clip_ratio/low_mean": 0.0008361318705283338, "clip_ratio/low_min": 9.435636820853688e-05, "clip_ratio/region_mean": 0.001834410177252721, "epoch": 0.033413249800208836, "grad_norm": 0.10464035719633102, "learning_rate": 2e-07, "loss": 0.0152, "step": 358 }, { "clip_ratio/high_max": 0.0022349261489580385, "clip_ratio/high_mean": 0.0009745233910507523, "clip_ratio/low_mean": 0.0010890962948906235, "clip_ratio/low_min": 0.00019618960322986823, "clip_ratio/region_mean": 0.00206361964228563, "epoch": 0.033506582900209414, "grad_norm": 0.1155829057097435, "learning_rate": 2e-07, "loss": 0.0452, "step": 359 }, { "clip_ratio/high_max": 0.0020347935933386907, "clip_ratio/high_mean": 0.0009175762825179845, "clip_ratio/low_mean": 0.0009897929667204153, "clip_ratio/low_min": 7.372469099209411e-05, "clip_ratio/region_mean": 0.0019073692310485058, "epoch": 0.03359991600021, "grad_norm": 0.10900010913610458, "learning_rate": 2e-07, "loss": 0.0033, "step": 360 }, { "clip_ratio/high_max": 0.0022565797407878563, "clip_ratio/high_mean": 0.0009242708329111338, "clip_ratio/low_mean": 0.0010122450548806228, "clip_ratio/low_min": 0.00014858936083328445, "clip_ratio/region_mean": 0.0019365158950677142, "epoch": 0.033693249100210584, "grad_norm": 0.13071617484092712, "learning_rate": 2e-07, "loss": 0.0234, "step": 361 }, { "clip_ratio/high_max": 0.0022458903040387668, "clip_ratio/high_mean": 0.0009609796961740358, "clip_ratio/low_mean": 0.0009439296027267119, "clip_ratio/low_min": 5.524962307390524e-05, "clip_ratio/region_mean": 0.0019049092406930868, "epoch": 0.03378658220021117, "grad_norm": 0.10969194769859314, "learning_rate": 2e-07, "loss": -0.0143, "step": 362 }, { "clip_ratio/high_max": 0.002261694105982315, "clip_ratio/high_mean": 0.0008840756345307454, "clip_ratio/low_mean": 0.0010506906419323059, "clip_ratio/low_min": 0.00021957909575576195, "clip_ratio/region_mean": 0.0019347662891959772, "epoch": 0.03387991530021175, "grad_norm": 0.13056176900863647, "learning_rate": 2e-07, "loss": 0.0285, "step": 363 }, { "clip_ratio/high_max": 0.002028741881076712, "clip_ratio/high_mean": 0.0009438857159693725, "clip_ratio/low_mean": 0.0011309602050459944, "clip_ratio/low_min": 0.00015178522608039202, "clip_ratio/region_mean": 0.002074845993774943, "epoch": 0.03397324840021233, "grad_norm": 0.12196393311023712, "learning_rate": 2e-07, "loss": 0.0206, "step": 364 }, { "clip_ratio/high_max": 0.002436807051708456, "clip_ratio/high_mean": 0.0010417537960165646, "clip_ratio/low_mean": 0.0009605069426470436, "clip_ratio/low_min": 0.00012482506190281129, "clip_ratio/region_mean": 0.0020022606986458413, "epoch": 0.03406658150021292, "grad_norm": 0.11327728629112244, "learning_rate": 2e-07, "loss": -0.0121, "step": 365 }, { "clip_ratio/high_max": 0.002339727943763137, "clip_ratio/high_mean": 0.0010352220233471598, "clip_ratio/low_mean": 0.0011386352161935065, "clip_ratio/low_min": 4.074403295817319e-05, "clip_ratio/region_mean": 0.002173857174057048, "epoch": 0.034159914600213497, "grad_norm": 0.11825881898403168, "learning_rate": 2e-07, "loss": 0.067, "step": 366 }, { "clip_ratio/high_max": 0.0024218938051490113, "clip_ratio/high_mean": 0.000924776455576648, "clip_ratio/low_mean": 0.0009141574355453486, "clip_ratio/low_min": 5.823581113872933e-05, "clip_ratio/region_mean": 0.0018389338729321025, "epoch": 0.03425324770021408, "grad_norm": 0.10933463275432587, "learning_rate": 2e-07, "loss": 0.0018, "step": 367 }, { "clip_ratio/high_max": 0.0022142408342915587, "clip_ratio/high_mean": 0.0010255488959955983, "clip_ratio/low_mean": 0.0009670257386460435, "clip_ratio/low_min": 0.00010940259926428553, "clip_ratio/region_mean": 0.0019925746746594086, "epoch": 0.03434658080021467, "grad_norm": 0.11526765674352646, "learning_rate": 2e-07, "loss": -0.0085, "step": 368 }, { "clip_ratio/high_max": 0.0019511819336912595, "clip_ratio/high_mean": 0.0008641749609523686, "clip_ratio/low_mean": 0.0010229588951915503, "clip_ratio/low_min": 0.00010771323559310986, "clip_ratio/region_mean": 0.0018871338470489718, "epoch": 0.03443991390021525, "grad_norm": 0.11865226179361343, "learning_rate": 2e-07, "loss": 0.0432, "step": 369 }, { "clip_ratio/high_max": 0.0020448726609174628, "clip_ratio/high_mean": 0.0008958521975728218, "clip_ratio/low_mean": 0.0009560480157233542, "clip_ratio/low_min": 0.00011208213072677609, "clip_ratio/region_mean": 0.0018519002187531441, "epoch": 0.03453324700021583, "grad_norm": 0.11468666046857834, "learning_rate": 2e-07, "loss": 0.0135, "step": 370 }, { "clip_ratio/high_max": 0.002502015391655732, "clip_ratio/high_mean": 0.0011075132133555599, "clip_ratio/low_mean": 0.0010141358761757147, "clip_ratio/low_min": 0.0001334635726379929, "clip_ratio/region_mean": 0.002121649078617338, "epoch": 0.034626580100216416, "grad_norm": 0.11855193227529526, "learning_rate": 2e-07, "loss": 0.0115, "step": 371 }, { "clip_ratio/high_max": 0.0020563003126881085, "clip_ratio/high_mean": 0.0008553052284696605, "clip_ratio/low_mean": 0.0009304502837039763, "clip_ratio/low_min": 7.837172233848833e-05, "clip_ratio/region_mean": 0.0017857555139926262, "epoch": 0.034719913200217, "grad_norm": 0.1174718514084816, "learning_rate": 2e-07, "loss": 0.0, "step": 372 }, { "clip_ratio/high_max": 0.002241092861368088, "clip_ratio/high_mean": 0.000938063323701499, "clip_ratio/low_mean": 0.0009876362564682495, "clip_ratio/low_min": 7.666890769542078e-05, "clip_ratio/region_mean": 0.0019256996238254942, "epoch": 0.034813246300217586, "grad_norm": 0.12360448390245438, "learning_rate": 2e-07, "loss": 0.0464, "step": 373 }, { "clip_ratio/high_max": 0.002300617481523659, "clip_ratio/high_mean": 0.0010381426582171116, "clip_ratio/low_mean": 0.0009303783372160979, "clip_ratio/low_min": 0.00011484210972412257, "clip_ratio/region_mean": 0.0019685210354509763, "epoch": 0.034906579400218164, "grad_norm": 0.12292679399251938, "learning_rate": 2e-07, "loss": 0.004, "step": 374 }, { "clip_ratio/high_max": 0.0021412240967038088, "clip_ratio/high_mean": 0.0009194662670779508, "clip_ratio/low_mean": 0.0010363605433667544, "clip_ratio/low_min": 0.0001080445499610505, "clip_ratio/region_mean": 0.001955826810444705, "epoch": 0.03499991250021875, "grad_norm": 0.12341368198394775, "learning_rate": 2e-07, "loss": 0.0106, "step": 375 }, { "clip_ratio/high_max": 0.0023683832187089138, "clip_ratio/high_mean": 0.0010561526105448138, "clip_ratio/low_mean": 0.0010940790343738627, "clip_ratio/low_min": 0.0001603238324605627, "clip_ratio/region_mean": 0.0021502316449186765, "epoch": 0.035093245600219335, "grad_norm": 0.11230902373790741, "learning_rate": 2e-07, "loss": 0.0217, "step": 376 }, { "clip_ratio/high_max": 0.002472067753842566, "clip_ratio/high_mean": 0.0010215282563876826, "clip_ratio/low_mean": 0.0010584321516944328, "clip_ratio/low_min": 0.00010600108180369716, "clip_ratio/region_mean": 0.00207996042445302, "epoch": 0.03518657870021991, "grad_norm": 0.11010879278182983, "learning_rate": 2e-07, "loss": 0.0253, "step": 377 }, { "clip_ratio/high_max": 0.002573350560851395, "clip_ratio/high_mean": 0.001136587030487135, "clip_ratio/low_mean": 0.0007913624704087852, "clip_ratio/low_min": 4.0904425986809656e-05, "clip_ratio/region_mean": 0.0019279494736110792, "epoch": 0.0352799118002205, "grad_norm": 0.11940529197454453, "learning_rate": 2e-07, "loss": -0.0519, "step": 378 }, { "clip_ratio/high_max": 0.002073470470350003, "clip_ratio/high_mean": 0.0008529664482921362, "clip_ratio/low_mean": 0.0012406544337864034, "clip_ratio/low_min": 0.0002700552331589279, "clip_ratio/region_mean": 0.0020936209039064124, "epoch": 0.03537324490022108, "grad_norm": 0.12314601987600327, "learning_rate": 2e-07, "loss": 0.0653, "step": 379 }, { "clip_ratio/high_max": 0.0020780018021469004, "clip_ratio/high_mean": 0.0009273533923987998, "clip_ratio/low_mean": 0.0009265466105716769, "clip_ratio/low_min": 0.0001114659353333991, "clip_ratio/region_mean": 0.0018539000084274448, "epoch": 0.03546657800022167, "grad_norm": 0.11450739949941635, "learning_rate": 2e-07, "loss": -0.0485, "step": 380 }, { "clip_ratio/high_max": 0.001717559622193221, "clip_ratio/high_mean": 0.0008335874736076221, "clip_ratio/low_mean": 0.0009617204977985239, "clip_ratio/low_min": 6.846310679975431e-05, "clip_ratio/region_mean": 0.0017953079732251354, "epoch": 0.03555991110022225, "grad_norm": 0.11781059205532074, "learning_rate": 2e-07, "loss": 0.0343, "step": 381 }, { "clip_ratio/high_max": 0.002344134933082387, "clip_ratio/high_mean": 0.0008995527696242789, "clip_ratio/low_mean": 0.0011606791376834735, "clip_ratio/low_min": 0.00016642602258798433, "clip_ratio/region_mean": 0.00206023188366089, "epoch": 0.03565324420022283, "grad_norm": 0.11900895833969116, "learning_rate": 2e-07, "loss": 0.0285, "step": 382 }, { "clip_ratio/high_max": 0.0019259789114585146, "clip_ratio/high_mean": 0.0008842626375553664, "clip_ratio/low_mean": 0.0010764770922833122, "clip_ratio/low_min": 0.0001375008505419828, "clip_ratio/region_mean": 0.0019607396898209117, "epoch": 0.03574657730022342, "grad_norm": 0.12927794456481934, "learning_rate": 2e-07, "loss": 0.0581, "step": 383 }, { "clip_ratio/high_max": 0.002059536025626585, "clip_ratio/high_mean": 0.0009178772397717694, "clip_ratio/low_mean": 0.0010624783753883094, "clip_ratio/low_min": 0.00016081609101092909, "clip_ratio/region_mean": 0.001980355620617047, "epoch": 0.035839910400224, "grad_norm": 0.10502680391073227, "learning_rate": 2e-07, "loss": 0.0242, "step": 384 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.01385498046875, "completions/max_length": 4096.0, "completions/max_terminated_length": 4092.0, "completions/mean_length": 610.0624389648438, "completions/mean_terminated_length": 561.0862426757812, "completions/min_length": 2.0, "completions/min_terminated_length": 2.0, "epoch": 0.03593324350022458, "grad_norm": 0.11456090956926346, "learning_rate": 2e-07, "loss": 0.0353, "num_tokens": 324578048.0, "reward": 0.542855441570282, "reward_std": 0.22516277432441711, "rewards/simpleverify_reward/mean": 0.5428553819656372, "rewards/simpleverify_reward/std": 0.49816226959228516, "step": 385 }, { "clip_ratio/high_max": 0.0017559950974828098, "clip_ratio/high_mean": 0.0007278089196915971, "clip_ratio/low_mean": 0.0006625809169236163, "clip_ratio/low_min": 2.473902077326784e-05, "clip_ratio/region_mean": 0.0013903898689022753, "epoch": 0.036026576600225166, "grad_norm": 0.12734541296958923, "learning_rate": 2e-07, "loss": 0.0921, "step": 386 }, { "clip_ratio/high_max": 0.0025453791677136905, "clip_ratio/high_mean": 0.001037432437442476, "clip_ratio/low_mean": 0.0006035990427335491, "clip_ratio/low_min": 2.980758472403977e-05, "clip_ratio/region_mean": 0.001641031492908951, "epoch": 0.03611990970022575, "grad_norm": 0.12250111252069473, "learning_rate": 2e-07, "loss": 0.0138, "step": 387 }, { "clip_ratio/high_max": 0.002207361932960339, "clip_ratio/high_mean": 0.0009231314470525831, "clip_ratio/low_mean": 0.0006365234930854058, "clip_ratio/low_min": 4.147783965890994e-05, "clip_ratio/region_mean": 0.0015596549419569783, "epoch": 0.03621324280022633, "grad_norm": 0.11904287338256836, "learning_rate": 2e-07, "loss": 0.0094, "step": 388 }, { "clip_ratio/high_max": 0.002101827267324552, "clip_ratio/high_mean": 0.0008576082727813628, "clip_ratio/low_mean": 0.0006074333177821245, "clip_ratio/low_min": 0.00012706233428616542, "clip_ratio/region_mean": 0.001465041594201466, "epoch": 0.036306575900226914, "grad_norm": 0.12277815490961075, "learning_rate": 2e-07, "loss": 0.0258, "step": 389 }, { "clip_ratio/high_max": 0.0017382308360538445, "clip_ratio/high_mean": 0.0007671240900890552, "clip_ratio/low_mean": 0.0005518902717085439, "clip_ratio/low_min": 2.4696095351828262e-05, "clip_ratio/region_mean": 0.001319014347245684, "epoch": 0.0363999090002275, "grad_norm": 0.10924790054559708, "learning_rate": 2e-07, "loss": 0.0428, "step": 390 }, { "clip_ratio/high_max": 0.0017924217827385291, "clip_ratio/high_mean": 0.0008786258604231989, "clip_ratio/low_mean": 0.000545529298733527, "clip_ratio/low_min": 3.931362880393863e-05, "clip_ratio/region_mean": 0.0014241551580198575, "epoch": 0.036493242100228085, "grad_norm": 0.11210854351520538, "learning_rate": 2e-07, "loss": 0.0014, "step": 391 }, { "clip_ratio/high_max": 0.0020536320880637504, "clip_ratio/high_mean": 0.000947290889598662, "clip_ratio/low_mean": 0.000586602432122163, "clip_ratio/low_min": 3.528143952280516e-05, "clip_ratio/region_mean": 0.0015338933153543621, "epoch": 0.03658657520022866, "grad_norm": 0.11201830208301544, "learning_rate": 2e-07, "loss": 0.0132, "step": 392 }, { "clip_ratio/high_max": 0.002088896362693049, "clip_ratio/high_mean": 0.0009022970916703343, "clip_ratio/low_mean": 0.0006837162873125635, "clip_ratio/low_min": 5.8115100273425924e-05, "clip_ratio/region_mean": 0.001586013393534813, "epoch": 0.03667990830022925, "grad_norm": 0.1244579628109932, "learning_rate": 2e-07, "loss": 0.0035, "step": 393 }, { "clip_ratio/high_max": 0.0022416405045078136, "clip_ratio/high_mean": 0.0009764331734913867, "clip_ratio/low_mean": 0.0007038564081085497, "clip_ratio/low_min": 0.00010393485035820049, "clip_ratio/region_mean": 0.0016802896207082085, "epoch": 0.036773241400229834, "grad_norm": 0.12332562357187271, "learning_rate": 2e-07, "loss": 0.0193, "step": 394 }, { "clip_ratio/high_max": 0.0021914375174674205, "clip_ratio/high_mean": 0.0008885363968147431, "clip_ratio/low_mean": 0.0007157253603509162, "clip_ratio/low_min": 6.815265896875644e-05, "clip_ratio/region_mean": 0.0016042617935454473, "epoch": 0.03686657450023042, "grad_norm": 0.11344970017671585, "learning_rate": 2e-07, "loss": 0.0452, "step": 395 }, { "clip_ratio/high_max": 0.0022176111160661094, "clip_ratio/high_mean": 0.0009343643869215157, "clip_ratio/low_mean": 0.0006915263647897518, "clip_ratio/low_min": 7.837035718694096e-05, "clip_ratio/region_mean": 0.00162589069805108, "epoch": 0.036959907600231, "grad_norm": 0.41706404089927673, "learning_rate": 2e-07, "loss": 0.021, "step": 396 }, { "clip_ratio/high_max": 0.002177739210310392, "clip_ratio/high_mean": 0.0010119580347236479, "clip_ratio/low_mean": 0.0006430951716538402, "clip_ratio/low_min": 1.5133171473280527e-05, "clip_ratio/region_mean": 0.0016550532091059722, "epoch": 0.03705324070023158, "grad_norm": 0.1147422045469284, "learning_rate": 2e-07, "loss": 0.0005, "step": 397 }, { "clip_ratio/high_max": 0.002158268849598244, "clip_ratio/high_mean": 0.0008790599968051538, "clip_ratio/low_mean": 0.0006097410569054773, "clip_ratio/low_min": 3.072822710237233e-05, "clip_ratio/region_mean": 0.0014888010045979172, "epoch": 0.03714657380023217, "grad_norm": 0.11150866001844406, "learning_rate": 2e-07, "loss": 0.0177, "step": 398 }, { "clip_ratio/high_max": 0.002348668422200717, "clip_ratio/high_mean": 0.0009394072658324149, "clip_ratio/low_mean": 0.0006304159160208656, "clip_ratio/low_min": 6.635166710111662e-05, "clip_ratio/region_mean": 0.0015698231582064182, "epoch": 0.03723990690023275, "grad_norm": 0.11647429317235947, "learning_rate": 2e-07, "loss": 0.0373, "step": 399 }, { "clip_ratio/high_max": 0.002322462205484044, "clip_ratio/high_mean": 0.0009234979879693128, "clip_ratio/low_mean": 0.0006471525362030661, "clip_ratio/low_min": 1.3429307728074491e-05, "clip_ratio/region_mean": 0.0015706504782428965, "epoch": 0.03733324000023333, "grad_norm": 0.1072663888335228, "learning_rate": 2e-07, "loss": -0.0051, "step": 400 }, { "clip_ratio/high_max": 0.002038626596913673, "clip_ratio/high_mean": 0.0008996784690680215, "clip_ratio/low_mean": 0.0007853080878703622, "clip_ratio/low_min": 1.5147842532314826e-05, "clip_ratio/region_mean": 0.0016849865569383837, "epoch": 0.037426573100233916, "grad_norm": 0.11729703098535538, "learning_rate": 2e-07, "loss": 0.0285, "step": 401 }, { "clip_ratio/high_max": 0.0022657900117337704, "clip_ratio/high_mean": 0.0008789943785814103, "clip_ratio/low_mean": 0.0006538500347232912, "clip_ratio/low_min": 6.575021598109743e-05, "clip_ratio/region_mean": 0.0015328443769249134, "epoch": 0.0375199062002345, "grad_norm": 0.11642471700906754, "learning_rate": 2e-07, "loss": 0.017, "step": 402 }, { "clip_ratio/high_max": 0.0025832977989921346, "clip_ratio/high_mean": 0.0009106796187552391, "clip_ratio/low_mean": 0.000755996246880386, "clip_ratio/low_min": 8.744717524677981e-05, "clip_ratio/region_mean": 0.0016666758892824873, "epoch": 0.03761323930023508, "grad_norm": 0.11483058333396912, "learning_rate": 2e-07, "loss": 0.0479, "step": 403 }, { "clip_ratio/high_max": 0.002341608633287251, "clip_ratio/high_mean": 0.0008568004304834176, "clip_ratio/low_mean": 0.0008145177525875624, "clip_ratio/low_min": 8.177264408004703e-05, "clip_ratio/region_mean": 0.0016713181685190648, "epoch": 0.037706572400235665, "grad_norm": 0.11411089450120926, "learning_rate": 2e-07, "loss": 0.0484, "step": 404 }, { "clip_ratio/high_max": 0.002321920786926057, "clip_ratio/high_mean": 0.0010088994895340875, "clip_ratio/low_mean": 0.0008522099797119154, "clip_ratio/low_min": 0.00011332449093970354, "clip_ratio/region_mean": 0.001861109492892865, "epoch": 0.03779990550023625, "grad_norm": 0.15908290445804596, "learning_rate": 2e-07, "loss": 0.0316, "step": 405 }, { "clip_ratio/high_max": 0.0020113326208957005, "clip_ratio/high_mean": 0.0009313923310401151, "clip_ratio/low_mean": 0.0007562105347460601, "clip_ratio/low_min": 0.00010178752654610435, "clip_ratio/region_mean": 0.0016876028676051646, "epoch": 0.037893238600236835, "grad_norm": 0.12024180591106415, "learning_rate": 2e-07, "loss": 0.0512, "step": 406 }, { "clip_ratio/high_max": 0.002122077356034424, "clip_ratio/high_mean": 0.0009245533128705574, "clip_ratio/low_mean": 0.0006972420669626445, "clip_ratio/low_min": 6.107484296080656e-05, "clip_ratio/region_mean": 0.0016217953743762337, "epoch": 0.03798657170023741, "grad_norm": 0.11804087460041046, "learning_rate": 2e-07, "loss": -0.001, "step": 407 }, { "clip_ratio/high_max": 0.002408103613561252, "clip_ratio/high_mean": 0.0010119622256752336, "clip_ratio/low_mean": 0.0008201911550713703, "clip_ratio/low_min": 0.00013450218921207124, "clip_ratio/region_mean": 0.0018321533789276145, "epoch": 0.038079904800238, "grad_norm": 0.13277433812618256, "learning_rate": 2e-07, "loss": 0.0206, "step": 408 }, { "clip_ratio/high_max": 0.0022254596842685714, "clip_ratio/high_mean": 0.0008891799989214633, "clip_ratio/low_mean": 0.0008455715124000562, "clip_ratio/low_min": 4.309249561629258e-05, "clip_ratio/region_mean": 0.0017347514949506149, "epoch": 0.038173237900238584, "grad_norm": 0.10766805708408356, "learning_rate": 2e-07, "loss": 0.028, "step": 409 }, { "clip_ratio/high_max": 0.0022778219936299138, "clip_ratio/high_mean": 0.0009811555210035294, "clip_ratio/low_mean": 0.0009155531606666045, "clip_ratio/low_min": 0.0001742051399560296, "clip_ratio/region_mean": 0.001896708672575187, "epoch": 0.03826657100023917, "grad_norm": 0.11431422084569931, "learning_rate": 2e-07, "loss": 0.0281, "step": 410 }, { "clip_ratio/high_max": 0.002379552839556709, "clip_ratio/high_mean": 0.0010144433144887444, "clip_ratio/low_mean": 0.0009587348067725543, "clip_ratio/low_min": 6.265518140935455e-05, "clip_ratio/region_mean": 0.0019731781067093834, "epoch": 0.03835990410023975, "grad_norm": 0.1265234500169754, "learning_rate": 2e-07, "loss": -0.0073, "step": 411 }, { "clip_ratio/high_max": 0.0024561990285292268, "clip_ratio/high_mean": 0.0009134203501162119, "clip_ratio/low_mean": 0.0008060858926910441, "clip_ratio/low_min": 0.00010697371635615127, "clip_ratio/region_mean": 0.0017195062391692773, "epoch": 0.03845323720024033, "grad_norm": 0.10894020646810532, "learning_rate": 2e-07, "loss": 0.0345, "step": 412 }, { "clip_ratio/high_max": 0.0020608718223229516, "clip_ratio/high_mean": 0.0008798518083494855, "clip_ratio/low_mean": 0.000959227454586653, "clip_ratio/low_min": 8.417437402385985e-05, "clip_ratio/region_mean": 0.0018390792611171491, "epoch": 0.03854657030024092, "grad_norm": 0.115571029484272, "learning_rate": 2e-07, "loss": 0.0932, "step": 413 }, { "clip_ratio/high_max": 0.0021653893709299155, "clip_ratio/high_mean": 0.0009181729783449555, "clip_ratio/low_mean": 0.0007792789074301254, "clip_ratio/low_min": 7.235440443764674e-05, "clip_ratio/region_mean": 0.0016974519021459855, "epoch": 0.038639903400241496, "grad_norm": 0.11313897371292114, "learning_rate": 2e-07, "loss": -0.0202, "step": 414 }, { "clip_ratio/high_max": 0.0015843709406908602, "clip_ratio/high_mean": 0.0007469617776223458, "clip_ratio/low_mean": 0.001031487510772422, "clip_ratio/low_min": 0.0001532384185338742, "clip_ratio/region_mean": 0.001778449248377001, "epoch": 0.03873323650024208, "grad_norm": 0.11486821621656418, "learning_rate": 2e-07, "loss": 0.0531, "step": 415 }, { "clip_ratio/high_max": 0.0021730950320488773, "clip_ratio/high_mean": 0.0009340861925011268, "clip_ratio/low_mean": 0.0008123939496726962, "clip_ratio/low_min": 3.760500840144232e-05, "clip_ratio/region_mean": 0.0017464801640016958, "epoch": 0.038826569600242666, "grad_norm": 0.1169021725654602, "learning_rate": 2e-07, "loss": -0.0026, "step": 416 }, { "clip_ratio/high_max": 0.0023038371073198505, "clip_ratio/high_mean": 0.0009995346645155223, "clip_ratio/low_mean": 0.0007750027743895771, "clip_ratio/low_min": 7.786385185681866e-05, "clip_ratio/region_mean": 0.0017745374134392478, "epoch": 0.03891990270024325, "grad_norm": 0.11159112304449081, "learning_rate": 2e-07, "loss": 0.0081, "step": 417 }, { "clip_ratio/high_max": 0.002187954778491985, "clip_ratio/high_mean": 0.000844255082483869, "clip_ratio/low_mean": 0.000821132845885586, "clip_ratio/low_min": 8.449188044323819e-05, "clip_ratio/region_mean": 0.0016653879138175398, "epoch": 0.03901323580024383, "grad_norm": 0.11673636734485626, "learning_rate": 2e-07, "loss": 0.0344, "step": 418 }, { "clip_ratio/high_max": 0.002005532383918762, "clip_ratio/high_mean": 0.0009599970871931873, "clip_ratio/low_mean": 0.0008041258988669142, "clip_ratio/low_min": 7.307736086659133e-05, "clip_ratio/region_mean": 0.0017641229860601015, "epoch": 0.039106568900244415, "grad_norm": 0.11489438265562057, "learning_rate": 2e-07, "loss": 0.0, "step": 419 }, { "clip_ratio/high_max": 0.0021378632191044744, "clip_ratio/high_mean": 0.0009017400388984242, "clip_ratio/low_mean": 0.0008868317345331889, "clip_ratio/low_min": 0.00010697852940211305, "clip_ratio/region_mean": 0.0017885717934404965, "epoch": 0.039199902000245, "grad_norm": 0.11440420895814896, "learning_rate": 2e-07, "loss": -0.0311, "step": 420 }, { "clip_ratio/high_max": 0.0020561671553878114, "clip_ratio/high_mean": 0.0009365045552840456, "clip_ratio/low_mean": 0.0009586295018380042, "clip_ratio/low_min": 7.407742759824032e-05, "clip_ratio/region_mean": 0.0018951340316561982, "epoch": 0.039293235100245585, "grad_norm": 0.12472552061080933, "learning_rate": 2e-07, "loss": 0.021, "step": 421 }, { "clip_ratio/high_max": 0.002289889074745588, "clip_ratio/high_mean": 0.0008830113383737626, "clip_ratio/low_mean": 0.0008777020302659366, "clip_ratio/low_min": 0.00014692296645080205, "clip_ratio/region_mean": 0.001760713363182731, "epoch": 0.039386568200246164, "grad_norm": 0.11912091821432114, "learning_rate": 2e-07, "loss": 0.0563, "step": 422 }, { "clip_ratio/high_max": 0.0021351189934648573, "clip_ratio/high_mean": 0.0010460507473908365, "clip_ratio/low_mean": 0.0008984843479993287, "clip_ratio/low_min": 8.304466882691486e-05, "clip_ratio/region_mean": 0.0019445350917521864, "epoch": 0.03947990130024675, "grad_norm": 0.11897817254066467, "learning_rate": 2e-07, "loss": -0.0148, "step": 423 }, { "clip_ratio/high_max": 0.002029441006015986, "clip_ratio/high_mean": 0.0008940010302467272, "clip_ratio/low_mean": 0.0008420993217441719, "clip_ratio/low_min": 0.00011270071991020814, "clip_ratio/region_mean": 0.001736100297421217, "epoch": 0.039573234400247334, "grad_norm": 0.11907520890235901, "learning_rate": 2e-07, "loss": 0.0355, "step": 424 }, { "clip_ratio/high_max": 0.002256054744066205, "clip_ratio/high_mean": 0.000823764306915109, "clip_ratio/low_mean": 0.0009657354548835428, "clip_ratio/low_min": 0.00016057623543019872, "clip_ratio/region_mean": 0.0017894997872645035, "epoch": 0.03966656750024792, "grad_norm": 0.10738899558782578, "learning_rate": 2e-07, "loss": 0.0322, "step": 425 }, { "clip_ratio/high_max": 0.0019007241644430906, "clip_ratio/high_mean": 0.000886846573848743, "clip_ratio/low_mean": 0.0008935526475397637, "clip_ratio/low_min": 0.0001384626093567931, "clip_ratio/region_mean": 0.0017803992377594113, "epoch": 0.0397599006002485, "grad_norm": 0.11808796226978302, "learning_rate": 2e-07, "loss": 0.0259, "step": 426 }, { "clip_ratio/high_max": 0.0021683628583559766, "clip_ratio/high_mean": 0.000908164780412335, "clip_ratio/low_mean": 0.0008357383994734846, "clip_ratio/low_min": 3.868919429805828e-05, "clip_ratio/region_mean": 0.001743903150781989, "epoch": 0.03985323370024908, "grad_norm": 0.10963170230388641, "learning_rate": 2e-07, "loss": -0.01, "step": 427 }, { "clip_ratio/high_max": 0.0023480984164052643, "clip_ratio/high_mean": 0.0009342571902379859, "clip_ratio/low_mean": 0.0009715138603496598, "clip_ratio/low_min": 9.676904392108554e-05, "clip_ratio/region_mean": 0.0019057710524066351, "epoch": 0.03994656680024967, "grad_norm": 0.11410797387361526, "learning_rate": 2e-07, "loss": 0.0159, "step": 428 }, { "clip_ratio/high_max": 0.0021386182379501406, "clip_ratio/high_mean": 0.0009525562927592546, "clip_ratio/low_mean": 0.0008880508376023499, "clip_ratio/low_min": 7.192369230324402e-05, "clip_ratio/region_mean": 0.001840607132180594, "epoch": 0.040039899900250246, "grad_norm": 0.11762690544128418, "learning_rate": 2e-07, "loss": 0.0243, "step": 429 }, { "clip_ratio/high_max": 0.0023347691239905544, "clip_ratio/high_mean": 0.0009237483282049652, "clip_ratio/low_mean": 0.0009447772499697749, "clip_ratio/low_min": 5.856984444108093e-05, "clip_ratio/region_mean": 0.00186852557817474, "epoch": 0.04013323300025083, "grad_norm": 0.1171240285038948, "learning_rate": 2e-07, "loss": 0.0046, "step": 430 }, { "clip_ratio/high_max": 0.002405291117611341, "clip_ratio/high_mean": 0.000983984675258398, "clip_ratio/low_mean": 0.0008869818539096741, "clip_ratio/low_min": 0.00011179559714946663, "clip_ratio/region_mean": 0.0018709665164351463, "epoch": 0.04022656610025142, "grad_norm": 0.12378175556659698, "learning_rate": 2e-07, "loss": 0.0109, "step": 431 }, { "clip_ratio/high_max": 0.002442537537717726, "clip_ratio/high_mean": 0.0009348319763375912, "clip_ratio/low_mean": 0.0008514675646438263, "clip_ratio/low_min": 7.385962999251205e-05, "clip_ratio/region_mean": 0.0017862995227915235, "epoch": 0.040319899200252, "grad_norm": 0.12251628190279007, "learning_rate": 2e-07, "loss": 0.0401, "step": 432 }, { "clip_ratio/high_max": 0.0021499075228348374, "clip_ratio/high_mean": 0.0009057115094037727, "clip_ratio/low_mean": 0.0006973655472393148, "clip_ratio/low_min": 9.860417776508257e-05, "clip_ratio/region_mean": 0.0016030770711950026, "epoch": 0.04041323230025258, "grad_norm": 0.11849484592676163, "learning_rate": 2e-07, "loss": 0.0494, "step": 433 }, { "clip_ratio/high_max": 0.0022954697778914124, "clip_ratio/high_mean": 0.001005030469968915, "clip_ratio/low_mean": 0.0009653125925979111, "clip_ratio/low_min": 0.00011913711205124855, "clip_ratio/region_mean": 0.001970343029825017, "epoch": 0.040506565400253165, "grad_norm": 0.1204654648900032, "learning_rate": 2e-07, "loss": -0.014, "step": 434 }, { "clip_ratio/high_max": 0.0023600153290317394, "clip_ratio/high_mean": 0.0009908346910378896, "clip_ratio/low_mean": 0.0008754766950005433, "clip_ratio/low_min": 9.876540480036056e-05, "clip_ratio/region_mean": 0.0018663113951333798, "epoch": 0.04059989850025375, "grad_norm": 0.11963741481304169, "learning_rate": 2e-07, "loss": 0.0356, "step": 435 }, { "clip_ratio/high_max": 0.0026319170865463093, "clip_ratio/high_mean": 0.0010589698576950468, "clip_ratio/low_mean": 0.0009423672199773137, "clip_ratio/low_min": 0.00015106409819054534, "clip_ratio/region_mean": 0.002001337052206509, "epoch": 0.040693231600254336, "grad_norm": 0.1166808232665062, "learning_rate": 2e-07, "loss": 0.0172, "step": 436 }, { "clip_ratio/high_max": 0.0021439512056531385, "clip_ratio/high_mean": 0.0009789100204216084, "clip_ratio/low_mean": 0.0008508803093718598, "clip_ratio/low_min": 8.443144088232657e-05, "clip_ratio/region_mean": 0.0018297903152415529, "epoch": 0.040786564700254914, "grad_norm": 0.11000310629606247, "learning_rate": 2e-07, "loss": 0.0212, "step": 437 }, { "clip_ratio/high_max": 0.001877994101960212, "clip_ratio/high_mean": 0.0009132352424785495, "clip_ratio/low_mean": 0.0010401819527032785, "clip_ratio/low_min": 0.00017218431094079278, "clip_ratio/region_mean": 0.0019534171442501247, "epoch": 0.0408798978002555, "grad_norm": 0.12231463938951492, "learning_rate": 2e-07, "loss": 0.0063, "step": 438 }, { "clip_ratio/high_max": 0.0023249160585692152, "clip_ratio/high_mean": 0.0009128108540608082, "clip_ratio/low_mean": 0.000937574546696851, "clip_ratio/low_min": 8.207910013879882e-05, "clip_ratio/region_mean": 0.001850385422585532, "epoch": 0.040973230900256084, "grad_norm": 0.11456317454576492, "learning_rate": 2e-07, "loss": 0.0392, "step": 439 }, { "clip_ratio/high_max": 0.0018445767418597825, "clip_ratio/high_mean": 0.0007718229080637684, "clip_ratio/low_mean": 0.0008855989108269569, "clip_ratio/low_min": 0.00012021566999464994, "clip_ratio/region_mean": 0.001657421853451524, "epoch": 0.04106656400025666, "grad_norm": 0.11749608814716339, "learning_rate": 2e-07, "loss": 0.0654, "step": 440 }, { "clip_ratio/high_max": 0.0023254263069247827, "clip_ratio/high_mean": 0.0009989120771933813, "clip_ratio/low_mean": 0.0008875624753272859, "clip_ratio/low_min": 0.0001063389581759111, "clip_ratio/region_mean": 0.0018864745361497626, "epoch": 0.04115989710025725, "grad_norm": 0.11897794902324677, "learning_rate": 2e-07, "loss": 0.0189, "step": 441 }, { "clip_ratio/high_max": 0.0022615913694608025, "clip_ratio/high_mean": 0.0009701209492050111, "clip_ratio/low_mean": 0.0009497709852439584, "clip_ratio/low_min": 5.3731739171780646e-05, "clip_ratio/region_mean": 0.0019198919253540225, "epoch": 0.04125323020025783, "grad_norm": 0.11869539320468903, "learning_rate": 2e-07, "loss": 0.0122, "step": 442 }, { "clip_ratio/high_max": 0.002077365486911731, "clip_ratio/high_mean": 0.0007901588214735966, "clip_ratio/low_mean": 0.0009481882589170709, "clip_ratio/low_min": 0.00011752995578717673, "clip_ratio/region_mean": 0.0017383470694767311, "epoch": 0.04134656330025842, "grad_norm": 0.11476495862007141, "learning_rate": 2e-07, "loss": 0.0648, "step": 443 }, { "clip_ratio/high_max": 0.002063651605567429, "clip_ratio/high_mean": 0.0008007544729480287, "clip_ratio/low_mean": 0.000982819103228394, "clip_ratio/low_min": 6.837996534159174e-05, "clip_ratio/region_mean": 0.001783573636203073, "epoch": 0.041439896400258996, "grad_norm": 0.12138523161411285, "learning_rate": 2e-07, "loss": 0.0575, "step": 444 }, { "clip_ratio/high_max": 0.0018952958707814105, "clip_ratio/high_mean": 0.0007762268505757675, "clip_ratio/low_mean": 0.0009758286523720017, "clip_ratio/low_min": 0.00013074854177830275, "clip_ratio/region_mean": 0.001752055533870589, "epoch": 0.04153322950025958, "grad_norm": 0.11283163726329803, "learning_rate": 2e-07, "loss": 0.0326, "step": 445 }, { "clip_ratio/high_max": 0.0022156291088322178, "clip_ratio/high_mean": 0.0009682324453024194, "clip_ratio/low_mean": 0.0008335664751939476, "clip_ratio/low_min": 9.294639221479883e-05, "clip_ratio/region_mean": 0.001801798898668494, "epoch": 0.04162656260026017, "grad_norm": 0.11176684498786926, "learning_rate": 2e-07, "loss": 0.0136, "step": 446 }, { "clip_ratio/high_max": 0.002304917714354815, "clip_ratio/high_mean": 0.0010254782373522175, "clip_ratio/low_mean": 0.0009440064895898104, "clip_ratio/low_min": 0.00015700748735980596, "clip_ratio/region_mean": 0.001969484714209102, "epoch": 0.04171989570026075, "grad_norm": 0.12780800461769104, "learning_rate": 2e-07, "loss": -0.0171, "step": 447 }, { "clip_ratio/high_max": 0.002577936051238794, "clip_ratio/high_mean": 0.0010225201949651819, "clip_ratio/low_mean": 0.0009891313875414198, "clip_ratio/low_min": 0.00021590694450424053, "clip_ratio/region_mean": 0.0020116516097914428, "epoch": 0.04181322880026133, "grad_norm": 0.1125578060746193, "learning_rate": 2e-07, "loss": 0.0181, "step": 448 }, { "clip_ratio/high_max": 0.0025572296217433177, "clip_ratio/high_mean": 0.0011314970506646205, "clip_ratio/low_mean": 0.0008513731918355916, "clip_ratio/low_min": 6.788527934986632e-05, "clip_ratio/region_mean": 0.001982870206120424, "epoch": 0.041906561900261916, "grad_norm": 0.14265777170658112, "learning_rate": 2e-07, "loss": -0.018, "step": 449 }, { "clip_ratio/high_max": 0.002116962190484628, "clip_ratio/high_mean": 0.0009591196649125777, "clip_ratio/low_mean": 0.000981863271590555, "clip_ratio/low_min": 8.361827076441841e-05, "clip_ratio/region_mean": 0.0019409829255891964, "epoch": 0.0419998950002625, "grad_norm": 0.11985485255718231, "learning_rate": 2e-07, "loss": 0.034, "step": 450 }, { "clip_ratio/high_max": 0.0021616015292238444, "clip_ratio/high_mean": 0.0009408148507645819, "clip_ratio/low_mean": 0.0008765257953200489, "clip_ratio/low_min": 6.220471004780848e-05, "clip_ratio/region_mean": 0.001817340642446652, "epoch": 0.042093228100263086, "grad_norm": 0.12438426166772842, "learning_rate": 2e-07, "loss": 0.0258, "step": 451 }, { "clip_ratio/high_max": 0.002138797572115436, "clip_ratio/high_mean": 0.0009013525414047763, "clip_ratio/low_mean": 0.0008483078909193864, "clip_ratio/low_min": 7.034827012830647e-05, "clip_ratio/region_mean": 0.0017496604632469825, "epoch": 0.042186561200263664, "grad_norm": 0.10961660742759705, "learning_rate": 2e-07, "loss": 0.021, "step": 452 }, { "clip_ratio/high_max": 0.00241413529147394, "clip_ratio/high_mean": 0.0009270201298932079, "clip_ratio/low_mean": 0.0010248750622849911, "clip_ratio/low_min": 7.968538193381391e-05, "clip_ratio/region_mean": 0.0019518951594363898, "epoch": 0.04227989430026425, "grad_norm": 0.11330097913742065, "learning_rate": 2e-07, "loss": 0.0614, "step": 453 }, { "clip_ratio/high_max": 0.0021824804571224377, "clip_ratio/high_mean": 0.0009401545230502961, "clip_ratio/low_mean": 0.0009193636215059087, "clip_ratio/low_min": 3.213102036170312e-05, "clip_ratio/region_mean": 0.0018595181390992366, "epoch": 0.042373227400264835, "grad_norm": 0.10737673938274384, "learning_rate": 2e-07, "loss": 0.0241, "step": 454 }, { "clip_ratio/high_max": 0.0021936208868282847, "clip_ratio/high_mean": 0.0009180554152408149, "clip_ratio/low_mean": 0.0009310017285315553, "clip_ratio/low_min": 0.0001381685606247629, "clip_ratio/region_mean": 0.0018490571310394444, "epoch": 0.04246656050026541, "grad_norm": 0.11896377056837082, "learning_rate": 2e-07, "loss": 0.0252, "step": 455 }, { "clip_ratio/high_max": 0.002144321617379319, "clip_ratio/high_mean": 0.0009210318803525297, "clip_ratio/low_mean": 0.0010062951332656667, "clip_ratio/low_min": 0.00010806756108650006, "clip_ratio/region_mean": 0.0019273269426776096, "epoch": 0.042559893600266, "grad_norm": 0.11582513153553009, "learning_rate": 2e-07, "loss": 0.0316, "step": 456 }, { "clip_ratio/high_max": 0.0022139010616228916, "clip_ratio/high_mean": 0.0009115631473832764, "clip_ratio/low_mean": 0.0009167484404315474, "clip_ratio/low_min": 0.0001769062901075813, "clip_ratio/region_mean": 0.0018283115787198767, "epoch": 0.04265322670026658, "grad_norm": 0.11867281794548035, "learning_rate": 2e-07, "loss": 0.034, "step": 457 }, { "clip_ratio/high_max": 0.0020464750778046437, "clip_ratio/high_mean": 0.0008635583290015347, "clip_ratio/low_mean": 0.0009120242539211176, "clip_ratio/low_min": 0.00014250197455112357, "clip_ratio/region_mean": 0.0017755825683707371, "epoch": 0.04274655980026717, "grad_norm": 0.11845026165246964, "learning_rate": 2e-07, "loss": 0.0501, "step": 458 }, { "clip_ratio/high_max": 0.002209846250480041, "clip_ratio/high_mean": 0.0009212306486006128, "clip_ratio/low_mean": 0.0010026660384028219, "clip_ratio/low_min": 0.00013555366149375914, "clip_ratio/region_mean": 0.0019238966633565724, "epoch": 0.04283989290026775, "grad_norm": 0.12998808920383453, "learning_rate": 2e-07, "loss": 0.0434, "step": 459 }, { "clip_ratio/high_max": 0.0020460384330363013, "clip_ratio/high_mean": 0.0008804322333162418, "clip_ratio/low_mean": 0.0008743912162572087, "clip_ratio/low_min": 9.421625327377114e-05, "clip_ratio/region_mean": 0.001754823446390219, "epoch": 0.04293322600026833, "grad_norm": 0.11413136124610901, "learning_rate": 2e-07, "loss": 0.0352, "step": 460 }, { "clip_ratio/high_max": 0.0024610085238236934, "clip_ratio/high_mean": 0.0010141287348233163, "clip_ratio/low_mean": 0.000997321170871146, "clip_ratio/low_min": 0.00018923719835584052, "clip_ratio/region_mean": 0.0020114498838665895, "epoch": 0.04302655910026892, "grad_norm": 0.11709766089916229, "learning_rate": 2e-07, "loss": 0.0151, "step": 461 }, { "clip_ratio/high_max": 0.0022989178978605196, "clip_ratio/high_mean": 0.0009646581493143458, "clip_ratio/low_mean": 0.0011497753312141867, "clip_ratio/low_min": 9.352730012324173e-05, "clip_ratio/region_mean": 0.0021144334750715643, "epoch": 0.0431198922002695, "grad_norm": 0.1256629079580307, "learning_rate": 2e-07, "loss": 0.0071, "step": 462 }, { "clip_ratio/high_max": 0.0019255525257904083, "clip_ratio/high_mean": 0.0008831911909510382, "clip_ratio/low_mean": 0.0010735645046224818, "clip_ratio/low_min": 0.0001923193940456258, "clip_ratio/region_mean": 0.0019567557174013928, "epoch": 0.04321322530027008, "grad_norm": 0.12042519450187683, "learning_rate": 2e-07, "loss": 0.0425, "step": 463 }, { "clip_ratio/high_max": 0.0019485442244331352, "clip_ratio/high_mean": 0.0009593006270733895, "clip_ratio/low_mean": 0.0009012777663883753, "clip_ratio/low_min": 0.00016508120916114422, "clip_ratio/region_mean": 0.0018605783188831992, "epoch": 0.043306558400270666, "grad_norm": 0.12611928582191467, "learning_rate": 2e-07, "loss": 0.0114, "step": 464 }, { "clip_ratio/high_max": 0.0022179900406626984, "clip_ratio/high_mean": 0.0009755862920428626, "clip_ratio/low_mean": 0.0009026952284330036, "clip_ratio/low_min": 6.922899956407491e-05, "clip_ratio/region_mean": 0.0018782815313898027, "epoch": 0.04339989150027125, "grad_norm": 0.11388153582811356, "learning_rate": 2e-07, "loss": 0.0243, "step": 465 }, { "clip_ratio/high_max": 0.0023382343169942033, "clip_ratio/high_mean": 0.0008779352783676586, "clip_ratio/low_mean": 0.0009325867813458899, "clip_ratio/low_min": 0.00014943218775442801, "clip_ratio/region_mean": 0.001810522036976181, "epoch": 0.04349322460027183, "grad_norm": 0.11013499647378922, "learning_rate": 2e-07, "loss": 0.0433, "step": 466 }, { "clip_ratio/high_max": 0.002099457306030672, "clip_ratio/high_mean": 0.0009266209926863667, "clip_ratio/low_mean": 0.0009762910522113089, "clip_ratio/low_min": 0.00015591298233630368, "clip_ratio/region_mean": 0.001902912037621718, "epoch": 0.043586557700272414, "grad_norm": 0.13048942387104034, "learning_rate": 2e-07, "loss": 0.0453, "step": 467 }, { "clip_ratio/high_max": 0.00210831017466262, "clip_ratio/high_mean": 0.0008640765154268593, "clip_ratio/low_mean": 0.0010127349032700295, "clip_ratio/low_min": 0.0001953134496943676, "clip_ratio/region_mean": 0.001876811460533645, "epoch": 0.043679890800273, "grad_norm": 0.12373574078083038, "learning_rate": 2e-07, "loss": 0.0419, "step": 468 }, { "clip_ratio/high_max": 0.0024139349116012454, "clip_ratio/high_mean": 0.0010290271220583236, "clip_ratio/low_mean": 0.0010587414617475588, "clip_ratio/low_min": 0.00018582042912385077, "clip_ratio/region_mean": 0.0020877685528830625, "epoch": 0.043773223900273585, "grad_norm": 0.12545520067214966, "learning_rate": 2e-07, "loss": 0.0334, "step": 469 }, { "clip_ratio/high_max": 0.0027297762426314875, "clip_ratio/high_mean": 0.001106985397200333, "clip_ratio/low_mean": 0.0009402073483215645, "clip_ratio/low_min": 0.00020883239903923823, "clip_ratio/region_mean": 0.002047192770987749, "epoch": 0.04386655700027416, "grad_norm": 0.17388267815113068, "learning_rate": 2e-07, "loss": 0.0373, "step": 470 }, { "clip_ratio/high_max": 0.0018081994057865813, "clip_ratio/high_mean": 0.0008842006900522392, "clip_ratio/low_mean": 0.0008840818409225903, "clip_ratio/low_min": 0.0001485763532400597, "clip_ratio/region_mean": 0.0017682825855445117, "epoch": 0.04395989010027475, "grad_norm": 0.11366170644760132, "learning_rate": 2e-07, "loss": 0.0338, "step": 471 }, { "clip_ratio/high_max": 0.0023621447398909368, "clip_ratio/high_mean": 0.000940713080126443, "clip_ratio/low_mean": 0.000869792012963444, "clip_ratio/low_min": 4.750264724862063e-05, "clip_ratio/region_mean": 0.0018105050949088763, "epoch": 0.044053223200275334, "grad_norm": 0.10999000817537308, "learning_rate": 2e-07, "loss": 0.0192, "step": 472 }, { "clip_ratio/high_max": 0.0019479558868624736, "clip_ratio/high_mean": 0.00085053551265446, "clip_ratio/low_mean": 0.001027277990942821, "clip_ratio/low_min": 0.00018294409619556973, "clip_ratio/region_mean": 0.0018778135199681856, "epoch": 0.04414655630027592, "grad_norm": 0.11391984671354294, "learning_rate": 2e-07, "loss": 0.0559, "step": 473 }, { "clip_ratio/high_max": 0.002073125884635374, "clip_ratio/high_mean": 0.0008823675780149642, "clip_ratio/low_mean": 0.0008705244363227393, "clip_ratio/low_min": 4.958643603458768e-05, "clip_ratio/region_mean": 0.0017528920216136612, "epoch": 0.0442398894002765, "grad_norm": 0.1216319128870964, "learning_rate": 2e-07, "loss": 0.0144, "step": 474 }, { "clip_ratio/high_max": 0.00205260169605026, "clip_ratio/high_mean": 0.0008592520771344425, "clip_ratio/low_mean": 0.0010394599485152867, "clip_ratio/low_min": 0.00017994870904658455, "clip_ratio/region_mean": 0.001898712056572549, "epoch": 0.04433322250027708, "grad_norm": 0.11355572938919067, "learning_rate": 2e-07, "loss": 0.0364, "step": 475 }, { "clip_ratio/high_max": 0.0021929314243607223, "clip_ratio/high_mean": 0.0008556158918509027, "clip_ratio/low_mean": 0.0009467831350775668, "clip_ratio/low_min": 0.00011022945909644477, "clip_ratio/region_mean": 0.0018023989759967662, "epoch": 0.04442655560027767, "grad_norm": 0.11866224557161331, "learning_rate": 2e-07, "loss": 0.0231, "step": 476 }, { "clip_ratio/high_max": 0.00221455171413254, "clip_ratio/high_mean": 0.0009223656888934784, "clip_ratio/low_mean": 0.0009960194038285408, "clip_ratio/low_min": 0.00016828899015308707, "clip_ratio/region_mean": 0.0019183851400157437, "epoch": 0.04451988870027825, "grad_norm": 0.12050988525152206, "learning_rate": 2e-07, "loss": 0.0225, "step": 477 }, { "clip_ratio/high_max": 0.0022348541097017005, "clip_ratio/high_mean": 0.0009680452840257203, "clip_ratio/low_mean": 0.0009097687861867598, "clip_ratio/low_min": 0.00011333133261359762, "clip_ratio/region_mean": 0.001877814094768837, "epoch": 0.04461322180027883, "grad_norm": 0.11138606071472168, "learning_rate": 2e-07, "loss": 0.0154, "step": 478 }, { "clip_ratio/high_max": 0.002229319725302048, "clip_ratio/high_mean": 0.0009144981395365903, "clip_ratio/low_mean": 0.001053465824952582, "clip_ratio/low_min": 0.0001138521879511245, "clip_ratio/region_mean": 0.0019679640026879497, "epoch": 0.044706554900279416, "grad_norm": 0.12067735940217972, "learning_rate": 2e-07, "loss": 0.0421, "step": 479 }, { "clip_ratio/high_max": 0.002140239092113916, "clip_ratio/high_mean": 0.0009171433102892479, "clip_ratio/low_mean": 0.0009252726722479565, "clip_ratio/low_min": 5.008920834370656e-05, "clip_ratio/region_mean": 0.0018424159788992256, "epoch": 0.04479988800028, "grad_norm": 0.11382362991571426, "learning_rate": 2e-07, "loss": 0.0171, "step": 480 }, { "clip_ratio/high_max": 0.002166224687243812, "clip_ratio/high_mean": 0.0008646585956739727, "clip_ratio/low_mean": 0.0009478742504143156, "clip_ratio/low_min": 0.00015850094496272504, "clip_ratio/region_mean": 0.0018125327915186062, "epoch": 0.04489322110028058, "grad_norm": 0.11516925692558289, "learning_rate": 2e-07, "loss": 0.023, "step": 481 }, { "clip_ratio/high_max": 0.001986334318644367, "clip_ratio/high_mean": 0.0008319666558236349, "clip_ratio/low_mean": 0.000936768738029059, "clip_ratio/low_min": 5.1922185775765684e-05, "clip_ratio/region_mean": 0.0017687353320070542, "epoch": 0.044986554200281165, "grad_norm": 0.11894405633211136, "learning_rate": 2e-07, "loss": 0.0407, "step": 482 }, { "clip_ratio/high_max": 0.002120238154020626, "clip_ratio/high_mean": 0.0008885429851943627, "clip_ratio/low_mean": 0.0009819078986765817, "clip_ratio/low_min": 0.0001684004018898122, "clip_ratio/region_mean": 0.0018704509056988172, "epoch": 0.04507988730028175, "grad_norm": 0.11477168649435043, "learning_rate": 2e-07, "loss": 0.0277, "step": 483 }, { "clip_ratio/high_max": 0.002143346944649238, "clip_ratio/high_mean": 0.0009694175605545752, "clip_ratio/low_mean": 0.0009247773577953922, "clip_ratio/low_min": 7.680441103730118e-05, "clip_ratio/region_mean": 0.0018941949383588508, "epoch": 0.045173220400282335, "grad_norm": 0.11659643054008484, "learning_rate": 2e-07, "loss": 0.0133, "step": 484 }, { "clip_ratio/high_max": 0.002132837093085982, "clip_ratio/high_mean": 0.000825136638013646, "clip_ratio/low_mean": 0.0011425291741034016, "clip_ratio/low_min": 0.00028873990959255025, "clip_ratio/region_mean": 0.0019676657902891748, "epoch": 0.04526655350028291, "grad_norm": 0.10420174896717072, "learning_rate": 2e-07, "loss": 0.0582, "step": 485 }, { "clip_ratio/high_max": 0.0020679763838415965, "clip_ratio/high_mean": 0.0009412703693669755, "clip_ratio/low_mean": 0.0009178398540825583, "clip_ratio/low_min": 8.744957722228719e-05, "clip_ratio/region_mean": 0.0018591101907077245, "epoch": 0.0453598866002835, "grad_norm": 0.10893837362527847, "learning_rate": 2e-07, "loss": 0.0474, "step": 486 }, { "clip_ratio/high_max": 0.0020363660223665647, "clip_ratio/high_mean": 0.0009555230171827134, "clip_ratio/low_mean": 0.0009983471918530995, "clip_ratio/low_min": 0.000107767842564499, "clip_ratio/region_mean": 0.001953870214492781, "epoch": 0.045453219700284084, "grad_norm": 0.11855454742908478, "learning_rate": 2e-07, "loss": 0.0426, "step": 487 }, { "clip_ratio/high_max": 0.0029045043120277114, "clip_ratio/high_mean": 0.0010617471452860627, "clip_ratio/low_mean": 0.000867701886818395, "clip_ratio/low_min": 7.592265774292173e-05, "clip_ratio/region_mean": 0.001929448997543659, "epoch": 0.04554655280028467, "grad_norm": 0.11618532240390778, "learning_rate": 2e-07, "loss": -0.0149, "step": 488 }, { "clip_ratio/high_max": 0.0020201062579872087, "clip_ratio/high_mean": 0.0009322421610704623, "clip_ratio/low_mean": 0.0009244990305887768, "clip_ratio/low_min": 0.00016264931309706299, "clip_ratio/region_mean": 0.0018567411971162073, "epoch": 0.04563988590028525, "grad_norm": 0.1189904510974884, "learning_rate": 2e-07, "loss": -0.0324, "step": 489 }, { "clip_ratio/high_max": 0.002198350070102606, "clip_ratio/high_mean": 0.000974449065324734, "clip_ratio/low_mean": 0.0010309704321116442, "clip_ratio/low_min": 0.00015754415835544933, "clip_ratio/region_mean": 0.0020054194537806325, "epoch": 0.04573321900028583, "grad_norm": 0.1326221227645874, "learning_rate": 2e-07, "loss": 0.0303, "step": 490 }, { "clip_ratio/high_max": 0.0024662960568093695, "clip_ratio/high_mean": 0.0009339979842479806, "clip_ratio/low_mean": 0.0009617586620151997, "clip_ratio/low_min": 7.105117947503459e-05, "clip_ratio/region_mean": 0.0018957566171593498, "epoch": 0.04582655210028642, "grad_norm": 0.11166379600763321, "learning_rate": 2e-07, "loss": 0.0097, "step": 491 }, { "clip_ratio/high_max": 0.002050291323030251, "clip_ratio/high_mean": 0.0008871729887687252, "clip_ratio/low_mean": 0.0010322477100999095, "clip_ratio/low_min": 0.00015301647636078997, "clip_ratio/region_mean": 0.00191942069795914, "epoch": 0.045919885200286996, "grad_norm": 0.11446750909090042, "learning_rate": 2e-07, "loss": 0.0398, "step": 492 }, { "clip_ratio/high_max": 0.002544161066907691, "clip_ratio/high_mean": 0.0011630978915491141, "clip_ratio/low_mean": 0.0009263232041121228, "clip_ratio/low_min": 8.957735190051608e-05, "clip_ratio/region_mean": 0.0020894210974802263, "epoch": 0.04601321830028758, "grad_norm": 0.11928210407495499, "learning_rate": 2e-07, "loss": -0.0251, "step": 493 }, { "clip_ratio/high_max": 0.0019681162884808145, "clip_ratio/high_mean": 0.0008900683969841339, "clip_ratio/low_mean": 0.0010363525107095484, "clip_ratio/low_min": 0.00010094350545841735, "clip_ratio/region_mean": 0.0019264209258835763, "epoch": 0.046106551400288166, "grad_norm": 0.10903050750494003, "learning_rate": 2e-07, "loss": 0.0095, "step": 494 }, { "clip_ratio/high_max": 0.002791699138469994, "clip_ratio/high_mean": 0.0009992235518438974, "clip_ratio/low_mean": 0.0010727971166488715, "clip_ratio/low_min": 0.00014006829496793216, "clip_ratio/region_mean": 0.0020720206084661186, "epoch": 0.04619988450028875, "grad_norm": 0.1235462948679924, "learning_rate": 2e-07, "loss": 0.0262, "step": 495 }, { "clip_ratio/high_max": 0.0020841166951868217, "clip_ratio/high_mean": 0.00082844902681245, "clip_ratio/low_mean": 0.0009151419653790072, "clip_ratio/low_min": 0.00019164422474204912, "clip_ratio/region_mean": 0.001743590968544595, "epoch": 0.04629321760028933, "grad_norm": 0.1149994283914566, "learning_rate": 2e-07, "loss": 0.0706, "step": 496 }, { "clip_ratio/high_max": 0.0024767620634520426, "clip_ratio/high_mean": 0.0010630735177983297, "clip_ratio/low_mean": 0.0009248447495338041, "clip_ratio/low_min": 9.780283198779216e-05, "clip_ratio/region_mean": 0.001987918240047293, "epoch": 0.046386550700289915, "grad_norm": 0.1132793202996254, "learning_rate": 2e-07, "loss": -0.0395, "step": 497 }, { "clip_ratio/high_max": 0.0021475156463566236, "clip_ratio/high_mean": 0.000862965740452637, "clip_ratio/low_mean": 0.0009245053224731237, "clip_ratio/low_min": 9.711377788335085e-05, "clip_ratio/region_mean": 0.001787471046554856, "epoch": 0.0464798838002905, "grad_norm": 0.1016230657696724, "learning_rate": 2e-07, "loss": 0.03, "step": 498 }, { "clip_ratio/high_max": 0.001783506519132061, "clip_ratio/high_mean": 0.0008245242688644794, "clip_ratio/low_mean": 0.0010365446814830648, "clip_ratio/low_min": 0.0001475501721870387, "clip_ratio/region_mean": 0.0018610689439810812, "epoch": 0.046573216900291085, "grad_norm": 0.11492468416690826, "learning_rate": 2e-07, "loss": 0.0031, "step": 499 }, { "clip_ratio/high_max": 0.0024618959723738953, "clip_ratio/high_mean": 0.0010416513614472933, "clip_ratio/low_mean": 0.0008654866578581277, "clip_ratio/low_min": 4.970522059011273e-05, "clip_ratio/region_mean": 0.0019071380156674422, "epoch": 0.046666550000291664, "grad_norm": 0.11126232892274857, "learning_rate": 2e-07, "loss": -0.022, "step": 500 }, { "clip_ratio/high_max": 0.0019976288749603555, "clip_ratio/high_mean": 0.0008553708303224994, "clip_ratio/low_mean": 0.0010246605961583555, "clip_ratio/low_min": 0.00011322105274302885, "clip_ratio/region_mean": 0.0018800314355758019, "epoch": 0.04675988310029225, "grad_norm": 0.12699399888515472, "learning_rate": 2e-07, "loss": 0.0354, "step": 501 }, { "clip_ratio/high_max": 0.0019075550990237389, "clip_ratio/high_mean": 0.0008621496235718951, "clip_ratio/low_mean": 0.0010251553831039928, "clip_ratio/low_min": 0.00014106210346653825, "clip_ratio/region_mean": 0.0018873049812100362, "epoch": 0.046853216200292834, "grad_norm": 0.11891791224479675, "learning_rate": 2e-07, "loss": 0.0558, "step": 502 }, { "clip_ratio/high_max": 0.0018460878782207146, "clip_ratio/high_mean": 0.0008638468771096086, "clip_ratio/low_mean": 0.0009977827576221898, "clip_ratio/low_min": 8.964342760009458e-05, "clip_ratio/region_mean": 0.0018616295856190845, "epoch": 0.04694654930029342, "grad_norm": 0.1134866327047348, "learning_rate": 2e-07, "loss": 0.0352, "step": 503 }, { "clip_ratio/high_max": 0.001998072271817364, "clip_ratio/high_mean": 0.0008923144268919714, "clip_ratio/low_mean": 0.000998801579044084, "clip_ratio/low_min": 0.00012666574366448913, "clip_ratio/region_mean": 0.0018911159713752568, "epoch": 0.047039882400294, "grad_norm": 0.1125430166721344, "learning_rate": 2e-07, "loss": 0.0434, "step": 504 }, { "clip_ratio/high_max": 0.0020540753539535217, "clip_ratio/high_mean": 0.0008668253631185507, "clip_ratio/low_mean": 0.0008940261759562418, "clip_ratio/low_min": 7.802612890372984e-05, "clip_ratio/region_mean": 0.0017608515481697395, "epoch": 0.04713321550029458, "grad_norm": 0.11267927289009094, "learning_rate": 2e-07, "loss": 0.0025, "step": 505 }, { "clip_ratio/high_max": 0.0025118121557170525, "clip_ratio/high_mean": 0.0009809604489419144, "clip_ratio/low_mean": 0.0009767942574399058, "clip_ratio/low_min": 9.083359327632934e-05, "clip_ratio/region_mean": 0.0019577547136577778, "epoch": 0.04722654860029517, "grad_norm": 0.11542227864265442, "learning_rate": 2e-07, "loss": -0.022, "step": 506 }, { "clip_ratio/high_max": 0.0024000634512049146, "clip_ratio/high_mean": 0.000889746817847481, "clip_ratio/low_mean": 0.001016148384223925, "clip_ratio/low_min": 7.079758142936043e-05, "clip_ratio/region_mean": 0.0019058952238992788, "epoch": 0.047319881700295746, "grad_norm": 0.12162056565284729, "learning_rate": 2e-07, "loss": 0.0366, "step": 507 }, { "clip_ratio/high_max": 0.0022882040284457617, "clip_ratio/high_mean": 0.001026135574647924, "clip_ratio/low_mean": 0.0010581682909105439, "clip_ratio/low_min": 0.0001280536189369741, "clip_ratio/region_mean": 0.002084303880110383, "epoch": 0.04741321480029633, "grad_norm": 0.11644841730594635, "learning_rate": 2e-07, "loss": 0.0318, "step": 508 }, { "clip_ratio/high_max": 0.002016646507399855, "clip_ratio/high_mean": 0.0009344866812170949, "clip_ratio/low_mean": 0.0009105880217248341, "clip_ratio/low_min": 3.803223717113724e-05, "clip_ratio/region_mean": 0.0018450747011229396, "epoch": 0.04750654790029692, "grad_norm": 0.10687410831451416, "learning_rate": 2e-07, "loss": -0.0229, "step": 509 }, { "clip_ratio/high_max": 0.0022560539218829945, "clip_ratio/high_mean": 0.0009600157009117538, "clip_ratio/low_mean": 0.0010200020151387434, "clip_ratio/low_min": 4.616065871232422e-05, "clip_ratio/region_mean": 0.001980017710593529, "epoch": 0.0475998810002975, "grad_norm": 0.12589336931705475, "learning_rate": 2e-07, "loss": 0.026, "step": 510 }, { "clip_ratio/high_max": 0.0018825599327101372, "clip_ratio/high_mean": 0.0008869830780895427, "clip_ratio/low_mean": 0.0010153740331588779, "clip_ratio/low_min": 8.951151039582328e-05, "clip_ratio/region_mean": 0.0019023571512661874, "epoch": 0.04769321410029808, "grad_norm": 0.11596434563398361, "learning_rate": 2e-07, "loss": 0.0263, "step": 511 }, { "clip_ratio/high_max": 0.0023212233572849073, "clip_ratio/high_mean": 0.0009241106918125297, "clip_ratio/low_mean": 0.0009564395440975204, "clip_ratio/low_min": 5.879187119717244e-05, "clip_ratio/region_mean": 0.0018805503059411421, "epoch": 0.047786547200298665, "grad_norm": 0.10420980304479599, "learning_rate": 2e-07, "loss": -0.0093, "step": 512 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.015380859375, "completions/max_length": 4096.0, "completions/max_terminated_length": 4080.0, "completions/mean_length": 619.6220703125, "completions/mean_terminated_length": 565.317138671875, "completions/min_length": 3.0, "completions/min_terminated_length": 3.0, "epoch": 0.04787988030029925, "grad_norm": 0.1249484196305275, "learning_rate": 2e-07, "loss": 0.0639, "num_tokens": 407105446.0, "reward": 0.54559326171875, "reward_std": 0.21903932094573975, "rewards/simpleverify_reward/mean": 0.54559326171875, "rewards/simpleverify_reward/std": 0.49791914224624634, "step": 513 }, { "clip_ratio/high_max": 0.0020474573830142617, "clip_ratio/high_mean": 0.0008239163071266375, "clip_ratio/low_mean": 0.0005554225226660492, "clip_ratio/low_min": 1.75168170244433e-05, "clip_ratio/region_mean": 0.0013793387734040152, "epoch": 0.047973213400299836, "grad_norm": 0.11516439914703369, "learning_rate": 2e-07, "loss": 0.0427, "step": 514 }, { "clip_ratio/high_max": 0.0018966534698847681, "clip_ratio/high_mean": 0.0007866157466196455, "clip_ratio/low_mean": 0.0005730286675316165, "clip_ratio/low_min": 3.494028715067543e-05, "clip_ratio/region_mean": 0.0013596444259746931, "epoch": 0.048066546500300414, "grad_norm": 0.13290849328041077, "learning_rate": 2e-07, "loss": 0.0382, "step": 515 }, { "clip_ratio/high_max": 0.0021555245766649023, "clip_ratio/high_mean": 0.000930577358303708, "clip_ratio/low_mean": 0.0004975831398041919, "clip_ratio/low_min": 1.7009559996949974e-05, "clip_ratio/region_mean": 0.0014281604999268893, "epoch": 0.048159879600301, "grad_norm": 0.1208842396736145, "learning_rate": 2e-07, "loss": 0.0114, "step": 516 }, { "clip_ratio/high_max": 0.0021955815464025363, "clip_ratio/high_mean": 0.0009184077971440274, "clip_ratio/low_mean": 0.0005446152526928927, "clip_ratio/low_min": 5.7050307077588513e-05, "clip_ratio/region_mean": 0.0014630230762122665, "epoch": 0.048253212700301584, "grad_norm": 8.951251029968262, "learning_rate": 2e-07, "loss": -0.0504, "step": 517 }, { "clip_ratio/high_max": 0.002353072828555014, "clip_ratio/high_mean": 0.0009427147924725432, "clip_ratio/low_mean": 0.0005549133638851345, "clip_ratio/low_min": 1.0660071893653367e-05, "clip_ratio/region_mean": 0.0014976281454437412, "epoch": 0.04834654580030216, "grad_norm": 0.10491771996021271, "learning_rate": 2e-07, "loss": 0.0033, "step": 518 }, { "clip_ratio/high_max": 0.0019460780313238502, "clip_ratio/high_mean": 0.0007836033655621577, "clip_ratio/low_mean": 0.0006949090548005188, "clip_ratio/low_min": 0.00010643061614246108, "clip_ratio/region_mean": 0.0014785124149057083, "epoch": 0.04843987890030275, "grad_norm": 0.11117449402809143, "learning_rate": 2e-07, "loss": 0.0427, "step": 519 }, { "clip_ratio/high_max": 0.0017422130877093878, "clip_ratio/high_mean": 0.0007207912858575583, "clip_ratio/low_mean": 0.0005812427843920887, "clip_ratio/low_min": 2.3959351892699488e-05, "clip_ratio/region_mean": 0.001302034088439541, "epoch": 0.04853321200030333, "grad_norm": 0.11444155871868134, "learning_rate": 2e-07, "loss": 0.0228, "step": 520 }, { "clip_ratio/high_max": 0.0019335887373017613, "clip_ratio/high_mean": 0.0007430577734339749, "clip_ratio/low_mean": 0.0006356650474117487, "clip_ratio/low_min": 6.929017308721086e-05, "clip_ratio/region_mean": 0.0013787228090222925, "epoch": 0.04862654510030392, "grad_norm": 0.1354903280735016, "learning_rate": 2e-07, "loss": 0.0804, "step": 521 }, { "clip_ratio/high_max": 0.0020491522809606977, "clip_ratio/high_mean": 0.000841398345073685, "clip_ratio/low_mean": 0.0006478106042777654, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0014892089457134716, "epoch": 0.048719878200304496, "grad_norm": 0.11569122225046158, "learning_rate": 2e-07, "loss": 0.0139, "step": 522 }, { "clip_ratio/high_max": 0.0021278261265251786, "clip_ratio/high_mean": 0.0008932984364946606, "clip_ratio/low_mean": 0.0007110550086508738, "clip_ratio/low_min": 8.056410206336295e-05, "clip_ratio/region_mean": 0.0016043534560594708, "epoch": 0.04881321130030508, "grad_norm": 0.12606088817119598, "learning_rate": 2e-07, "loss": 0.0484, "step": 523 }, { "clip_ratio/high_max": 0.0022304598678601906, "clip_ratio/high_mean": 0.0009553815179970115, "clip_ratio/low_mean": 0.0005801243787573185, "clip_ratio/low_min": 3.298702449683333e-05, "clip_ratio/region_mean": 0.0015355058822024148, "epoch": 0.04890654440030567, "grad_norm": 0.11702584475278854, "learning_rate": 2e-07, "loss": -0.0316, "step": 524 }, { "clip_ratio/high_max": 0.0019979728022008203, "clip_ratio/high_mean": 0.0008308313153975178, "clip_ratio/low_mean": 0.000683303351252107, "clip_ratio/low_min": 1.5311121387640014e-05, "clip_ratio/region_mean": 0.00151413468120154, "epoch": 0.04899987750030625, "grad_norm": 0.12649109959602356, "learning_rate": 2e-07, "loss": 0.0409, "step": 525 }, { "clip_ratio/high_max": 0.00236291901092045, "clip_ratio/high_mean": 0.0010270862403558567, "clip_ratio/low_mean": 0.0006326909042400075, "clip_ratio/low_min": 5.130766930960817e-05, "clip_ratio/region_mean": 0.0016597771318629384, "epoch": 0.04909321060030683, "grad_norm": 0.12152663618326187, "learning_rate": 2e-07, "loss": 0.0102, "step": 526 }, { "clip_ratio/high_max": 0.0016582118732912932, "clip_ratio/high_mean": 0.0006913995530339889, "clip_ratio/low_mean": 0.0007755259866826236, "clip_ratio/low_min": 0.00010343870690121548, "clip_ratio/region_mean": 0.001466925510612782, "epoch": 0.049186543700307415, "grad_norm": 0.1052582710981369, "learning_rate": 2e-07, "loss": 0.0766, "step": 527 }, { "clip_ratio/high_max": 0.0021492439773282968, "clip_ratio/high_mean": 0.0008418255292781396, "clip_ratio/low_mean": 0.0004967712420693715, "clip_ratio/low_min": 2.176909129047999e-05, "clip_ratio/region_mean": 0.0013385967977228574, "epoch": 0.049279876800308, "grad_norm": 0.12021954357624054, "learning_rate": 2e-07, "loss": 0.0076, "step": 528 }, { "clip_ratio/high_max": 0.0018337889123358764, "clip_ratio/high_mean": 0.0007555235424661078, "clip_ratio/low_mean": 0.000737603264497011, "clip_ratio/low_min": 5.2281705393397715e-05, "clip_ratio/region_mean": 0.0014931268087821081, "epoch": 0.049373209900308586, "grad_norm": 0.11225282400846481, "learning_rate": 2e-07, "loss": 0.0514, "step": 529 }, { "clip_ratio/high_max": 0.0018649838093551807, "clip_ratio/high_mean": 0.0008285973090096377, "clip_ratio/low_mean": 0.0006624951638514176, "clip_ratio/low_min": 4.856254963669926e-05, "clip_ratio/region_mean": 0.0014910924437572248, "epoch": 0.049466543000309164, "grad_norm": 0.1083546131849289, "learning_rate": 2e-07, "loss": -0.011, "step": 530 }, { "clip_ratio/high_max": 0.002233852879726328, "clip_ratio/high_mean": 0.0009874441329884576, "clip_ratio/low_mean": 0.0007484307607228402, "clip_ratio/low_min": 0.0001460163293813821, "clip_ratio/region_mean": 0.0017358748882543296, "epoch": 0.04955987610030975, "grad_norm": 0.11867433041334152, "learning_rate": 2e-07, "loss": 0.0114, "step": 531 }, { "clip_ratio/high_max": 0.002101485777529888, "clip_ratio/high_mean": 0.0009654631503508426, "clip_ratio/low_mean": 0.0007567998954982613, "clip_ratio/low_min": 6.56810479995329e-05, "clip_ratio/region_mean": 0.0017222630413016304, "epoch": 0.049653209200310335, "grad_norm": 0.12591029703617096, "learning_rate": 2e-07, "loss": -0.0325, "step": 532 }, { "clip_ratio/high_max": 0.002063210544292815, "clip_ratio/high_mean": 0.0009547157351335045, "clip_ratio/low_mean": 0.0007278986067831283, "clip_ratio/low_min": 8.335960455951863e-05, "clip_ratio/region_mean": 0.001682614347373601, "epoch": 0.04974654230031091, "grad_norm": 0.11194096505641937, "learning_rate": 2e-07, "loss": -0.0134, "step": 533 }, { "clip_ratio/high_max": 0.002131147099134978, "clip_ratio/high_mean": 0.0009507867980573792, "clip_ratio/low_mean": 0.0007607934840052621, "clip_ratio/low_min": 0.00012364546000753762, "clip_ratio/region_mean": 0.0017115802693297155, "epoch": 0.0498398754003115, "grad_norm": 0.12011602520942688, "learning_rate": 2e-07, "loss": 0.002, "step": 534 }, { "clip_ratio/high_max": 0.0023105600303097162, "clip_ratio/high_mean": 0.0008917345494410256, "clip_ratio/low_mean": 0.0007742356665403349, "clip_ratio/low_min": 8.055868420342449e-05, "clip_ratio/region_mean": 0.0016659702596371062, "epoch": 0.04993320850031208, "grad_norm": 0.115916408598423, "learning_rate": 2e-07, "loss": 0.0413, "step": 535 }, { "clip_ratio/high_max": 0.0016676672894391231, "clip_ratio/high_mean": 0.0007589723772980506, "clip_ratio/low_mean": 0.000746526933653513, "clip_ratio/low_min": 8.771644434091286e-05, "clip_ratio/region_mean": 0.0015054993018566165, "epoch": 0.05002654160031267, "grad_norm": 0.10498738288879395, "learning_rate": 2e-07, "loss": 0.0294, "step": 536 }, { "clip_ratio/high_max": 0.0024208100949181244, "clip_ratio/high_mean": 0.0009587153381289681, "clip_ratio/low_mean": 0.0007878507185523631, "clip_ratio/low_min": 2.3066188077791594e-05, "clip_ratio/region_mean": 0.0017465660857851617, "epoch": 0.05011987470031325, "grad_norm": 0.1192055344581604, "learning_rate": 2e-07, "loss": 0.0397, "step": 537 }, { "clip_ratio/high_max": 0.0021170762920519337, "clip_ratio/high_mean": 0.0009136065855273046, "clip_ratio/low_mean": 0.0007115834414435085, "clip_ratio/low_min": 2.5180779630318284e-05, "clip_ratio/region_mean": 0.0016251900524366647, "epoch": 0.05021320780031383, "grad_norm": 0.11429329216480255, "learning_rate": 2e-07, "loss": 0.0482, "step": 538 }, { "clip_ratio/high_max": 0.0023239120055222884, "clip_ratio/high_mean": 0.0009998277928389143, "clip_ratio/low_mean": 0.0008660658932058141, "clip_ratio/low_min": 2.5096071567531908e-05, "clip_ratio/region_mean": 0.0018658937042346224, "epoch": 0.05030654090031442, "grad_norm": 0.12397728860378265, "learning_rate": 2e-07, "loss": 0.0475, "step": 539 }, { "clip_ratio/high_max": 0.002159439136448782, "clip_ratio/high_mean": 0.0008969422706286423, "clip_ratio/low_mean": 0.000861676424392499, "clip_ratio/low_min": 4.1730730117706116e-05, "clip_ratio/region_mean": 0.0017586186695552897, "epoch": 0.050399874000315, "grad_norm": 0.12380772829055786, "learning_rate": 2e-07, "loss": 0.0246, "step": 540 }, { "clip_ratio/high_max": 0.002097133648931049, "clip_ratio/high_mean": 0.0009343938545498531, "clip_ratio/low_mean": 0.000825334143883083, "clip_ratio/low_min": 7.041940261842683e-05, "clip_ratio/region_mean": 0.0017597279875189997, "epoch": 0.05049320710031558, "grad_norm": 0.11874108016490936, "learning_rate": 2e-07, "loss": 0.0053, "step": 541 }, { "clip_ratio/high_max": 0.0024011186687857844, "clip_ratio/high_mean": 0.0010517803784750868, "clip_ratio/low_mean": 0.0007826008077245206, "clip_ratio/low_min": 8.263272138719913e-05, "clip_ratio/region_mean": 0.001834381153457798, "epoch": 0.050586540200316166, "grad_norm": 0.11690741777420044, "learning_rate": 2e-07, "loss": 0.0182, "step": 542 }, { "clip_ratio/high_max": 0.0021468082486535423, "clip_ratio/high_mean": 0.0008459979162580566, "clip_ratio/low_mean": 0.0008452306810795562, "clip_ratio/low_min": 0.0001053713021974545, "clip_ratio/region_mean": 0.0016912286300794221, "epoch": 0.05067987330031675, "grad_norm": 0.11066032946109772, "learning_rate": 2e-07, "loss": 0.0411, "step": 543 }, { "clip_ratio/high_max": 0.0021998991251166444, "clip_ratio/high_mean": 0.0008864237661327934, "clip_ratio/low_mean": 0.0009112051830015844, "clip_ratio/low_min": 4.105756943317829e-05, "clip_ratio/region_mean": 0.0017976290255319327, "epoch": 0.05077320640031733, "grad_norm": 0.1181308776140213, "learning_rate": 2e-07, "loss": 0.0395, "step": 544 }, { "clip_ratio/high_max": 0.0021576228537014686, "clip_ratio/high_mean": 0.0008953752385423286, "clip_ratio/low_mean": 0.0008976412646006793, "clip_ratio/low_min": 0.00010781910896184854, "clip_ratio/region_mean": 0.0017930165049619973, "epoch": 0.050866539500317914, "grad_norm": 0.11932957172393799, "learning_rate": 2e-07, "loss": 0.0335, "step": 545 }, { "clip_ratio/high_max": 0.002208736856118776, "clip_ratio/high_mean": 0.0009116104993154295, "clip_ratio/low_mean": 0.0008198049326892942, "clip_ratio/low_min": 3.338253009133041e-05, "clip_ratio/region_mean": 0.0017314154538325965, "epoch": 0.0509598726003185, "grad_norm": 0.11894290149211884, "learning_rate": 2e-07, "loss": 0.0339, "step": 546 }, { "clip_ratio/high_max": 0.0018048475758405402, "clip_ratio/high_mean": 0.0007394633448711829, "clip_ratio/low_mean": 0.0008841771668812726, "clip_ratio/low_min": 5.9546148804656696e-05, "clip_ratio/region_mean": 0.001623640509933466, "epoch": 0.051053205700319085, "grad_norm": 0.12036183476448059, "learning_rate": 2e-07, "loss": 0.0607, "step": 547 }, { "clip_ratio/high_max": 0.0019977466072305106, "clip_ratio/high_mean": 0.0007656978514205548, "clip_ratio/low_mean": 0.0009487922816333594, "clip_ratio/low_min": 9.224892528436612e-05, "clip_ratio/region_mean": 0.0017144901357823983, "epoch": 0.05114653880031966, "grad_norm": 0.11514570564031601, "learning_rate": 2e-07, "loss": 0.0264, "step": 548 }, { "clip_ratio/high_max": 0.002192864882090362, "clip_ratio/high_mean": 0.000971686507909908, "clip_ratio/low_mean": 0.0009848649606283288, "clip_ratio/low_min": 0.00013279655013320735, "clip_ratio/region_mean": 0.0019565514085115865, "epoch": 0.05123987190032025, "grad_norm": 0.11713724583387375, "learning_rate": 2e-07, "loss": 0.0467, "step": 549 }, { "clip_ratio/high_max": 0.00207652079188847, "clip_ratio/high_mean": 0.0009597385069355369, "clip_ratio/low_mean": 0.0008380981817026623, "clip_ratio/low_min": 9.198378847941058e-05, "clip_ratio/region_mean": 0.0017978367141040508, "epoch": 0.05133320500032083, "grad_norm": 0.11240042001008987, "learning_rate": 2e-07, "loss": 0.0207, "step": 550 }, { "clip_ratio/high_max": 0.002158055311156204, "clip_ratio/high_mean": 0.0009785837301024003, "clip_ratio/low_mean": 0.0008309366530738771, "clip_ratio/low_min": 0.00012444339290595963, "clip_ratio/region_mean": 0.0018095203959092032, "epoch": 0.05142653810032142, "grad_norm": 0.11792036890983582, "learning_rate": 2e-07, "loss": 0.0348, "step": 551 }, { "clip_ratio/high_max": 0.0019930229100282304, "clip_ratio/high_mean": 0.0008410440796069452, "clip_ratio/low_mean": 0.0007813269403413869, "clip_ratio/low_min": 3.7099203836987726e-05, "clip_ratio/region_mean": 0.0016223710335907526, "epoch": 0.051519871200322, "grad_norm": 0.11646736413240433, "learning_rate": 2e-07, "loss": 0.0506, "step": 552 }, { "clip_ratio/high_max": 0.0020072338375030085, "clip_ratio/high_mean": 0.0009419335292477626, "clip_ratio/low_mean": 0.0009087666676350636, "clip_ratio/low_min": 0.00011563887528609484, "clip_ratio/region_mean": 0.0018507001805119216, "epoch": 0.05161320430032258, "grad_norm": 0.10690699517726898, "learning_rate": 2e-07, "loss": -0.0223, "step": 553 }, { "clip_ratio/high_max": 0.0021032825898146257, "clip_ratio/high_mean": 0.0008944293495005695, "clip_ratio/low_mean": 0.0009180684137390926, "clip_ratio/low_min": 0.00011040256140404381, "clip_ratio/region_mean": 0.0018124977650586516, "epoch": 0.05170653740032317, "grad_norm": 0.1242905706167221, "learning_rate": 2e-07, "loss": 0.021, "step": 554 }, { "clip_ratio/high_max": 0.0022934982625884004, "clip_ratio/high_mean": 0.0009107690930250101, "clip_ratio/low_mean": 0.0008404621257795952, "clip_ratio/low_min": 9.424061408935813e-05, "clip_ratio/region_mean": 0.0017512312115286477, "epoch": 0.05179987050032375, "grad_norm": 0.11362404376268387, "learning_rate": 2e-07, "loss": 0.0091, "step": 555 }, { "clip_ratio/high_max": 0.0018486931257939432, "clip_ratio/high_mean": 0.0007768372870486928, "clip_ratio/low_mean": 0.0009042385827342514, "clip_ratio/low_min": 9.784503436094383e-05, "clip_ratio/region_mean": 0.0016810758752399124, "epoch": 0.05189320360032433, "grad_norm": 0.11175607889890671, "learning_rate": 2e-07, "loss": 0.0408, "step": 556 }, { "clip_ratio/high_max": 0.0019550913748389576, "clip_ratio/high_mean": 0.0008990437199827284, "clip_ratio/low_mean": 0.0008994307572720572, "clip_ratio/low_min": 6.972391474846518e-05, "clip_ratio/region_mean": 0.0017984744627028704, "epoch": 0.051986536700324916, "grad_norm": 0.11491791158914566, "learning_rate": 2e-07, "loss": 0.0131, "step": 557 }, { "clip_ratio/high_max": 0.002340992505196482, "clip_ratio/high_mean": 0.0010490290806046687, "clip_ratio/low_mean": 0.0008616599334345665, "clip_ratio/low_min": 9.914558722812217e-05, "clip_ratio/region_mean": 0.0019106890104012564, "epoch": 0.0520798698003255, "grad_norm": 0.12155648320913315, "learning_rate": 2e-07, "loss": -0.034, "step": 558 }, { "clip_ratio/high_max": 0.002293695812113583, "clip_ratio/high_mean": 0.0009495897520537255, "clip_ratio/low_mean": 0.0008371381263714284, "clip_ratio/low_min": 0.00011380048727005487, "clip_ratio/region_mean": 0.001786727923899889, "epoch": 0.05217320290032608, "grad_norm": 0.12462866306304932, "learning_rate": 2e-07, "loss": 0.0503, "step": 559 }, { "clip_ratio/high_max": 0.0022549406421603635, "clip_ratio/high_mean": 0.0008963701202446828, "clip_ratio/low_mean": 0.000818770966361626, "clip_ratio/low_min": 8.798808994470164e-05, "clip_ratio/region_mean": 0.0017151410866063088, "epoch": 0.052266536000326665, "grad_norm": 0.11171950399875641, "learning_rate": 2e-07, "loss": 0.0074, "step": 560 }, { "clip_ratio/high_max": 0.0019454746798146516, "clip_ratio/high_mean": 0.0008578849010518752, "clip_ratio/low_mean": 0.0010321286317775957, "clip_ratio/low_min": 6.797461355745327e-05, "clip_ratio/region_mean": 0.0018900135401054285, "epoch": 0.05235986910032725, "grad_norm": 0.10680074244737625, "learning_rate": 2e-07, "loss": 0.0749, "step": 561 }, { "clip_ratio/high_max": 0.0024539571386412717, "clip_ratio/high_mean": 0.0010209035281150136, "clip_ratio/low_mean": 0.0008800053128652507, "clip_ratio/low_min": 8.657255057187285e-05, "clip_ratio/region_mean": 0.0019009088427992538, "epoch": 0.052453202200327835, "grad_norm": 0.11294497549533844, "learning_rate": 2e-07, "loss": -0.0048, "step": 562 }, { "clip_ratio/high_max": 0.0023167698600445874, "clip_ratio/high_mean": 0.001069298439688282, "clip_ratio/low_mean": 0.0007506689726142213, "clip_ratio/low_min": 4.282034842617577e-05, "clip_ratio/region_mean": 0.001819967401388567, "epoch": 0.05254653530032841, "grad_norm": 0.12658095359802246, "learning_rate": 2e-07, "loss": -0.0042, "step": 563 }, { "clip_ratio/high_max": 0.001922028823173605, "clip_ratio/high_mean": 0.0008675252684042789, "clip_ratio/low_mean": 0.0009345753351226449, "clip_ratio/low_min": 0.00017335566553811077, "clip_ratio/region_mean": 0.0018021005889750086, "epoch": 0.052639868400329, "grad_norm": 0.11058972775936127, "learning_rate": 2e-07, "loss": 0.0255, "step": 564 }, { "clip_ratio/high_max": 0.0017740512848831713, "clip_ratio/high_mean": 0.0007401819675578736, "clip_ratio/low_mean": 0.000998289484414272, "clip_ratio/low_min": 0.00011004591851815348, "clip_ratio/region_mean": 0.001738471444696188, "epoch": 0.052733201500329584, "grad_norm": 0.10528402775526047, "learning_rate": 2e-07, "loss": 0.0625, "step": 565 }, { "clip_ratio/high_max": 0.002348029214772396, "clip_ratio/high_mean": 0.0009806530015339376, "clip_ratio/low_mean": 0.0008557406508771237, "clip_ratio/low_min": 8.909490406949772e-05, "clip_ratio/region_mean": 0.0018363936032983474, "epoch": 0.05282653460033017, "grad_norm": 0.11347829550504684, "learning_rate": 2e-07, "loss": 0.0036, "step": 566 }, { "clip_ratio/high_max": 0.002062040839518886, "clip_ratio/high_mean": 0.0008136943870340474, "clip_ratio/low_mean": 0.0009444121260457905, "clip_ratio/low_min": 0.0001790724936654442, "clip_ratio/region_mean": 0.0017581065330887213, "epoch": 0.05291986770033075, "grad_norm": 0.11951661109924316, "learning_rate": 2e-07, "loss": 0.0078, "step": 567 }, { "clip_ratio/high_max": 0.0019190219354641158, "clip_ratio/high_mean": 0.000836508812426473, "clip_ratio/low_mean": 0.0009748148786457023, "clip_ratio/low_min": 6.62891479805694e-05, "clip_ratio/region_mean": 0.0018113237092620693, "epoch": 0.05301320080033133, "grad_norm": 0.10618489235639572, "learning_rate": 2e-07, "loss": 0.0298, "step": 568 }, { "clip_ratio/high_max": 0.002280811604578048, "clip_ratio/high_mean": 0.0009553527888783719, "clip_ratio/low_mean": 0.0009150287751253927, "clip_ratio/low_min": 5.315143152984092e-05, "clip_ratio/region_mean": 0.0018703815512708388, "epoch": 0.05310653390033192, "grad_norm": 0.11487512290477753, "learning_rate": 2e-07, "loss": 0.0372, "step": 569 }, { "clip_ratio/high_max": 0.002143306664947886, "clip_ratio/high_mean": 0.0008930126205086708, "clip_ratio/low_mean": 0.0008852437549649039, "clip_ratio/low_min": 0.0001049039710778743, "clip_ratio/region_mean": 0.0017782563663786277, "epoch": 0.053199867000332496, "grad_norm": 0.11438082903623581, "learning_rate": 2e-07, "loss": -0.0186, "step": 570 }, { "clip_ratio/high_max": 0.0021715780676458962, "clip_ratio/high_mean": 0.0009025206072692527, "clip_ratio/low_mean": 0.0008652216529299039, "clip_ratio/low_min": 0.00011199818891327595, "clip_ratio/region_mean": 0.0017677422874839976, "epoch": 0.05329320010033308, "grad_norm": 0.12410159409046173, "learning_rate": 2e-07, "loss": 0.0151, "step": 571 }, { "clip_ratio/high_max": 0.0021000182641728316, "clip_ratio/high_mean": 0.0009290268662880408, "clip_ratio/low_mean": 0.0009231869244104018, "clip_ratio/low_min": 0.00015483707556995796, "clip_ratio/region_mean": 0.0018522137688705698, "epoch": 0.053386533200333666, "grad_norm": 0.11413950473070145, "learning_rate": 2e-07, "loss": 0.0335, "step": 572 }, { "clip_ratio/high_max": 0.0023188894556369632, "clip_ratio/high_mean": 0.0010376073769293725, "clip_ratio/low_mean": 0.0007957654142956017, "clip_ratio/low_min": 4.427603380463552e-05, "clip_ratio/region_mean": 0.0018333728075958788, "epoch": 0.05347986630033425, "grad_norm": 0.11095670610666275, "learning_rate": 2e-07, "loss": 0.0181, "step": 573 }, { "clip_ratio/high_max": 0.0020948576275259256, "clip_ratio/high_mean": 0.000933143550355453, "clip_ratio/low_mean": 0.00102705701465311, "clip_ratio/low_min": 0.00012291240454942454, "clip_ratio/region_mean": 0.0019602006068453193, "epoch": 0.05357319940033483, "grad_norm": 0.11983940005302429, "learning_rate": 2e-07, "loss": 0.0713, "step": 574 }, { "clip_ratio/high_max": 0.0022457263548858464, "clip_ratio/high_mean": 0.0009589354121999349, "clip_ratio/low_mean": 0.001094980083507835, "clip_ratio/low_min": 0.00014410053290703217, "clip_ratio/region_mean": 0.0020539155084406957, "epoch": 0.053666532500335415, "grad_norm": 0.12965551018714905, "learning_rate": 2e-07, "loss": 0.0612, "step": 575 }, { "clip_ratio/high_max": 0.0021580680331680924, "clip_ratio/high_mean": 0.0009038720490934793, "clip_ratio/low_mean": 0.0009144431714958046, "clip_ratio/low_min": 1.2711002455034759e-05, "clip_ratio/region_mean": 0.001818315198761411, "epoch": 0.053759865600336, "grad_norm": 0.10498246550559998, "learning_rate": 2e-07, "loss": 0.0099, "step": 576 }, { "clip_ratio/high_max": 0.0019492115316097625, "clip_ratio/high_mean": 0.0009071483782463474, "clip_ratio/low_mean": 0.0009176673629553989, "clip_ratio/low_min": 7.375644327112241e-05, "clip_ratio/region_mean": 0.0018248157284688205, "epoch": 0.053853198700336585, "grad_norm": 0.12012619525194168, "learning_rate": 2e-07, "loss": 0.0185, "step": 577 }, { "clip_ratio/high_max": 0.0017023940781655256, "clip_ratio/high_mean": 0.000739204604542465, "clip_ratio/low_mean": 0.0009804242490645265, "clip_ratio/low_min": 0.00016335269447154133, "clip_ratio/region_mean": 0.0017196288499690127, "epoch": 0.053946531800337164, "grad_norm": 0.11582954972982407, "learning_rate": 2e-07, "loss": 0.038, "step": 578 }, { "clip_ratio/high_max": 0.002048346748779295, "clip_ratio/high_mean": 0.0008254232488980051, "clip_ratio/low_mean": 0.0009237628073606174, "clip_ratio/low_min": 5.9767390666820575e-05, "clip_ratio/region_mean": 0.0017491860635345802, "epoch": 0.05403986490033775, "grad_norm": 0.1181752160191536, "learning_rate": 2e-07, "loss": 0.0387, "step": 579 }, { "clip_ratio/high_max": 0.0018694685204536654, "clip_ratio/high_mean": 0.0009552729843562702, "clip_ratio/low_mean": 0.0009647444639995228, "clip_ratio/low_min": 0.00017141571515821852, "clip_ratio/region_mean": 0.0019200174792786129, "epoch": 0.054133198000338334, "grad_norm": 0.11863341182470322, "learning_rate": 2e-07, "loss": 0.025, "step": 580 }, { "clip_ratio/high_max": 0.0022962249640841037, "clip_ratio/high_mean": 0.0009976906003430486, "clip_ratio/low_mean": 0.0008344412362930598, "clip_ratio/low_min": 9.821933508646907e-05, "clip_ratio/region_mean": 0.0018321318384550977, "epoch": 0.05422653110033892, "grad_norm": 0.11145305633544922, "learning_rate": 2e-07, "loss": 0.001, "step": 581 }, { "clip_ratio/high_max": 0.0021815884683746845, "clip_ratio/high_mean": 0.000954229588387534, "clip_ratio/low_mean": 0.0009202340079355054, "clip_ratio/low_min": 8.562316816096427e-05, "clip_ratio/region_mean": 0.0018744636327028275, "epoch": 0.0543198642003395, "grad_norm": 0.11698178201913834, "learning_rate": 2e-07, "loss": 0.0131, "step": 582 }, { "clip_ratio/high_max": 0.0017914551390276756, "clip_ratio/high_mean": 0.0007192978455350385, "clip_ratio/low_mean": 0.0009974592576327268, "clip_ratio/low_min": 0.00018289320632902673, "clip_ratio/region_mean": 0.0017167571277241223, "epoch": 0.05441319730034008, "grad_norm": 0.10542143136262894, "learning_rate": 2e-07, "loss": 0.09, "step": 583 }, { "clip_ratio/high_max": 0.002489315505954437, "clip_ratio/high_mean": 0.0010848806850844994, "clip_ratio/low_mean": 0.0009319544533354929, "clip_ratio/low_min": 0.00015061532303661807, "clip_ratio/region_mean": 0.0020168351620668545, "epoch": 0.05450653040034067, "grad_norm": 0.1231141984462738, "learning_rate": 2e-07, "loss": -0.0248, "step": 584 }, { "clip_ratio/high_max": 0.002071356044325512, "clip_ratio/high_mean": 0.0008813738459139131, "clip_ratio/low_mean": 0.0009529373710392974, "clip_ratio/low_min": 0.00011528226150403498, "clip_ratio/region_mean": 0.0018343112387810834, "epoch": 0.054599863500341246, "grad_norm": 0.11391407996416092, "learning_rate": 2e-07, "loss": 0.0404, "step": 585 }, { "clip_ratio/high_max": 0.00215815971387201, "clip_ratio/high_mean": 0.0009000809459394077, "clip_ratio/low_mean": 0.0008285351814265596, "clip_ratio/low_min": 3.1650698474550154e-05, "clip_ratio/region_mean": 0.0017286161455558613, "epoch": 0.05469319660034183, "grad_norm": 0.1060062050819397, "learning_rate": 2e-07, "loss": 0.0051, "step": 586 }, { "clip_ratio/high_max": 0.0021636919482261874, "clip_ratio/high_mean": 0.0008839763577270787, "clip_ratio/low_mean": 0.001028448448778363, "clip_ratio/low_min": 9.961185151041718e-05, "clip_ratio/region_mean": 0.001912424821057357, "epoch": 0.054786529700342416, "grad_norm": 0.11327964067459106, "learning_rate": 2e-07, "loss": 0.0049, "step": 587 }, { "clip_ratio/high_max": 0.0022040526018827222, "clip_ratio/high_mean": 0.0009347021805297118, "clip_ratio/low_mean": 0.0009536270245007472, "clip_ratio/low_min": 0.00013456894430419197, "clip_ratio/region_mean": 0.0018883292068494484, "epoch": 0.054879862800343, "grad_norm": 0.1060989573597908, "learning_rate": 2e-07, "loss": 0.004, "step": 588 }, { "clip_ratio/high_max": 0.0022646527795586735, "clip_ratio/high_mean": 0.0009703894174890593, "clip_ratio/low_mean": 0.0009586943124304526, "clip_ratio/low_min": 9.760666489455616e-05, "clip_ratio/region_mean": 0.0019290837371954694, "epoch": 0.05497319590034358, "grad_norm": 0.11030080169439316, "learning_rate": 2e-07, "loss": 0.0082, "step": 589 }, { "clip_ratio/high_max": 0.0022469341711257584, "clip_ratio/high_mean": 0.0009577232995070517, "clip_ratio/low_mean": 0.0009654760960984277, "clip_ratio/low_min": 0.0001352637991658412, "clip_ratio/region_mean": 0.001923199357406702, "epoch": 0.055066529000344165, "grad_norm": 0.11834479868412018, "learning_rate": 2e-07, "loss": -0.0002, "step": 590 }, { "clip_ratio/high_max": 0.0018319178743695375, "clip_ratio/high_mean": 0.0007825559368939139, "clip_ratio/low_mean": 0.0008778100618656026, "clip_ratio/low_min": 8.736990366742248e-05, "clip_ratio/region_mean": 0.0016603660260443576, "epoch": 0.05515986210034475, "grad_norm": 0.118146151304245, "learning_rate": 2e-07, "loss": 0.0622, "step": 591 }, { "clip_ratio/high_max": 0.0017976771996472962, "clip_ratio/high_mean": 0.0007693296793149784, "clip_ratio/low_mean": 0.0007641156280442374, "clip_ratio/low_min": 6.267140270210803e-05, "clip_ratio/region_mean": 0.0015334453200921416, "epoch": 0.055253195200345336, "grad_norm": 0.10926242172718048, "learning_rate": 2e-07, "loss": 0.0273, "step": 592 }, { "clip_ratio/high_max": 0.0026338685675000306, "clip_ratio/high_mean": 0.0009663117634772789, "clip_ratio/low_mean": 0.0009121192797465483, "clip_ratio/low_min": 7.500432366214227e-05, "clip_ratio/region_mean": 0.0018784310450428165, "epoch": 0.055346528300345914, "grad_norm": 0.11061977595090866, "learning_rate": 2e-07, "loss": 0.0166, "step": 593 }, { "clip_ratio/high_max": 0.002083148927340517, "clip_ratio/high_mean": 0.0008223294162235106, "clip_ratio/low_mean": 0.0010763248174043838, "clip_ratio/low_min": 0.0001860264346760232, "clip_ratio/region_mean": 0.0018986542963830288, "epoch": 0.0554398614003465, "grad_norm": 0.11268526315689087, "learning_rate": 2e-07, "loss": 0.0702, "step": 594 }, { "clip_ratio/high_max": 0.0020758378668688238, "clip_ratio/high_mean": 0.0008936209451348986, "clip_ratio/low_mean": 0.0009142496310232673, "clip_ratio/low_min": 4.0614267163618933e-05, "clip_ratio/region_mean": 0.0018078706052619964, "epoch": 0.055533194500347084, "grad_norm": 0.11834265291690826, "learning_rate": 2e-07, "loss": 0.0134, "step": 595 }, { "clip_ratio/high_max": 0.0025160266159218736, "clip_ratio/high_mean": 0.0009563830753904767, "clip_ratio/low_mean": 0.0009830791259446414, "clip_ratio/low_min": 0.0001872199036370148, "clip_ratio/region_mean": 0.001939462214068044, "epoch": 0.05562652760034766, "grad_norm": 0.112601138651371, "learning_rate": 2e-07, "loss": 0.0173, "step": 596 }, { "clip_ratio/high_max": 0.0024438713808194734, "clip_ratio/high_mean": 0.0010165323146793526, "clip_ratio/low_mean": 0.0008924760777517804, "clip_ratio/low_min": 0.00012797618364857044, "clip_ratio/region_mean": 0.0019090083296759985, "epoch": 0.05571986070034825, "grad_norm": 0.12324375659227371, "learning_rate": 2e-07, "loss": 0.0248, "step": 597 }, { "clip_ratio/high_max": 0.0020940234608133323, "clip_ratio/high_mean": 0.0009214230267389212, "clip_ratio/low_mean": 0.0008906867624318693, "clip_ratio/low_min": 5.216767385718413e-05, "clip_ratio/region_mean": 0.0018121098037227057, "epoch": 0.05581319380034883, "grad_norm": 0.121707484126091, "learning_rate": 2e-07, "loss": 0.0148, "step": 598 }, { "clip_ratio/high_max": 0.002212887349742232, "clip_ratio/high_mean": 0.0009187065752485069, "clip_ratio/low_mean": 0.0008958016442193184, "clip_ratio/low_min": 8.468555643048603e-05, "clip_ratio/region_mean": 0.0018145082103728782, "epoch": 0.05590652690034942, "grad_norm": 0.12470190227031708, "learning_rate": 2e-07, "loss": 0.0229, "step": 599 }, { "clip_ratio/high_max": 0.0020196351397316903, "clip_ratio/high_mean": 0.0007749854048597626, "clip_ratio/low_mean": 0.0009585931238689227, "clip_ratio/low_min": 9.368802238896023e-05, "clip_ratio/region_mean": 0.0017335785378236324, "epoch": 0.055999860000349996, "grad_norm": 0.11060390621423721, "learning_rate": 2e-07, "loss": 0.0548, "step": 600 }, { "clip_ratio/high_max": 0.0021206659184827004, "clip_ratio/high_mean": 0.0008937904367485316, "clip_ratio/low_mean": 0.001179236136522377, "clip_ratio/low_min": 0.00021053740420029499, "clip_ratio/region_mean": 0.0020730266187456436, "epoch": 0.05609319310035058, "grad_norm": 0.11506493389606476, "learning_rate": 2e-07, "loss": 0.0346, "step": 601 }, { "clip_ratio/high_max": 0.002200509152316954, "clip_ratio/high_mean": 0.0009363797780679306, "clip_ratio/low_mean": 0.001097693806514144, "clip_ratio/low_min": 0.00019086016891378677, "clip_ratio/region_mean": 0.0020340735791251063, "epoch": 0.05618652620035117, "grad_norm": 0.12784834206104279, "learning_rate": 2e-07, "loss": 0.0376, "step": 602 }, { "clip_ratio/high_max": 0.0022849907545605674, "clip_ratio/high_mean": 0.0010077215629280545, "clip_ratio/low_mean": 0.0009346351216663606, "clip_ratio/low_min": 6.386938730429392e-05, "clip_ratio/region_mean": 0.0019423566700425, "epoch": 0.05627985930035175, "grad_norm": 0.11396363377571106, "learning_rate": 2e-07, "loss": 0.0088, "step": 603 }, { "clip_ratio/high_max": 0.0024233636941062286, "clip_ratio/high_mean": 0.0010009391226049047, "clip_ratio/low_mean": 0.0009546579822199419, "clip_ratio/low_min": 0.0001454099301554379, "clip_ratio/region_mean": 0.0019555971084628254, "epoch": 0.05637319240035233, "grad_norm": 0.11195860803127289, "learning_rate": 2e-07, "loss": 0.0182, "step": 604 }, { "clip_ratio/high_max": 0.0022584292528335936, "clip_ratio/high_mean": 0.001017276854327065, "clip_ratio/low_mean": 0.0010132947136298753, "clip_ratio/low_min": 8.994978270493448e-05, "clip_ratio/region_mean": 0.0020305715734139085, "epoch": 0.056466525500352915, "grad_norm": 0.1288360059261322, "learning_rate": 2e-07, "loss": 0.0282, "step": 605 }, { "clip_ratio/high_max": 0.0020801229766220786, "clip_ratio/high_mean": 0.0008598467538831756, "clip_ratio/low_mean": 0.0010053420628537424, "clip_ratio/low_min": 0.000144050864946621, "clip_ratio/region_mean": 0.0018651888094609603, "epoch": 0.0565598586003535, "grad_norm": 0.11538514494895935, "learning_rate": 2e-07, "loss": 0.0163, "step": 606 }, { "clip_ratio/high_max": 0.001956802541826619, "clip_ratio/high_mean": 0.0007998972778295865, "clip_ratio/low_mean": 0.0010591943155304762, "clip_ratio/low_min": 6.012514859321527e-05, "clip_ratio/region_mean": 0.0018590915569802746, "epoch": 0.056653191700354086, "grad_norm": 0.11271995306015015, "learning_rate": 2e-07, "loss": 0.0426, "step": 607 }, { "clip_ratio/high_max": 0.0022188252478372306, "clip_ratio/high_mean": 0.000901914712812868, "clip_ratio/low_mean": 0.001017480459267972, "clip_ratio/low_min": 9.17556226340821e-05, "clip_ratio/region_mean": 0.0019193951375200413, "epoch": 0.056746524800354664, "grad_norm": 0.11789216846227646, "learning_rate": 2e-07, "loss": 0.0437, "step": 608 }, { "clip_ratio/high_max": 0.0016462784296891186, "clip_ratio/high_mean": 0.0007263420666276943, "clip_ratio/low_mean": 0.000937152142796549, "clip_ratio/low_min": 4.636198718799278e-05, "clip_ratio/region_mean": 0.0016634942148812115, "epoch": 0.05683985790035525, "grad_norm": 0.11146269738674164, "learning_rate": 2e-07, "loss": 0.0098, "step": 609 }, { "clip_ratio/high_max": 0.0022068977195885964, "clip_ratio/high_mean": 0.0009652531571191503, "clip_ratio/low_mean": 0.0009203112131217495, "clip_ratio/low_min": 4.719633579952642e-05, "clip_ratio/region_mean": 0.0018855643502320163, "epoch": 0.056933191000355834, "grad_norm": 0.12851552665233612, "learning_rate": 2e-07, "loss": 0.0224, "step": 610 }, { "clip_ratio/high_max": 0.0017423881399736274, "clip_ratio/high_mean": 0.0007317573654290754, "clip_ratio/low_mean": 0.0010414331663923804, "clip_ratio/low_min": 0.00021733309449700755, "clip_ratio/region_mean": 0.0017731905245454982, "epoch": 0.05702652410035641, "grad_norm": 0.11545484513044357, "learning_rate": 2e-07, "loss": 0.1016, "step": 611 }, { "clip_ratio/high_max": 0.0018321981078770477, "clip_ratio/high_mean": 0.0008588770760979969, "clip_ratio/low_mean": 0.0009954212764569093, "clip_ratio/low_min": 0.00010560900591372047, "clip_ratio/region_mean": 0.0018542983307270333, "epoch": 0.057119857200357, "grad_norm": 0.1160525381565094, "learning_rate": 2e-07, "loss": 0.065, "step": 612 }, { "clip_ratio/high_max": 0.0018438875922583975, "clip_ratio/high_mean": 0.0008540100880054524, "clip_ratio/low_mean": 0.0009813424658204895, "clip_ratio/low_min": 7.070754691085313e-05, "clip_ratio/region_mean": 0.001835352522903122, "epoch": 0.05721319030035758, "grad_norm": 0.12325077503919601, "learning_rate": 2e-07, "loss": 0.0178, "step": 613 }, { "clip_ratio/high_max": 0.0020148377916484606, "clip_ratio/high_mean": 0.0008188337687897729, "clip_ratio/low_mean": 0.0008718620956642553, "clip_ratio/low_min": 2.973655500682071e-05, "clip_ratio/region_mean": 0.0016906958335312083, "epoch": 0.05730652340035817, "grad_norm": 0.11990873515605927, "learning_rate": 2e-07, "loss": 0.0543, "step": 614 }, { "clip_ratio/high_max": 0.0024417194654233754, "clip_ratio/high_mean": 0.0009819797305681277, "clip_ratio/low_mean": 0.0008621455563115887, "clip_ratio/low_min": 7.976830147526925e-05, "clip_ratio/region_mean": 0.0018441253268974833, "epoch": 0.05739985650035875, "grad_norm": 0.11211275309324265, "learning_rate": 2e-07, "loss": -0.0065, "step": 615 }, { "clip_ratio/high_max": 0.0024322381941601634, "clip_ratio/high_mean": 0.0009480927637923742, "clip_ratio/low_mean": 0.0008639070874778554, "clip_ratio/low_min": 5.4639115660393145e-05, "clip_ratio/region_mean": 0.0018119998494512402, "epoch": 0.05749318960035933, "grad_norm": 0.11129918694496155, "learning_rate": 2e-07, "loss": 0.0059, "step": 616 }, { "clip_ratio/high_max": 0.002055084059975343, "clip_ratio/high_mean": 0.0008700843236510991, "clip_ratio/low_mean": 0.0009720877224026481, "clip_ratio/low_min": 0.0001493253257649485, "clip_ratio/region_mean": 0.0018421720378682949, "epoch": 0.05758652270035992, "grad_norm": 0.11633151769638062, "learning_rate": 2e-07, "loss": 0.0398, "step": 617 }, { "clip_ratio/high_max": 0.0023168694679043256, "clip_ratio/high_mean": 0.0009925645463226829, "clip_ratio/low_mean": 0.0009188110579998465, "clip_ratio/low_min": 6.267105800361605e-05, "clip_ratio/region_mean": 0.0019113756061415188, "epoch": 0.0576798558003605, "grad_norm": 0.10338623076677322, "learning_rate": 2e-07, "loss": 0.0008, "step": 618 }, { "clip_ratio/high_max": 0.0022001542020007037, "clip_ratio/high_mean": 0.0009023841721500503, "clip_ratio/low_mean": 0.000887502494151704, "clip_ratio/low_min": 8.556810917070834e-05, "clip_ratio/region_mean": 0.001789886700862553, "epoch": 0.05777318890036108, "grad_norm": 0.12876224517822266, "learning_rate": 2e-07, "loss": 0.0119, "step": 619 }, { "clip_ratio/high_max": 0.002233200160844717, "clip_ratio/high_mean": 0.0008979661251942161, "clip_ratio/low_mean": 0.0008993901101348456, "clip_ratio/low_min": 0.00011472089227027027, "clip_ratio/region_mean": 0.0017973562426050194, "epoch": 0.057866522000361666, "grad_norm": 0.10375628620386124, "learning_rate": 2e-07, "loss": 0.0476, "step": 620 }, { "clip_ratio/high_max": 0.0019879384781233966, "clip_ratio/high_mean": 0.000867251797899371, "clip_ratio/low_mean": 0.000989591988400207, "clip_ratio/low_min": 0.0001362598786727176, "clip_ratio/region_mean": 0.0018568437444628216, "epoch": 0.05795985510036225, "grad_norm": 0.11803611367940903, "learning_rate": 2e-07, "loss": 0.0311, "step": 621 }, { "clip_ratio/high_max": 0.0022045137229724787, "clip_ratio/high_mean": 0.0010708162590162829, "clip_ratio/low_mean": 0.0009048676038219128, "clip_ratio/low_min": 3.424507849558722e-05, "clip_ratio/region_mean": 0.0019756837937165983, "epoch": 0.05805318820036283, "grad_norm": 0.11817792057991028, "learning_rate": 2e-07, "loss": 0.0155, "step": 622 }, { "clip_ratio/high_max": 0.002727392391534522, "clip_ratio/high_mean": 0.001058629684848711, "clip_ratio/low_mean": 0.0009116101082327077, "clip_ratio/low_min": 4.3188058043597266e-05, "clip_ratio/region_mean": 0.0019702397476066835, "epoch": 0.058146521300363414, "grad_norm": 0.1177649050951004, "learning_rate": 2e-07, "loss": 0.0022, "step": 623 }, { "clip_ratio/high_max": 0.0017515255458420143, "clip_ratio/high_mean": 0.000796027014075662, "clip_ratio/low_mean": 0.0009457279393245699, "clip_ratio/low_min": 3.4069600587827154e-05, "clip_ratio/region_mean": 0.001741754931572359, "epoch": 0.058239854400364, "grad_norm": 0.11694556474685669, "learning_rate": 2e-07, "loss": 0.0299, "step": 624 }, { "clip_ratio/high_max": 0.002340443643333856, "clip_ratio/high_mean": 0.0009413007064722478, "clip_ratio/low_mean": 0.0010392930180387339, "clip_ratio/low_min": 0.00015762340308356215, "clip_ratio/region_mean": 0.001980593726329971, "epoch": 0.058333187500364585, "grad_norm": 0.11658074706792831, "learning_rate": 2e-07, "loss": 0.0568, "step": 625 }, { "clip_ratio/high_max": 0.0019569094984035473, "clip_ratio/high_mean": 0.0008405772168771364, "clip_ratio/low_mean": 0.0009400380567967659, "clip_ratio/low_min": 0.00013596559074358083, "clip_ratio/region_mean": 0.0017806152536650188, "epoch": 0.05842652060036516, "grad_norm": 0.11186511069536209, "learning_rate": 2e-07, "loss": 0.03, "step": 626 }, { "clip_ratio/high_max": 0.0018417965911794454, "clip_ratio/high_mean": 0.000840042601339519, "clip_ratio/low_mean": 0.0009863174782367423, "clip_ratio/low_min": 0.0001037850379361771, "clip_ratio/region_mean": 0.0018263600795762613, "epoch": 0.05851985370036575, "grad_norm": 0.11228141188621521, "learning_rate": 2e-07, "loss": 0.0252, "step": 627 }, { "clip_ratio/high_max": 0.0022933728905627504, "clip_ratio/high_mean": 0.0009012081864057109, "clip_ratio/low_mean": 0.001025328030664241, "clip_ratio/low_min": 7.148210534069221e-05, "clip_ratio/region_mean": 0.0019265362279838882, "epoch": 0.05861318680036633, "grad_norm": 0.12023285776376724, "learning_rate": 2e-07, "loss": 0.0313, "step": 628 }, { "clip_ratio/high_max": 0.0021305307163856924, "clip_ratio/high_mean": 0.0008642983593745157, "clip_ratio/low_mean": 0.0009644283672969323, "clip_ratio/low_min": 6.521927207359113e-05, "clip_ratio/region_mean": 0.0018287267012055963, "epoch": 0.05870651990036692, "grad_norm": 0.14766451716423035, "learning_rate": 2e-07, "loss": 0.0321, "step": 629 }, { "clip_ratio/high_max": 0.0024739799919188954, "clip_ratio/high_mean": 0.001017876385958516, "clip_ratio/low_mean": 0.0009563955009070924, "clip_ratio/low_min": 0.00011074225494667189, "clip_ratio/region_mean": 0.0019742718868656084, "epoch": 0.0587998530003675, "grad_norm": 0.11985670030117035, "learning_rate": 2e-07, "loss": -0.0245, "step": 630 }, { "clip_ratio/high_max": 0.0021315259727998637, "clip_ratio/high_mean": 0.0008786385860730661, "clip_ratio/low_mean": 0.0009978000198316295, "clip_ratio/low_min": 0.0001557267760290415, "clip_ratio/region_mean": 0.0018764385968097486, "epoch": 0.05889318610036808, "grad_norm": 0.1174456998705864, "learning_rate": 2e-07, "loss": 0.0232, "step": 631 }, { "clip_ratio/high_max": 0.001963110644283006, "clip_ratio/high_mean": 0.0008560341157135554, "clip_ratio/low_mean": 0.0009234173376171384, "clip_ratio/low_min": 7.418874156428501e-05, "clip_ratio/region_mean": 0.001779451449692715, "epoch": 0.05898651920036867, "grad_norm": 0.1255776435136795, "learning_rate": 2e-07, "loss": 0.0557, "step": 632 }, { "clip_ratio/high_max": 0.0020621189250960015, "clip_ratio/high_mean": 0.0009853328665485606, "clip_ratio/low_mean": 0.0009934539193636738, "clip_ratio/low_min": 7.471607932529878e-05, "clip_ratio/region_mean": 0.001978786807740107, "epoch": 0.05907985230036925, "grad_norm": 0.11676029860973358, "learning_rate": 2e-07, "loss": 0.0621, "step": 633 }, { "clip_ratio/high_max": 0.0025065186964638997, "clip_ratio/high_mean": 0.0009538823615002912, "clip_ratio/low_mean": 0.0009157164076896152, "clip_ratio/low_min": 0.00010371599819336552, "clip_ratio/region_mean": 0.0018695987237151712, "epoch": 0.05917318540036983, "grad_norm": 0.11800405383110046, "learning_rate": 2e-07, "loss": 0.0201, "step": 634 }, { "clip_ratio/high_max": 0.0023061880201566964, "clip_ratio/high_mean": 0.0009191065219056327, "clip_ratio/low_mean": 0.0010262006289849523, "clip_ratio/low_min": 0.00012957333183294395, "clip_ratio/region_mean": 0.0019453071290627122, "epoch": 0.059266518500370416, "grad_norm": 0.12821388244628906, "learning_rate": 2e-07, "loss": 0.0301, "step": 635 }, { "clip_ratio/high_max": 0.0025455046488787048, "clip_ratio/high_mean": 0.0009687258989288239, "clip_ratio/low_mean": 0.0009747637559485156, "clip_ratio/low_min": 4.7209832700900733e-05, "clip_ratio/region_mean": 0.0019434896385064349, "epoch": 0.059359851600371, "grad_norm": 0.10838401317596436, "learning_rate": 2e-07, "loss": 0.0256, "step": 636 }, { "clip_ratio/high_max": 0.0021143549820408225, "clip_ratio/high_mean": 0.000868700873979833, "clip_ratio/low_mean": 0.0010076763082906837, "clip_ratio/low_min": 0.0001655052419664571, "clip_ratio/region_mean": 0.0018763771731755696, "epoch": 0.05945318470037158, "grad_norm": 0.11455827206373215, "learning_rate": 2e-07, "loss": 0.0385, "step": 637 }, { "clip_ratio/high_max": 0.002226033895567525, "clip_ratio/high_mean": 0.0008930311141739367, "clip_ratio/low_mean": 0.0009752767145982943, "clip_ratio/low_min": 0.00011565575368877035, "clip_ratio/region_mean": 0.00186830780148739, "epoch": 0.059546517800372165, "grad_norm": 0.11483007669448853, "learning_rate": 2e-07, "loss": -0.0197, "step": 638 }, { "clip_ratio/high_max": 0.002058508263871772, "clip_ratio/high_mean": 0.0008881699122866848, "clip_ratio/low_mean": 0.000922311241083662, "clip_ratio/low_min": 0.00014612324775953311, "clip_ratio/region_mean": 0.0018104811169905588, "epoch": 0.05963985090037275, "grad_norm": 0.11812012642621994, "learning_rate": 2e-07, "loss": 0.0047, "step": 639 }, { "clip_ratio/high_max": 0.002003866891755024, "clip_ratio/high_mean": 0.0008674252258060733, "clip_ratio/low_mean": 0.0008784973888396053, "clip_ratio/low_min": 4.701655052485876e-05, "clip_ratio/region_mean": 0.0017459226291975938, "epoch": 0.059733184000373335, "grad_norm": 0.10835648328065872, "learning_rate": 2e-07, "loss": -0.0067, "step": 640 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.014482770647321397, "completions/max_length": 4096.0, "completions/max_terminated_length": 4089.0, "completions/mean_length": 613.0990600585938, "completions/mean_terminated_length": 561.9157104492188, "completions/min_length": 2.0, "completions/min_terminated_length": 2.0, "epoch": 0.05982651710037391, "grad_norm": 0.12525855004787445, "learning_rate": 2e-07, "loss": 0.0285, "num_tokens": 488896931.0, "reward": 0.55816650390625, "reward_std": 0.21315595507621765, "rewards/simpleverify_reward/mean": 0.55816650390625, "rewards/simpleverify_reward/std": 0.49660736322402954, "step": 641 }, { "clip_ratio/high_max": 0.002371956841670908, "clip_ratio/high_mean": 0.0009330493849120103, "clip_ratio/low_mean": 0.0006415565894712927, "clip_ratio/low_min": 5.7625811678008176e-05, "clip_ratio/region_mean": 0.0015746059507364407, "epoch": 0.0599198502003745, "grad_norm": 0.11834606528282166, "learning_rate": 2e-07, "loss": 0.0072, "step": 642 }, { "clip_ratio/high_max": 0.0022746646536688786, "clip_ratio/high_mean": 0.0009125092728936579, "clip_ratio/low_mean": 0.0005986554497212637, "clip_ratio/low_min": 2.2847357286082115e-05, "clip_ratio/region_mean": 0.0015111647262529004, "epoch": 0.060013183300375084, "grad_norm": 0.11614423245191574, "learning_rate": 2e-07, "loss": 0.0403, "step": 643 }, { "clip_ratio/high_max": 0.0020758877362823114, "clip_ratio/high_mean": 0.0008623836965853116, "clip_ratio/low_mean": 0.0005467594128276687, "clip_ratio/low_min": 1.3366125131142326e-05, "clip_ratio/region_mean": 0.001409143085766118, "epoch": 0.06010651640037567, "grad_norm": 0.12088653445243835, "learning_rate": 2e-07, "loss": 0.0202, "step": 644 }, { "clip_ratio/high_max": 0.002267705203848891, "clip_ratio/high_mean": 0.0008915706566767767, "clip_ratio/low_mean": 0.0005369100526877446, "clip_ratio/low_min": 3.705171911860816e-05, "clip_ratio/region_mean": 0.0014284807111835107, "epoch": 0.06019984950037625, "grad_norm": 0.1258813887834549, "learning_rate": 2e-07, "loss": 0.0128, "step": 645 }, { "clip_ratio/high_max": 0.002247929136501625, "clip_ratio/high_mean": 0.0009537510995869525, "clip_ratio/low_mean": 0.0005995985120534897, "clip_ratio/low_min": 5.000415421818616e-05, "clip_ratio/region_mean": 0.0015533496298303362, "epoch": 0.06029318260037683, "grad_norm": 0.1321881264448166, "learning_rate": 2e-07, "loss": 0.0019, "step": 646 }, { "clip_ratio/high_max": 0.002189490172895603, "clip_ratio/high_mean": 0.0009045034275914077, "clip_ratio/low_mean": 0.0005839939694851637, "clip_ratio/low_min": 5.7134192502417136e-05, "clip_ratio/region_mean": 0.0014884973825246561, "epoch": 0.06038651570037742, "grad_norm": 0.11817917227745056, "learning_rate": 2e-07, "loss": 0.0283, "step": 647 }, { "clip_ratio/high_max": 0.0018796877047861926, "clip_ratio/high_mean": 0.000751205816413858, "clip_ratio/low_mean": 0.0006382209958246676, "clip_ratio/low_min": 6.225532069947803e-05, "clip_ratio/region_mean": 0.001389426804962568, "epoch": 0.060479848800377996, "grad_norm": 0.11604613810777664, "learning_rate": 2e-07, "loss": 0.0583, "step": 648 }, { "clip_ratio/high_max": 0.00240376027795719, "clip_ratio/high_mean": 0.0009194964295602404, "clip_ratio/low_mean": 0.0006476884809671901, "clip_ratio/low_min": 2.319556188012939e-05, "clip_ratio/region_mean": 0.0015671849250793457, "epoch": 0.06057318190037858, "grad_norm": 0.12826141715049744, "learning_rate": 2e-07, "loss": 0.0336, "step": 649 }, { "clip_ratio/high_max": 0.0021634745608025696, "clip_ratio/high_mean": 0.000879203422300634, "clip_ratio/low_mean": 0.0005358941698432318, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.001415097591234371, "epoch": 0.060666515000379166, "grad_norm": 0.11927508562803268, "learning_rate": 2e-07, "loss": -0.0059, "step": 650 }, { "clip_ratio/high_max": 0.002212839295680169, "clip_ratio/high_mean": 0.0008483325818815501, "clip_ratio/low_mean": 0.0007601955458085285, "clip_ratio/low_min": 5.877712374058319e-05, "clip_ratio/region_mean": 0.0016085281240520999, "epoch": 0.06075984810037975, "grad_norm": 0.11917001754045486, "learning_rate": 2e-07, "loss": 0.0356, "step": 651 }, { "clip_ratio/high_max": 0.0021385813561209943, "clip_ratio/high_mean": 0.0008537513640476391, "clip_ratio/low_mean": 0.0005956591285212198, "clip_ratio/low_min": 5.837635490024695e-05, "clip_ratio/region_mean": 0.0014494104871118907, "epoch": 0.06085318120038033, "grad_norm": 0.13249382376670837, "learning_rate": 2e-07, "loss": 0.0644, "step": 652 }, { "clip_ratio/high_max": 0.0023779871698934585, "clip_ratio/high_mean": 0.0008243031115853228, "clip_ratio/low_mean": 0.0006609952470171265, "clip_ratio/low_min": 5.012668407289311e-05, "clip_ratio/region_mean": 0.001485298402258195, "epoch": 0.060946514300380915, "grad_norm": 0.11846628785133362, "learning_rate": 2e-07, "loss": 0.0604, "step": 653 }, { "clip_ratio/high_max": 0.0018709585565375164, "clip_ratio/high_mean": 0.0007969460493768565, "clip_ratio/low_mean": 0.0005839664827362867, "clip_ratio/low_min": 5.370378221414285e-05, "clip_ratio/region_mean": 0.0013809125230181962, "epoch": 0.0610398474003815, "grad_norm": 0.12018971890211105, "learning_rate": 2e-07, "loss": 0.0177, "step": 654 }, { "clip_ratio/high_max": 0.0020739580140798353, "clip_ratio/high_mean": 0.0008887231106200488, "clip_ratio/low_mean": 0.0006062251532057417, "clip_ratio/low_min": 7.88685902080033e-05, "clip_ratio/region_mean": 0.0014949482574593276, "epoch": 0.061133180500382085, "grad_norm": 0.12182638794183731, "learning_rate": 2e-07, "loss": 0.0124, "step": 655 }, { "clip_ratio/high_max": 0.002188773207308259, "clip_ratio/high_mean": 0.00087898702986422, "clip_ratio/low_mean": 0.000774167585404939, "clip_ratio/low_min": 5.4331151659425814e-05, "clip_ratio/region_mean": 0.001653154642554, "epoch": 0.061226513600382663, "grad_norm": 0.11339588463306427, "learning_rate": 2e-07, "loss": 0.0144, "step": 656 }, { "clip_ratio/high_max": 0.002100151206832379, "clip_ratio/high_mean": 0.0008244738055509515, "clip_ratio/low_mean": 0.0008182076344382949, "clip_ratio/low_min": 0.00013545964975492097, "clip_ratio/region_mean": 0.001642681465455098, "epoch": 0.06131984670038325, "grad_norm": 0.10663426667451859, "learning_rate": 2e-07, "loss": 0.0694, "step": 657 }, { "clip_ratio/high_max": 0.001858689731307095, "clip_ratio/high_mean": 0.0008595221115683671, "clip_ratio/low_mean": 0.0007298510918190004, "clip_ratio/low_min": 8.013111892068991e-05, "clip_ratio/region_mean": 0.0015893732343101874, "epoch": 0.061413179800383834, "grad_norm": 0.11360536515712738, "learning_rate": 2e-07, "loss": 0.0304, "step": 658 }, { "clip_ratio/high_max": 0.0022252499402384274, "clip_ratio/high_mean": 0.0009185917788272491, "clip_ratio/low_mean": 0.0007417927899950882, "clip_ratio/low_min": 9.653050074120983e-05, "clip_ratio/region_mean": 0.0016603845979261678, "epoch": 0.06150651290038442, "grad_norm": 0.12179926037788391, "learning_rate": 2e-07, "loss": 0.0129, "step": 659 }, { "clip_ratio/high_max": 0.0022896380614838563, "clip_ratio/high_mean": 0.0009318047377746552, "clip_ratio/low_mean": 0.0006730870027240599, "clip_ratio/low_min": 1.940858601301443e-05, "clip_ratio/region_mean": 0.0016048917605075985, "epoch": 0.061599846000385, "grad_norm": 0.11873029917478561, "learning_rate": 2e-07, "loss": 0.0206, "step": 660 }, { "clip_ratio/high_max": 0.0020351467064756434, "clip_ratio/high_mean": 0.0007730941815680126, "clip_ratio/low_mean": 0.0006992682865529787, "clip_ratio/low_min": 3.565988390619168e-05, "clip_ratio/region_mean": 0.0014723624990438111, "epoch": 0.06169317910038558, "grad_norm": 0.11425571888685226, "learning_rate": 2e-07, "loss": 0.0104, "step": 661 }, { "clip_ratio/high_max": 0.002312986813194584, "clip_ratio/high_mean": 0.0009187582600134192, "clip_ratio/low_mean": 0.0007571778669444029, "clip_ratio/low_min": 8.963149821283878e-05, "clip_ratio/region_mean": 0.0016759361387812532, "epoch": 0.06178651220038617, "grad_norm": 0.12232028692960739, "learning_rate": 2e-07, "loss": 0.0517, "step": 662 }, { "clip_ratio/high_max": 0.002112763835611986, "clip_ratio/high_mean": 0.0008409908223256934, "clip_ratio/low_mean": 0.0006868618111184333, "clip_ratio/low_min": 2.1800494323542807e-05, "clip_ratio/region_mean": 0.0015278526370821055, "epoch": 0.061879845300386746, "grad_norm": 0.11244107782840729, "learning_rate": 2e-07, "loss": 0.0208, "step": 663 }, { "clip_ratio/high_max": 0.0023181005235528573, "clip_ratio/high_mean": 0.0009890048550005304, "clip_ratio/low_mean": 0.0007194268600869691, "clip_ratio/low_min": 6.873962593090255e-05, "clip_ratio/region_mean": 0.0017084317405533511, "epoch": 0.06197317840038733, "grad_norm": 0.11132694035768509, "learning_rate": 2e-07, "loss": -0.006, "step": 664 }, { "clip_ratio/high_max": 0.0022057903952372726, "clip_ratio/high_mean": 0.0009104003856919007, "clip_ratio/low_mean": 0.0007517829808421084, "clip_ratio/low_min": 7.970226397446822e-05, "clip_ratio/region_mean": 0.0016621834110992495, "epoch": 0.062066511500387916, "grad_norm": 0.1246526911854744, "learning_rate": 2e-07, "loss": -0.0175, "step": 665 }, { "clip_ratio/high_max": 0.001722380387946032, "clip_ratio/high_mean": 0.0007433621231029974, "clip_ratio/low_mean": 0.0007235482062242227, "clip_ratio/low_min": 4.8755345233075786e-05, "clip_ratio/region_mean": 0.0014669103038613684, "epoch": 0.0621598446003885, "grad_norm": 0.11363562196493149, "learning_rate": 2e-07, "loss": 0.0462, "step": 666 }, { "clip_ratio/high_max": 0.0022754080782760866, "clip_ratio/high_mean": 0.0008880047953425674, "clip_ratio/low_mean": 0.0008061302105488721, "clip_ratio/low_min": 8.244989112426993e-05, "clip_ratio/region_mean": 0.0016941349749686196, "epoch": 0.06225317770038908, "grad_norm": 0.10238362103700638, "learning_rate": 2e-07, "loss": 0.0171, "step": 667 }, { "clip_ratio/high_max": 0.001922552786709275, "clip_ratio/high_mean": 0.0008415329175477382, "clip_ratio/low_mean": 0.0008048155577853322, "clip_ratio/low_min": 4.667443499783985e-05, "clip_ratio/region_mean": 0.001646348464419134, "epoch": 0.062346510800389665, "grad_norm": 0.12019217759370804, "learning_rate": 2e-07, "loss": 0.0399, "step": 668 }, { "clip_ratio/high_max": 0.0019338492638780735, "clip_ratio/high_mean": 0.0008118976547848433, "clip_ratio/low_mean": 0.0008130748065013904, "clip_ratio/low_min": 0.00011061070836149156, "clip_ratio/region_mean": 0.0016249724321824033, "epoch": 0.06243984390039025, "grad_norm": 0.11617182195186615, "learning_rate": 2e-07, "loss": 0.0676, "step": 669 }, { "clip_ratio/high_max": 0.001970074841665337, "clip_ratio/high_mean": 0.0008161072801158298, "clip_ratio/low_mean": 0.0007418236145895207, "clip_ratio/low_min": 9.477987259742804e-05, "clip_ratio/region_mean": 0.0015579309038002975, "epoch": 0.06253317700039084, "grad_norm": 0.1118164211511612, "learning_rate": 2e-07, "loss": 0.0076, "step": 670 }, { "clip_ratio/high_max": 0.0022078778383729514, "clip_ratio/high_mean": 0.0008189249629140249, "clip_ratio/low_mean": 0.0008190792505047284, "clip_ratio/low_min": 9.686923658591695e-05, "clip_ratio/region_mean": 0.001638004232518142, "epoch": 0.06262651010039141, "grad_norm": 0.1153862401843071, "learning_rate": 2e-07, "loss": 0.0533, "step": 671 }, { "clip_ratio/high_max": 0.0021105991763761267, "clip_ratio/high_mean": 0.0008977356774266809, "clip_ratio/low_mean": 0.0008365056110051228, "clip_ratio/low_min": 9.843691987043712e-05, "clip_ratio/region_mean": 0.0017342412684229203, "epoch": 0.062719843200392, "grad_norm": 0.12080097943544388, "learning_rate": 2e-07, "loss": 0.0235, "step": 672 }, { "clip_ratio/high_max": 0.0018591475381981581, "clip_ratio/high_mean": 0.000907747627934441, "clip_ratio/low_mean": 0.0008816120189294452, "clip_ratio/low_min": 4.138876738579711e-05, "clip_ratio/region_mean": 0.0017893596887006424, "epoch": 0.06281317630039258, "grad_norm": 0.11238964647054672, "learning_rate": 2e-07, "loss": 0.03, "step": 673 }, { "clip_ratio/high_max": 0.002198485854023602, "clip_ratio/high_mean": 0.0008619735926913563, "clip_ratio/low_mean": 0.0007446933996106964, "clip_ratio/low_min": 2.3953436539159156e-05, "clip_ratio/region_mean": 0.0016066669777501374, "epoch": 0.06290650940039316, "grad_norm": 0.11121684312820435, "learning_rate": 2e-07, "loss": -0.0013, "step": 674 }, { "clip_ratio/high_max": 0.0022081065690144897, "clip_ratio/high_mean": 0.0009590811987436609, "clip_ratio/low_mean": 0.0008918706680560717, "clip_ratio/low_min": 8.814583543426124e-05, "clip_ratio/region_mean": 0.0018509518558857962, "epoch": 0.06299984250039375, "grad_norm": 0.12158425152301788, "learning_rate": 2e-07, "loss": 0.0001, "step": 675 }, { "clip_ratio/high_max": 0.001971314191905549, "clip_ratio/high_mean": 0.0008239938542828895, "clip_ratio/low_mean": 0.0007418953618980595, "clip_ratio/low_min": 3.5529345041140914e-05, "clip_ratio/region_mean": 0.001565889200719539, "epoch": 0.06309317560039433, "grad_norm": 0.10652816295623779, "learning_rate": 2e-07, "loss": 0.0523, "step": 676 }, { "clip_ratio/high_max": 0.002273922764288727, "clip_ratio/high_mean": 0.000976095994701609, "clip_ratio/low_mean": 0.0008085730387392687, "clip_ratio/low_min": 6.183747473187395e-05, "clip_ratio/region_mean": 0.0017846690134319942, "epoch": 0.06318650870039491, "grad_norm": 0.11928242444992065, "learning_rate": 2e-07, "loss": 0.0045, "step": 677 }, { "clip_ratio/high_max": 0.001818718301365152, "clip_ratio/high_mean": 0.0008516119178239023, "clip_ratio/low_mean": 0.0009140529000433162, "clip_ratio/low_min": 8.679845723236213e-05, "clip_ratio/region_mean": 0.0017656648778938688, "epoch": 0.0632798418003955, "grad_norm": 0.11051196604967117, "learning_rate": 2e-07, "loss": 0.0404, "step": 678 }, { "clip_ratio/high_max": 0.0025029404714587145, "clip_ratio/high_mean": 0.0009113033302128315, "clip_ratio/low_mean": 0.000846155766339507, "clip_ratio/low_min": 8.384710054087918e-05, "clip_ratio/region_mean": 0.0017574590528965928, "epoch": 0.06337317490039608, "grad_norm": 0.11238579452037811, "learning_rate": 2e-07, "loss": 0.01, "step": 679 }, { "clip_ratio/high_max": 0.002255398198030889, "clip_ratio/high_mean": 0.0008779307499935385, "clip_ratio/low_mean": 0.0007215602072392358, "clip_ratio/low_min": 4.401815567689482e-05, "clip_ratio/region_mean": 0.0015994909626897424, "epoch": 0.06346650800039666, "grad_norm": 0.11776664108037949, "learning_rate": 2e-07, "loss": -0.0106, "step": 680 }, { "clip_ratio/high_max": 0.0020852311317867134, "clip_ratio/high_mean": 0.0008095555831459933, "clip_ratio/low_mean": 0.0008922283241190598, "clip_ratio/low_min": 2.9339832508412655e-05, "clip_ratio/region_mean": 0.0017017839127220213, "epoch": 0.06355984110039725, "grad_norm": 0.12046264857053757, "learning_rate": 2e-07, "loss": 0.0489, "step": 681 }, { "clip_ratio/high_max": 0.002202571682573762, "clip_ratio/high_mean": 0.0009196183509629918, "clip_ratio/low_mean": 0.0008421338170592207, "clip_ratio/low_min": 7.011147226876346e-05, "clip_ratio/region_mean": 0.0017617521953070536, "epoch": 0.06365317420039783, "grad_norm": 0.1198941320180893, "learning_rate": 2e-07, "loss": 0.0295, "step": 682 }, { "clip_ratio/high_max": 0.0020623937125492375, "clip_ratio/high_mean": 0.0008958043836173601, "clip_ratio/low_mean": 0.000874515317264013, "clip_ratio/low_min": 7.926149464765331e-05, "clip_ratio/region_mean": 0.001770319686329458, "epoch": 0.06374650730039842, "grad_norm": 0.11256197094917297, "learning_rate": 2e-07, "loss": 0.0562, "step": 683 }, { "clip_ratio/high_max": 0.0021881583161302842, "clip_ratio/high_mean": 0.0009091709725908004, "clip_ratio/low_mean": 0.0008887479234545026, "clip_ratio/low_min": 4.9391591346648056e-05, "clip_ratio/region_mean": 0.001797918856027536, "epoch": 0.063839840400399, "grad_norm": 0.11190496385097504, "learning_rate": 2e-07, "loss": 0.027, "step": 684 }, { "clip_ratio/high_max": 0.0020117362946621142, "clip_ratio/high_mean": 0.000834682659842656, "clip_ratio/low_mean": 0.000788765040852013, "clip_ratio/low_min": 2.8463020498747937e-05, "clip_ratio/region_mean": 0.0016234476570389234, "epoch": 0.06393317350039958, "grad_norm": 0.12317820638418198, "learning_rate": 2e-07, "loss": 0.0203, "step": 685 }, { "clip_ratio/high_max": 0.0020931546641804744, "clip_ratio/high_mean": 0.000868763550897711, "clip_ratio/low_mean": 0.0008086914567684289, "clip_ratio/low_min": 0.00012224825695739128, "clip_ratio/region_mean": 0.001677455053140875, "epoch": 0.06402650660040017, "grad_norm": 0.1088864728808403, "learning_rate": 2e-07, "loss": 0.021, "step": 686 }, { "clip_ratio/high_max": 0.002222632960183546, "clip_ratio/high_mean": 0.0009545270531816641, "clip_ratio/low_mean": 0.0006916437851032242, "clip_ratio/low_min": 8.403605988860363e-05, "clip_ratio/region_mean": 0.0016461708437418565, "epoch": 0.06411983970040075, "grad_norm": 0.10864903032779694, "learning_rate": 2e-07, "loss": 0.0287, "step": 687 }, { "clip_ratio/high_max": 0.002169072162359953, "clip_ratio/high_mean": 0.0009225530229741707, "clip_ratio/low_mean": 0.0008662963973620208, "clip_ratio/low_min": 7.758977699268144e-05, "clip_ratio/region_mean": 0.0017888494112412445, "epoch": 0.06421317280040133, "grad_norm": 0.12108906358480453, "learning_rate": 2e-07, "loss": -0.0005, "step": 688 }, { "clip_ratio/high_max": 0.0021790128157590516, "clip_ratio/high_mean": 0.0009453333477722481, "clip_ratio/low_mean": 0.0008091359759418992, "clip_ratio/low_min": 3.614653087424813e-05, "clip_ratio/region_mean": 0.0017544693109812215, "epoch": 0.06430650590040192, "grad_norm": 0.12314426153898239, "learning_rate": 2e-07, "loss": 0.0061, "step": 689 }, { "clip_ratio/high_max": 0.002089945373882074, "clip_ratio/high_mean": 0.0008195294303732226, "clip_ratio/low_mean": 0.0008871048266883008, "clip_ratio/low_min": 8.112131854431937e-05, "clip_ratio/region_mean": 0.001706634218862746, "epoch": 0.0643998390004025, "grad_norm": 0.1125098392367363, "learning_rate": 2e-07, "loss": 0.0306, "step": 690 }, { "clip_ratio/high_max": 0.0016941306566877756, "clip_ratio/high_mean": 0.0007549089805252152, "clip_ratio/low_mean": 0.0008668644331919495, "clip_ratio/low_min": 6.75136061545345e-05, "clip_ratio/region_mean": 0.0016217734773817938, "epoch": 0.06449317210040308, "grad_norm": 0.11180693656206131, "learning_rate": 2e-07, "loss": 0.0579, "step": 691 }, { "clip_ratio/high_max": 0.0018474619209882803, "clip_ratio/high_mean": 0.0008112750001600944, "clip_ratio/low_mean": 0.0008431081660091877, "clip_ratio/low_min": 8.205249469028786e-05, "clip_ratio/region_mean": 0.0016543831261515152, "epoch": 0.06458650520040367, "grad_norm": 0.1175006553530693, "learning_rate": 2e-07, "loss": 0.0744, "step": 692 }, { "clip_ratio/high_max": 0.002112087320710998, "clip_ratio/high_mean": 0.0008698218989593443, "clip_ratio/low_mean": 0.0008978481091617141, "clip_ratio/low_min": 0.00011891856047441252, "clip_ratio/region_mean": 0.0017676699899311643, "epoch": 0.06467983830040425, "grad_norm": 0.12457312643527985, "learning_rate": 2e-07, "loss": 0.034, "step": 693 }, { "clip_ratio/high_max": 0.002470169529260602, "clip_ratio/high_mean": 0.001007330371066928, "clip_ratio/low_mean": 0.0007057065886328928, "clip_ratio/low_min": 5.682592927769292e-05, "clip_ratio/region_mean": 0.0017130369451479055, "epoch": 0.06477317140040484, "grad_norm": 0.1150871217250824, "learning_rate": 2e-07, "loss": -0.0344, "step": 694 }, { "clip_ratio/high_max": 0.002407417072390672, "clip_ratio/high_mean": 0.000966824904025998, "clip_ratio/low_mean": 0.0007456965031451546, "clip_ratio/low_min": 5.397236600401811e-05, "clip_ratio/region_mean": 0.0017125213853432797, "epoch": 0.06486650450040542, "grad_norm": 0.11348842829465866, "learning_rate": 2e-07, "loss": 0.015, "step": 695 }, { "clip_ratio/high_max": 0.0018829534237738699, "clip_ratio/high_mean": 0.0007628092789673246, "clip_ratio/low_mean": 0.0009712351456983015, "clip_ratio/low_min": 0.00013904784736951115, "clip_ratio/region_mean": 0.0017340444246656261, "epoch": 0.064959837600406, "grad_norm": 0.11851639300584793, "learning_rate": 2e-07, "loss": 0.0684, "step": 696 }, { "clip_ratio/high_max": 0.0020882356802758295, "clip_ratio/high_mean": 0.0007848074073990574, "clip_ratio/low_mean": 0.0009016389121825341, "clip_ratio/low_min": 7.932118205644656e-05, "clip_ratio/region_mean": 0.0016864463250385597, "epoch": 0.06505317070040659, "grad_norm": 0.11063860356807709, "learning_rate": 2e-07, "loss": 0.0191, "step": 697 }, { "clip_ratio/high_max": 0.0023747993691358715, "clip_ratio/high_mean": 0.0009586257037881296, "clip_ratio/low_mean": 0.000773739655414829, "clip_ratio/low_min": 3.229265075788135e-05, "clip_ratio/region_mean": 0.0017323653737548739, "epoch": 0.06514650380040717, "grad_norm": 0.11639688163995743, "learning_rate": 2e-07, "loss": 0.0184, "step": 698 }, { "clip_ratio/high_max": 0.002161511860322207, "clip_ratio/high_mean": 0.0008622648965683766, "clip_ratio/low_mean": 0.0009410165694134776, "clip_ratio/low_min": 7.350067971856333e-05, "clip_ratio/region_mean": 0.0018032814550679177, "epoch": 0.06523983690040774, "grad_norm": 0.11240983754396439, "learning_rate": 2e-07, "loss": 0.0162, "step": 699 }, { "clip_ratio/high_max": 0.0019992219749838114, "clip_ratio/high_mean": 0.0008674803011672338, "clip_ratio/low_mean": 0.0008064955381996697, "clip_ratio/low_min": 7.586130413983483e-05, "clip_ratio/region_mean": 0.0016739758575567976, "epoch": 0.06533317000040834, "grad_norm": 0.11679087579250336, "learning_rate": 2e-07, "loss": 0.0308, "step": 700 }, { "clip_ratio/high_max": 0.002081599919620203, "clip_ratio/high_mean": 0.000852947245221003, "clip_ratio/low_mean": 0.0008464762941002846, "clip_ratio/low_min": 6.472763197962195e-05, "clip_ratio/region_mean": 0.0016994235338643193, "epoch": 0.06542650310040891, "grad_norm": 0.11153484135866165, "learning_rate": 2e-07, "loss": 0.0154, "step": 701 }, { "clip_ratio/high_max": 0.002044341315922793, "clip_ratio/high_mean": 0.0009151527774520218, "clip_ratio/low_mean": 0.0009166164236376062, "clip_ratio/low_min": 0.00015281202740879962, "clip_ratio/region_mean": 0.0018317691865377128, "epoch": 0.06551983620040949, "grad_norm": 0.11806044727563858, "learning_rate": 2e-07, "loss": 0.0165, "step": 702 }, { "clip_ratio/high_max": 0.0021720466465922073, "clip_ratio/high_mean": 0.0008007766300579533, "clip_ratio/low_mean": 0.0007988253018993419, "clip_ratio/low_min": 3.4576312827994116e-05, "clip_ratio/region_mean": 0.0015996019319572952, "epoch": 0.06561316930041008, "grad_norm": 0.1329117715358734, "learning_rate": 2e-07, "loss": 0.0451, "step": 703 }, { "clip_ratio/high_max": 0.0020285205828258768, "clip_ratio/high_mean": 0.0009091887222894002, "clip_ratio/low_mean": 0.0008204034547816264, "clip_ratio/low_min": 0.00013054705596005078, "clip_ratio/region_mean": 0.0017295921497861855, "epoch": 0.06570650240041066, "grad_norm": 0.1148393526673317, "learning_rate": 2e-07, "loss": -0.0047, "step": 704 }, { "clip_ratio/high_max": 0.002228978424682282, "clip_ratio/high_mean": 0.0009214368365064729, "clip_ratio/low_mean": 0.0009225524663634133, "clip_ratio/low_min": 0.0002044902794295922, "clip_ratio/region_mean": 0.0018439892737660557, "epoch": 0.06579983550041126, "grad_norm": 0.12470487505197525, "learning_rate": 2e-07, "loss": 0.0345, "step": 705 }, { "clip_ratio/high_max": 0.0025448336891713552, "clip_ratio/high_mean": 0.0010366965034336317, "clip_ratio/low_mean": 0.0008257633435277967, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0018624598378664814, "epoch": 0.06589316860041183, "grad_norm": 0.15635575354099274, "learning_rate": 2e-07, "loss": -0.0039, "step": 706 }, { "clip_ratio/high_max": 0.0021615631849272177, "clip_ratio/high_mean": 0.0008788000068307156, "clip_ratio/low_mean": 0.0009164421426248737, "clip_ratio/low_min": 7.856956244722824e-05, "clip_ratio/region_mean": 0.0017952421330846846, "epoch": 0.06598650170041241, "grad_norm": 0.10381249338388443, "learning_rate": 2e-07, "loss": 0.0344, "step": 707 }, { "clip_ratio/high_max": 0.002216930493887048, "clip_ratio/high_mean": 0.0008634622754470911, "clip_ratio/low_mean": 0.000862828401295701, "clip_ratio/low_min": 5.020934531785315e-05, "clip_ratio/region_mean": 0.001726290662190877, "epoch": 0.066079834800413, "grad_norm": 0.11977564543485641, "learning_rate": 2e-07, "loss": 0.0307, "step": 708 }, { "clip_ratio/high_max": 0.0022222168372536544, "clip_ratio/high_mean": 0.0009323892863903893, "clip_ratio/low_mean": 0.0008921621338231489, "clip_ratio/low_min": 5.9140818848391064e-05, "clip_ratio/region_mean": 0.0018245514002046548, "epoch": 0.06617316790041358, "grad_norm": 0.12228800356388092, "learning_rate": 2e-07, "loss": 0.0385, "step": 709 }, { "clip_ratio/high_max": 0.0017733751083142124, "clip_ratio/high_mean": 0.0007875870542193297, "clip_ratio/low_mean": 0.0010265787932439707, "clip_ratio/low_min": 7.791920870658942e-05, "clip_ratio/region_mean": 0.0018141658438253216, "epoch": 0.06626650100041416, "grad_norm": 0.1150774359703064, "learning_rate": 2e-07, "loss": 0.0457, "step": 710 }, { "clip_ratio/high_max": 0.0017806248652050272, "clip_ratio/high_mean": 0.0007395404736598721, "clip_ratio/low_mean": 0.0009387073332618456, "clip_ratio/low_min": 5.177752245799638e-05, "clip_ratio/region_mean": 0.0016782477832748555, "epoch": 0.06635983410041475, "grad_norm": 0.17688456177711487, "learning_rate": 2e-07, "loss": 0.1088, "step": 711 }, { "clip_ratio/high_max": 0.0019820799498120323, "clip_ratio/high_mean": 0.0008600428482168354, "clip_ratio/low_mean": 0.0008501248739776202, "clip_ratio/low_min": 8.499159594066441e-05, "clip_ratio/region_mean": 0.0017101677076425403, "epoch": 0.06645316720041533, "grad_norm": 0.11207538843154907, "learning_rate": 2e-07, "loss": 0.0308, "step": 712 }, { "clip_ratio/high_max": 0.0021238459266896825, "clip_ratio/high_mean": 0.0008535132838005666, "clip_ratio/low_mean": 0.001046808967657853, "clip_ratio/low_min": 0.00013002192736166762, "clip_ratio/region_mean": 0.0019003222478204407, "epoch": 0.06654650030041591, "grad_norm": 0.12009285390377045, "learning_rate": 2e-07, "loss": 0.0595, "step": 713 }, { "clip_ratio/high_max": 0.0023175162423285656, "clip_ratio/high_mean": 0.001047347210260341, "clip_ratio/low_mean": 0.0008378422171517741, "clip_ratio/low_min": 9.342610337625956e-05, "clip_ratio/region_mean": 0.001885189391032327, "epoch": 0.0666398334004165, "grad_norm": 0.1148824393749237, "learning_rate": 2e-07, "loss": 0.0242, "step": 714 }, { "clip_ratio/high_max": 0.0023664085056225304, "clip_ratio/high_mean": 0.0008393244370381581, "clip_ratio/low_mean": 0.0009190603595925495, "clip_ratio/low_min": 0.00013298190879140748, "clip_ratio/region_mean": 0.0017583848093636334, "epoch": 0.06673316650041708, "grad_norm": 0.12180853635072708, "learning_rate": 2e-07, "loss": 0.0365, "step": 715 }, { "clip_ratio/high_max": 0.0018710716831265017, "clip_ratio/high_mean": 0.0007821640774636762, "clip_ratio/low_mean": 0.0008545887885702541, "clip_ratio/low_min": 2.1312996977940202e-05, "clip_ratio/region_mean": 0.001636752873309888, "epoch": 0.06682649960041767, "grad_norm": 0.11269804835319519, "learning_rate": 2e-07, "loss": 0.0508, "step": 716 }, { "clip_ratio/high_max": 0.0022945914315641858, "clip_ratio/high_mean": 0.0009172579902951838, "clip_ratio/low_mean": 0.000992382087133592, "clip_ratio/low_min": 0.00012047116160829319, "clip_ratio/region_mean": 0.001909640101075638, "epoch": 0.06691983270041825, "grad_norm": 0.11313951760530472, "learning_rate": 2e-07, "loss": 0.0234, "step": 717 }, { "clip_ratio/high_max": 0.001972037454834208, "clip_ratio/high_mean": 0.0009391573639732087, "clip_ratio/low_mean": 0.0008576384680054616, "clip_ratio/low_min": 3.053646560147172e-05, "clip_ratio/region_mean": 0.0017967958046938293, "epoch": 0.06701316580041883, "grad_norm": 0.1067579984664917, "learning_rate": 2e-07, "loss": -0.0248, "step": 718 }, { "clip_ratio/high_max": 0.001900318053230876, "clip_ratio/high_mean": 0.0008600979490438476, "clip_ratio/low_mean": 0.0009095592649828177, "clip_ratio/low_min": 0.00010968286096613156, "clip_ratio/region_mean": 0.0017696572103886865, "epoch": 0.06710649890041942, "grad_norm": 0.11289706081151962, "learning_rate": 2e-07, "loss": 0.0329, "step": 719 }, { "clip_ratio/high_max": 0.001627892575925216, "clip_ratio/high_mean": 0.0007271597596627544, "clip_ratio/low_mean": 0.0008214818526539602, "clip_ratio/low_min": 0.00011580747832340421, "clip_ratio/region_mean": 0.001548641623230651, "epoch": 0.06719983200042, "grad_norm": 0.1185273751616478, "learning_rate": 2e-07, "loss": 0.0232, "step": 720 }, { "clip_ratio/high_max": 0.0025091104325838387, "clip_ratio/high_mean": 0.001004717472824268, "clip_ratio/low_mean": 0.0010284751497238176, "clip_ratio/low_min": 0.00013612890234071529, "clip_ratio/region_mean": 0.002033192584349308, "epoch": 0.06729316510042058, "grad_norm": 0.12472806870937347, "learning_rate": 2e-07, "loss": 0.0441, "step": 721 }, { "clip_ratio/high_max": 0.0021003730144002475, "clip_ratio/high_mean": 0.0009572078815835994, "clip_ratio/low_mean": 0.0008839241345413029, "clip_ratio/low_min": 0.0001134941958298441, "clip_ratio/region_mean": 0.0018411320488667116, "epoch": 0.06738649820042117, "grad_norm": 0.11459222435951233, "learning_rate": 2e-07, "loss": -0.0066, "step": 722 }, { "clip_ratio/high_max": 0.002506335797079373, "clip_ratio/high_mean": 0.0010977315942000132, "clip_ratio/low_mean": 0.0008580103731219424, "clip_ratio/low_min": 4.105770585738355e-05, "clip_ratio/region_mean": 0.0019557419582270086, "epoch": 0.06747983130042175, "grad_norm": 0.12623362243175507, "learning_rate": 2e-07, "loss": 0.0222, "step": 723 }, { "clip_ratio/high_max": 0.002190314407926053, "clip_ratio/high_mean": 0.0009012124301079893, "clip_ratio/low_mean": 0.0009357231956528267, "clip_ratio/low_min": 3.7644071198883466e-05, "clip_ratio/region_mean": 0.001836935589381028, "epoch": 0.06757316440042234, "grad_norm": 0.1150001585483551, "learning_rate": 2e-07, "loss": 0.0676, "step": 724 }, { "clip_ratio/high_max": 0.002078385296044871, "clip_ratio/high_mean": 0.0008824624164844863, "clip_ratio/low_mean": 0.0009405448854522547, "clip_ratio/low_min": 6.518939244415378e-05, "clip_ratio/region_mean": 0.0018230072964797728, "epoch": 0.06766649750042292, "grad_norm": 0.12104333937168121, "learning_rate": 2e-07, "loss": 0.0194, "step": 725 }, { "clip_ratio/high_max": 0.002160909352824092, "clip_ratio/high_mean": 0.0009302425460191444, "clip_ratio/low_mean": 0.0009362047167087439, "clip_ratio/low_min": 0.00022817623266746523, "clip_ratio/region_mean": 0.0018664472590899095, "epoch": 0.0677598306004235, "grad_norm": 0.1236250102519989, "learning_rate": 2e-07, "loss": 0.0179, "step": 726 }, { "clip_ratio/high_max": 0.0019130986802338157, "clip_ratio/high_mean": 0.0008639747065899428, "clip_ratio/low_mean": 0.0008459764922008617, "clip_ratio/low_min": 8.590639481553808e-05, "clip_ratio/region_mean": 0.0017099512333516032, "epoch": 0.06785316370042409, "grad_norm": 0.10899059474468231, "learning_rate": 2e-07, "loss": 0.0192, "step": 727 }, { "clip_ratio/high_max": 0.0020576702154357918, "clip_ratio/high_mean": 0.0009057469214894809, "clip_ratio/low_mean": 0.001013988734484883, "clip_ratio/low_min": 0.00022528200770466356, "clip_ratio/region_mean": 0.0019197357032680884, "epoch": 0.06794649680042467, "grad_norm": 0.11812598258256912, "learning_rate": 2e-07, "loss": 0.02, "step": 728 }, { "clip_ratio/high_max": 0.001882033142464934, "clip_ratio/high_mean": 0.0008616699533376959, "clip_ratio/low_mean": 0.0008443151555184158, "clip_ratio/low_min": 6.502476480818586e-05, "clip_ratio/region_mean": 0.0017059850979421753, "epoch": 0.06803982990042524, "grad_norm": 0.10649298131465912, "learning_rate": 2e-07, "loss": 0.0175, "step": 729 }, { "clip_ratio/high_max": 0.0019728978659259155, "clip_ratio/high_mean": 0.0008461367979180068, "clip_ratio/low_mean": 0.0008904438618628774, "clip_ratio/low_min": 0.00011251856903982116, "clip_ratio/region_mean": 0.0017365806561429054, "epoch": 0.06813316300042584, "grad_norm": 0.11021938174962997, "learning_rate": 2e-07, "loss": 0.0409, "step": 730 }, { "clip_ratio/high_max": 0.0021869997508474626, "clip_ratio/high_mean": 0.0008697310731804464, "clip_ratio/low_mean": 0.0008457896092295414, "clip_ratio/low_min": 0.00012011953913315665, "clip_ratio/region_mean": 0.0017155206805909984, "epoch": 0.06822649610042641, "grad_norm": 0.12389024347066879, "learning_rate": 2e-07, "loss": 0.0427, "step": 731 }, { "clip_ratio/high_max": 0.0022479001054307446, "clip_ratio/high_mean": 0.0008328508811246138, "clip_ratio/low_mean": 0.0008902785812097136, "clip_ratio/low_min": 2.1662051040038932e-05, "clip_ratio/region_mean": 0.0017231294841622002, "epoch": 0.06831982920042699, "grad_norm": 0.11572396755218506, "learning_rate": 2e-07, "loss": 0.0185, "step": 732 }, { "clip_ratio/high_max": 0.002065587257675361, "clip_ratio/high_mean": 0.0009545866487314925, "clip_ratio/low_mean": 0.0009328608357463963, "clip_ratio/low_min": 9.97515489871148e-05, "clip_ratio/region_mean": 0.001887447462650016, "epoch": 0.06841316230042759, "grad_norm": 0.11197543889284134, "learning_rate": 2e-07, "loss": 0.0228, "step": 733 }, { "clip_ratio/high_max": 0.001878383965959074, "clip_ratio/high_mean": 0.0007418678633257514, "clip_ratio/low_mean": 0.000992299184872536, "clip_ratio/low_min": 0.00014046389514987823, "clip_ratio/region_mean": 0.0017341670900350437, "epoch": 0.06850649540042816, "grad_norm": 0.17135785520076752, "learning_rate": 2e-07, "loss": 0.07, "step": 734 }, { "clip_ratio/high_max": 0.0019266775925643742, "clip_ratio/high_mean": 0.0007866799714975059, "clip_ratio/low_mean": 0.0009148485041805543, "clip_ratio/low_min": 0.00020009678110000095, "clip_ratio/region_mean": 0.0017015284829540178, "epoch": 0.06859982850042876, "grad_norm": 0.11963098496198654, "learning_rate": 2e-07, "loss": 0.0284, "step": 735 }, { "clip_ratio/high_max": 0.0021162900229683146, "clip_ratio/high_mean": 0.0008298033371829661, "clip_ratio/low_mean": 0.0009440252651984338, "clip_ratio/low_min": 9.66167135629803e-05, "clip_ratio/region_mean": 0.001773828553268686, "epoch": 0.06869316160042933, "grad_norm": 0.11108630895614624, "learning_rate": 2e-07, "loss": 0.0187, "step": 736 }, { "clip_ratio/high_max": 0.0022498252728837542, "clip_ratio/high_mean": 0.0008797802038316149, "clip_ratio/low_mean": 0.0009930819396686275, "clip_ratio/low_min": 0.00010114498854818521, "clip_ratio/region_mean": 0.0018728621580521576, "epoch": 0.06878649470042991, "grad_norm": 0.11905164271593094, "learning_rate": 2e-07, "loss": 0.0745, "step": 737 }, { "clip_ratio/high_max": 0.0017428310311515816, "clip_ratio/high_mean": 0.0007454080023308052, "clip_ratio/low_mean": 0.0008469142230751459, "clip_ratio/low_min": 0.00011297363562334795, "clip_ratio/region_mean": 0.0015923221944831312, "epoch": 0.0688798278004305, "grad_norm": 0.1111283153295517, "learning_rate": 2e-07, "loss": 0.025, "step": 738 }, { "clip_ratio/high_max": 0.0019911056660930626, "clip_ratio/high_mean": 0.0009044735943462001, "clip_ratio/low_mean": 0.0009426217520740465, "clip_ratio/low_min": 0.00014444810949498788, "clip_ratio/region_mean": 0.0018470953291398473, "epoch": 0.06897316090043108, "grad_norm": 0.1140967607498169, "learning_rate": 2e-07, "loss": 0.0284, "step": 739 }, { "clip_ratio/high_max": 0.0023734492060611956, "clip_ratio/high_mean": 0.0008955471043918806, "clip_ratio/low_mean": 0.0007816377237759298, "clip_ratio/low_min": 1.6835016140248626e-05, "clip_ratio/region_mean": 0.0016771848349890206, "epoch": 0.06906649400043166, "grad_norm": 0.1195204108953476, "learning_rate": 2e-07, "loss": -0.0384, "step": 740 }, { "clip_ratio/high_max": 0.001963869322935352, "clip_ratio/high_mean": 0.0008524227559973951, "clip_ratio/low_mean": 0.0010128797766810749, "clip_ratio/low_min": 7.881188503233716e-05, "clip_ratio/region_mean": 0.0018653024890227243, "epoch": 0.06915982710043225, "grad_norm": 0.1177157387137413, "learning_rate": 2e-07, "loss": 0.0027, "step": 741 }, { "clip_ratio/high_max": 0.0022743974514014553, "clip_ratio/high_mean": 0.0009050069347722456, "clip_ratio/low_mean": 0.0007918814899312565, "clip_ratio/low_min": 0.00011168578384967986, "clip_ratio/region_mean": 0.0016968884010566399, "epoch": 0.06925316020043283, "grad_norm": 0.1124471127986908, "learning_rate": 2e-07, "loss": -0.0015, "step": 742 }, { "clip_ratio/high_max": 0.0023312706834985875, "clip_ratio/high_mean": 0.0009307631808042061, "clip_ratio/low_mean": 0.0009224760706274537, "clip_ratio/low_min": 7.910745807748754e-05, "clip_ratio/region_mean": 0.0018532393005443737, "epoch": 0.06934649330043341, "grad_norm": 0.12191157788038254, "learning_rate": 2e-07, "loss": 0.0455, "step": 743 }, { "clip_ratio/high_max": 0.002409063759841956, "clip_ratio/high_mean": 0.0010149744121008553, "clip_ratio/low_mean": 0.0007499483090214198, "clip_ratio/low_min": 4.060786341142375e-05, "clip_ratio/region_mean": 0.0017649226720095612, "epoch": 0.069439826400434, "grad_norm": 0.11714068055152893, "learning_rate": 2e-07, "loss": -0.0289, "step": 744 }, { "clip_ratio/high_max": 0.002355433545744745, "clip_ratio/high_mean": 0.0009446828717045719, "clip_ratio/low_mean": 0.0008667201163916616, "clip_ratio/low_min": 7.820624159649014e-05, "clip_ratio/region_mean": 0.001811402995372191, "epoch": 0.06953315950043458, "grad_norm": 0.11103984713554382, "learning_rate": 2e-07, "loss": 0.0088, "step": 745 }, { "clip_ratio/high_max": 0.002212938830780331, "clip_ratio/high_mean": 0.0009228865928889718, "clip_ratio/low_mean": 0.0008818378555588424, "clip_ratio/low_min": 0.0001661954702285584, "clip_ratio/region_mean": 0.001804724452085793, "epoch": 0.06962649260043517, "grad_norm": 0.1162828877568245, "learning_rate": 2e-07, "loss": 0.0217, "step": 746 }, { "clip_ratio/high_max": 0.002329253555217292, "clip_ratio/high_mean": 0.0009723975636006799, "clip_ratio/low_mean": 0.0008930267231335165, "clip_ratio/low_min": 4.6486876271956135e-05, "clip_ratio/region_mean": 0.0018654242703632917, "epoch": 0.06971982570043575, "grad_norm": 0.11526258289813995, "learning_rate": 2e-07, "loss": 0.0001, "step": 747 }, { "clip_ratio/high_max": 0.0021571044126176275, "clip_ratio/high_mean": 0.0009515761157672387, "clip_ratio/low_mean": 0.0009640668122301577, "clip_ratio/low_min": 0.0001224556708621094, "clip_ratio/region_mean": 0.0019156428825226612, "epoch": 0.06981315880043633, "grad_norm": 0.10905270278453827, "learning_rate": 2e-07, "loss": 0.0089, "step": 748 }, { "clip_ratio/high_max": 0.0022246990447456483, "clip_ratio/high_mean": 0.0009498218969383743, "clip_ratio/low_mean": 0.0008899442254914902, "clip_ratio/low_min": 6.861019937787205e-05, "clip_ratio/region_mean": 0.0018397661551716737, "epoch": 0.06990649190043692, "grad_norm": 0.11899080127477646, "learning_rate": 2e-07, "loss": -0.0192, "step": 749 }, { "clip_ratio/high_max": 0.0019298111801617779, "clip_ratio/high_mean": 0.0008656012432766147, "clip_ratio/low_mean": 0.001014886433040374, "clip_ratio/low_min": 8.82513340911828e-05, "clip_ratio/region_mean": 0.0018804876672220416, "epoch": 0.0699998250004375, "grad_norm": 0.11136862635612488, "learning_rate": 2e-07, "loss": 0.0321, "step": 750 }, { "clip_ratio/high_max": 0.0020187934424029663, "clip_ratio/high_mean": 0.000896969111636281, "clip_ratio/low_mean": 0.001041161591274431, "clip_ratio/low_min": 0.00010871546874113847, "clip_ratio/region_mean": 0.0019381307647563517, "epoch": 0.07009315810043808, "grad_norm": 0.11871477961540222, "learning_rate": 2e-07, "loss": 0.0014, "step": 751 }, { "clip_ratio/high_max": 0.0019320468018122483, "clip_ratio/high_mean": 0.0008972299383458449, "clip_ratio/low_mean": 0.0009356309965369292, "clip_ratio/low_min": 6.975257656449685e-05, "clip_ratio/region_mean": 0.0018328609294258058, "epoch": 0.07018649120043867, "grad_norm": 0.11033106595277786, "learning_rate": 2e-07, "loss": 0.0386, "step": 752 }, { "clip_ratio/high_max": 0.002200088470999617, "clip_ratio/high_mean": 0.0010095337165694218, "clip_ratio/low_mean": 0.0010783316029119305, "clip_ratio/low_min": 0.00011663478107948322, "clip_ratio/region_mean": 0.002087865323119331, "epoch": 0.07027982430043925, "grad_norm": 0.12559662759304047, "learning_rate": 2e-07, "loss": 0.0233, "step": 753 }, { "clip_ratio/high_max": 0.0019773646927205846, "clip_ratio/high_mean": 0.0008177626605174737, "clip_ratio/low_mean": 0.0009762931113073137, "clip_ratio/low_min": 9.805459285416873e-05, "clip_ratio/region_mean": 0.0017940557663678192, "epoch": 0.07037315740043983, "grad_norm": 0.1201983094215393, "learning_rate": 2e-07, "loss": 0.0577, "step": 754 }, { "clip_ratio/high_max": 0.0025453485068283044, "clip_ratio/high_mean": 0.0009743473710841499, "clip_ratio/low_mean": 0.0008333201258210465, "clip_ratio/low_min": 8.023405916901538e-05, "clip_ratio/region_mean": 0.001807667526009027, "epoch": 0.07046649050044042, "grad_norm": 0.11247541010379791, "learning_rate": 2e-07, "loss": 0.0088, "step": 755 }, { "clip_ratio/high_max": 0.0021611853335343767, "clip_ratio/high_mean": 0.0008779607196629513, "clip_ratio/low_mean": 0.0010269088779750746, "clip_ratio/low_min": 6.551597743964521e-05, "clip_ratio/region_mean": 0.0019048696049139835, "epoch": 0.070559823600441, "grad_norm": 0.11212287843227386, "learning_rate": 2e-07, "loss": 0.0581, "step": 756 }, { "clip_ratio/high_max": 0.0023448791544069536, "clip_ratio/high_mean": 0.0009797515194804873, "clip_ratio/low_mean": 0.0008834284017211758, "clip_ratio/low_min": 0.00011036920659535099, "clip_ratio/region_mean": 0.0018631798884598538, "epoch": 0.07065315670044159, "grad_norm": 0.11847711354494095, "learning_rate": 2e-07, "loss": 0.0058, "step": 757 }, { "clip_ratio/high_max": 0.001902271767903585, "clip_ratio/high_mean": 0.0008421897073276341, "clip_ratio/low_mean": 0.0008874270770320436, "clip_ratio/low_min": 3.423310408834368e-05, "clip_ratio/region_mean": 0.0017296168007305823, "epoch": 0.07074648980044217, "grad_norm": 0.11571494489908218, "learning_rate": 2e-07, "loss": 0.0245, "step": 758 }, { "clip_ratio/high_max": 0.0023027062488836236, "clip_ratio/high_mean": 0.0009378148679388687, "clip_ratio/low_mean": 0.0008736145500733983, "clip_ratio/low_min": 4.6971411393315066e-05, "clip_ratio/region_mean": 0.0018114294507540762, "epoch": 0.07083982290044274, "grad_norm": 0.11439782381057739, "learning_rate": 2e-07, "loss": -0.002, "step": 759 }, { "clip_ratio/high_max": 0.0018527741412981413, "clip_ratio/high_mean": 0.0008256449127657106, "clip_ratio/low_mean": 0.0009732884172990452, "clip_ratio/low_min": 6.181068965815939e-05, "clip_ratio/region_mean": 0.0017989333209698088, "epoch": 0.07093315600044334, "grad_norm": 0.11378923803567886, "learning_rate": 2e-07, "loss": 0.0277, "step": 760 }, { "clip_ratio/high_max": 0.0016957177031144965, "clip_ratio/high_mean": 0.0007491546348319389, "clip_ratio/low_mean": 0.0008771952579991193, "clip_ratio/low_min": 8.114224328892305e-05, "clip_ratio/region_mean": 0.0016263498982880265, "epoch": 0.07102648910044392, "grad_norm": 0.1099378913640976, "learning_rate": 2e-07, "loss": 0.0104, "step": 761 }, { "clip_ratio/high_max": 0.0018984484122483991, "clip_ratio/high_mean": 0.0007875142491684528, "clip_ratio/low_mean": 0.0008903663565433817, "clip_ratio/low_min": 8.743663602217566e-05, "clip_ratio/region_mean": 0.0016778806129877921, "epoch": 0.0711198222004445, "grad_norm": 0.11020497232675552, "learning_rate": 2e-07, "loss": 0.0266, "step": 762 }, { "clip_ratio/high_max": 0.002502305382222403, "clip_ratio/high_mean": 0.0010114824272022815, "clip_ratio/low_mean": 0.0008947852511482779, "clip_ratio/low_min": 0.00011245607765886234, "clip_ratio/region_mean": 0.001906267716549337, "epoch": 0.07121315530044509, "grad_norm": 0.11607792228460312, "learning_rate": 2e-07, "loss": -0.0181, "step": 763 }, { "clip_ratio/high_max": 0.0020452847311389633, "clip_ratio/high_mean": 0.0008163719139702152, "clip_ratio/low_mean": 0.0010603377686493332, "clip_ratio/low_min": 9.414563828613609e-05, "clip_ratio/region_mean": 0.0018767096698866226, "epoch": 0.07130648840044566, "grad_norm": 0.11937215924263, "learning_rate": 2e-07, "loss": 0.029, "step": 764 }, { "clip_ratio/high_max": 0.0022216725774342194, "clip_ratio/high_mean": 0.0009963398661057, "clip_ratio/low_mean": 0.0009490548109170049, "clip_ratio/low_min": 6.010155448166188e-05, "clip_ratio/region_mean": 0.0019453946515568532, "epoch": 0.07139982150044624, "grad_norm": 0.12609019875526428, "learning_rate": 2e-07, "loss": -0.0051, "step": 765 }, { "clip_ratio/high_max": 0.0021355415956350043, "clip_ratio/high_mean": 0.0009356030241178814, "clip_ratio/low_mean": 0.0008936798312788596, "clip_ratio/low_min": 9.539840721117798e-05, "clip_ratio/region_mean": 0.001829282846301794, "epoch": 0.07149315460044683, "grad_norm": 0.11530712991952896, "learning_rate": 2e-07, "loss": 0.0146, "step": 766 }, { "clip_ratio/high_max": 0.00240807839873014, "clip_ratio/high_mean": 0.0010244719160255045, "clip_ratio/low_mean": 0.0008021351532079279, "clip_ratio/low_min": 6.404719079000643e-05, "clip_ratio/region_mean": 0.0018266070474055596, "epoch": 0.07158648770044741, "grad_norm": 0.11356697231531143, "learning_rate": 2e-07, "loss": -0.0252, "step": 767 }, { "clip_ratio/high_max": 0.0020306615806475747, "clip_ratio/high_mean": 0.0009128033489105292, "clip_ratio/low_mean": 0.0008606476822023978, "clip_ratio/low_min": 1.9154153051204048e-05, "clip_ratio/region_mean": 0.001773451076587662, "epoch": 0.071679820800448, "grad_norm": 0.11348698288202286, "learning_rate": 2e-07, "loss": -0.0364, "step": 768 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.01513671875, "completions/max_length": 4096.0, "completions/max_terminated_length": 4089.0, "completions/mean_length": 613.3158569335938, "completions/mean_terminated_length": 559.7891845703125, "completions/min_length": 3.0, "completions/min_terminated_length": 3.0, "epoch": 0.07177315390044858, "grad_norm": 0.11815542727708817, "learning_rate": 2e-07, "loss": 0.0359, "num_tokens": 570763057.0, "reward": 0.5616629719734192, "reward_std": 0.20617172122001648, "rewards/simpleverify_reward/mean": 0.5616629719734192, "rewards/simpleverify_reward/std": 0.4961852729320526, "step": 769 }, { "clip_ratio/high_max": 0.0018406135932309553, "clip_ratio/high_mean": 0.0008951789059210569, "clip_ratio/low_mean": 0.0005774876772193238, "clip_ratio/low_min": 3.470255705906311e-05, "clip_ratio/region_mean": 0.001472666575864423, "epoch": 0.07186648700044916, "grad_norm": 0.11962782591581345, "learning_rate": 2e-07, "loss": 0.0072, "step": 770 }, { "clip_ratio/high_max": 0.0023160294695117045, "clip_ratio/high_mean": 0.0009494787991570774, "clip_ratio/low_mean": 0.0005388381596276304, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.001488316964241676, "epoch": 0.07195982010044975, "grad_norm": 0.11105542629957199, "learning_rate": 2e-07, "loss": -0.0394, "step": 771 }, { "clip_ratio/high_max": 0.001954167859366862, "clip_ratio/high_mean": 0.000802307297817606, "clip_ratio/low_mean": 0.0005239310594333801, "clip_ratio/low_min": 4.9426314944867045e-05, "clip_ratio/region_mean": 0.0013262383654364385, "epoch": 0.07205315320045033, "grad_norm": 0.1073770821094513, "learning_rate": 2e-07, "loss": 0.0266, "step": 772 }, { "clip_ratio/high_max": 0.0020542793936328962, "clip_ratio/high_mean": 0.0008261467128249933, "clip_ratio/low_mean": 0.000629717735137092, "clip_ratio/low_min": 1.3376136848819442e-05, "clip_ratio/region_mean": 0.0014558644252247177, "epoch": 0.07214648630045091, "grad_norm": 0.1255156546831131, "learning_rate": 2e-07, "loss": 0.0216, "step": 773 }, { "clip_ratio/high_max": 0.0019543344897101633, "clip_ratio/high_mean": 0.0008676360776007641, "clip_ratio/low_mean": 0.000501413402162143, "clip_ratio/low_min": 8.451656867691781e-06, "clip_ratio/region_mean": 0.0013690494888578542, "epoch": 0.0722398194004515, "grad_norm": 0.10792669653892517, "learning_rate": 2e-07, "loss": 0.0116, "step": 774 }, { "clip_ratio/high_max": 0.00238672334671719, "clip_ratio/high_mean": 0.0008461753423034679, "clip_ratio/low_mean": 0.0006655327706539538, "clip_ratio/low_min": 3.055272918572882e-05, "clip_ratio/region_mean": 0.0015117081347852945, "epoch": 0.07233315250045208, "grad_norm": 0.11510008573532104, "learning_rate": 2e-07, "loss": 0.0085, "step": 775 }, { "clip_ratio/high_max": 0.002013993860600749, "clip_ratio/high_mean": 0.0008614347534603439, "clip_ratio/low_mean": 0.0005944693311903393, "clip_ratio/low_min": 1.4007171557750553e-05, "clip_ratio/region_mean": 0.001455904079193715, "epoch": 0.07242648560045266, "grad_norm": 0.12511181831359863, "learning_rate": 2e-07, "loss": 0.021, "step": 776 }, { "clip_ratio/high_max": 0.0018188524009019602, "clip_ratio/high_mean": 0.0008142310689436272, "clip_ratio/low_mean": 0.0005512810839718441, "clip_ratio/low_min": 1.0113268217537552e-05, "clip_ratio/region_mean": 0.001365512205666164, "epoch": 0.07251981870045325, "grad_norm": 0.11056258529424667, "learning_rate": 2e-07, "loss": 0.0437, "step": 777 }, { "clip_ratio/high_max": 0.0021318527724361047, "clip_ratio/high_mean": 0.0008097993140836479, "clip_ratio/low_mean": 0.0006199879680934828, "clip_ratio/low_min": 5.177959792490583e-05, "clip_ratio/region_mean": 0.0014297872621682473, "epoch": 0.07261315180045383, "grad_norm": 0.11419839411973953, "learning_rate": 2e-07, "loss": 0.0521, "step": 778 }, { "clip_ratio/high_max": 0.0019724474623217247, "clip_ratio/high_mean": 0.0008278065306512872, "clip_ratio/low_mean": 0.0006515258610306773, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0014793324153288268, "epoch": 0.07270648490045442, "grad_norm": 0.11579925566911697, "learning_rate": 2e-07, "loss": 0.0179, "step": 779 }, { "clip_ratio/high_max": 0.002167513212043559, "clip_ratio/high_mean": 0.0009479320378886769, "clip_ratio/low_mean": 0.0005952054016233888, "clip_ratio/low_min": 2.898516822824604e-05, "clip_ratio/region_mean": 0.0015431373976753093, "epoch": 0.072799818000455, "grad_norm": 0.11341644823551178, "learning_rate": 2e-07, "loss": -0.0066, "step": 780 }, { "clip_ratio/high_max": 0.0018813005826814333, "clip_ratio/high_mean": 0.0008299990831801551, "clip_ratio/low_mean": 0.0005868619109605788, "clip_ratio/low_min": 5.1651465582835954e-05, "clip_ratio/region_mean": 0.0014168610177875962, "epoch": 0.07289315110045558, "grad_norm": 0.12438472360372543, "learning_rate": 2e-07, "loss": -0.0034, "step": 781 }, { "clip_ratio/high_max": 0.0022534427771461196, "clip_ratio/high_mean": 0.0009194329359161202, "clip_ratio/low_mean": 0.0005607950879493728, "clip_ratio/low_min": 7.73652245698031e-05, "clip_ratio/region_mean": 0.001480228042055387, "epoch": 0.07298648420045617, "grad_norm": 0.13085101544857025, "learning_rate": 2e-07, "loss": -0.0005, "step": 782 }, { "clip_ratio/high_max": 0.002416175771941198, "clip_ratio/high_mean": 0.0009033886726683704, "clip_ratio/low_mean": 0.0006422624505830754, "clip_ratio/low_min": 3.308700343040982e-05, "clip_ratio/region_mean": 0.0015456511500815395, "epoch": 0.07307981730045675, "grad_norm": 0.11092827469110489, "learning_rate": 2e-07, "loss": -0.0195, "step": 783 }, { "clip_ratio/high_max": 0.0019378230317670386, "clip_ratio/high_mean": 0.0007436561918439111, "clip_ratio/low_mean": 0.0007039391311991494, "clip_ratio/low_min": 5.7071463743341155e-05, "clip_ratio/region_mean": 0.0014475953394139651, "epoch": 0.07317315040045733, "grad_norm": 0.11660467833280563, "learning_rate": 2e-07, "loss": 0.078, "step": 784 }, { "clip_ratio/high_max": 0.001909873892145697, "clip_ratio/high_mean": 0.0007331809756578878, "clip_ratio/low_mean": 0.0006277019856497645, "clip_ratio/low_min": 5.49912601854885e-05, "clip_ratio/region_mean": 0.00136088296858361, "epoch": 0.07326648350045792, "grad_norm": 0.11439983546733856, "learning_rate": 2e-07, "loss": 0.0829, "step": 785 }, { "clip_ratio/high_max": 0.001834483460697811, "clip_ratio/high_mean": 0.0007999898625712376, "clip_ratio/low_mean": 0.0006353595617838437, "clip_ratio/low_min": 4.1536803109920584e-05, "clip_ratio/region_mean": 0.001435349440725986, "epoch": 0.0733598166004585, "grad_norm": 0.1136215403676033, "learning_rate": 2e-07, "loss": 0.0308, "step": 786 }, { "clip_ratio/high_max": 0.0019801714370260015, "clip_ratio/high_mean": 0.000763623293096316, "clip_ratio/low_mean": 0.0007482195906050038, "clip_ratio/low_min": 8.509602548656403e-05, "clip_ratio/region_mean": 0.0015118428855203092, "epoch": 0.07345314970045909, "grad_norm": 0.11211632937192917, "learning_rate": 2e-07, "loss": 0.0734, "step": 787 }, { "clip_ratio/high_max": 0.002130993496393785, "clip_ratio/high_mean": 0.0008854681545926724, "clip_ratio/low_mean": 0.0007022492027317639, "clip_ratio/low_min": 7.136206841096282e-05, "clip_ratio/region_mean": 0.0015877173718763515, "epoch": 0.07354648280045967, "grad_norm": 0.11957481503486633, "learning_rate": 2e-07, "loss": -0.0081, "step": 788 }, { "clip_ratio/high_max": 0.0018580957184894942, "clip_ratio/high_mean": 0.0007327506664296379, "clip_ratio/low_mean": 0.0006446797251555836, "clip_ratio/low_min": 9.072100056073396e-05, "clip_ratio/region_mean": 0.0013774303770333063, "epoch": 0.07363981590046025, "grad_norm": 0.1123182401061058, "learning_rate": 2e-07, "loss": 0.0527, "step": 789 }, { "clip_ratio/high_max": 0.0022652892730548047, "clip_ratio/high_mean": 0.0009085375950235175, "clip_ratio/low_mean": 0.0007382839157799026, "clip_ratio/low_min": 8.794690893410007e-05, "clip_ratio/region_mean": 0.0016468214998894837, "epoch": 0.07373314900046084, "grad_norm": 0.11017676442861557, "learning_rate": 2e-07, "loss": 0.0415, "step": 790 }, { "clip_ratio/high_max": 0.002239024717709981, "clip_ratio/high_mean": 0.0009216399430442834, "clip_ratio/low_mean": 0.0006979401205171598, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0016195800344576128, "epoch": 0.07382648210046142, "grad_norm": 0.1129654049873352, "learning_rate": 2e-07, "loss": -0.0032, "step": 791 }, { "clip_ratio/high_max": 0.0018680905141081894, "clip_ratio/high_mean": 0.0007654549494873208, "clip_ratio/low_mean": 0.0007547381228505401, "clip_ratio/low_min": 0.00010563037812971743, "clip_ratio/region_mean": 0.0015201930345938308, "epoch": 0.073919815200462, "grad_norm": 0.11200012266635895, "learning_rate": 2e-07, "loss": 0.0793, "step": 792 }, { "clip_ratio/high_max": 0.0020571316526911687, "clip_ratio/high_mean": 0.0008623508711025352, "clip_ratio/low_mean": 0.000799039315097616, "clip_ratio/low_min": 5.026038979849545e-05, "clip_ratio/region_mean": 0.0016613901680102572, "epoch": 0.07401314830046259, "grad_norm": 0.12031158059835434, "learning_rate": 2e-07, "loss": 0.0293, "step": 793 }, { "clip_ratio/high_max": 0.0023140867670008447, "clip_ratio/high_mean": 0.0009250216853615711, "clip_ratio/low_mean": 0.0008091779773167218, "clip_ratio/low_min": 0.00010961086445604451, "clip_ratio/region_mean": 0.0017341996572213247, "epoch": 0.07410648140046316, "grad_norm": 0.11367065459489822, "learning_rate": 2e-07, "loss": 0.0074, "step": 794 }, { "clip_ratio/high_max": 0.0022362971649272367, "clip_ratio/high_mean": 0.0008638054296170594, "clip_ratio/low_mean": 0.0007498363665945362, "clip_ratio/low_min": 7.719989298493601e-05, "clip_ratio/region_mean": 0.0016136418125825003, "epoch": 0.07419981450046374, "grad_norm": 0.12453027069568634, "learning_rate": 2e-07, "loss": 0.0494, "step": 795 }, { "clip_ratio/high_max": 0.0018696574952627998, "clip_ratio/high_mean": 0.0007434031040247646, "clip_ratio/low_mean": 0.0008674162327224622, "clip_ratio/low_min": 3.7690821045544e-05, "clip_ratio/region_mean": 0.001610819366760552, "epoch": 0.07429314760046433, "grad_norm": 0.1564548909664154, "learning_rate": 2e-07, "loss": 0.0514, "step": 796 }, { "clip_ratio/high_max": 0.002054108594165882, "clip_ratio/high_mean": 0.0008844041203701636, "clip_ratio/low_mean": 0.0006944568785911542, "clip_ratio/low_min": 4.297071609471459e-05, "clip_ratio/region_mean": 0.0015788609998708125, "epoch": 0.07438648070046491, "grad_norm": 0.10839328914880753, "learning_rate": 2e-07, "loss": 0.0174, "step": 797 }, { "clip_ratio/high_max": 0.001910743914777413, "clip_ratio/high_mean": 0.0008881840512913186, "clip_ratio/low_mean": 0.000726361565739353, "clip_ratio/low_min": 8.571409307478461e-05, "clip_ratio/region_mean": 0.0016145456029335037, "epoch": 0.0744798138004655, "grad_norm": 0.11174105107784271, "learning_rate": 2e-07, "loss": 0.0051, "step": 798 }, { "clip_ratio/high_max": 0.0021640864724759012, "clip_ratio/high_mean": 0.0008132260845741257, "clip_ratio/low_mean": 0.000854491867357865, "clip_ratio/low_min": 3.266042904215283e-05, "clip_ratio/region_mean": 0.0016677179592079483, "epoch": 0.07457314690046608, "grad_norm": 0.12809504568576813, "learning_rate": 2e-07, "loss": 0.0563, "step": 799 }, { "clip_ratio/high_max": 0.001969370299775619, "clip_ratio/high_mean": 0.0008444750365015352, "clip_ratio/low_mean": 0.0007440772351401392, "clip_ratio/low_min": 5.975224485155195e-05, "clip_ratio/region_mean": 0.0015885522589087486, "epoch": 0.07466648000046666, "grad_norm": 0.11028800159692764, "learning_rate": 2e-07, "loss": 0.036, "step": 800 }, { "clip_ratio/high_max": 0.002031433967204066, "clip_ratio/high_mean": 0.0008159696226357482, "clip_ratio/low_mean": 0.0008281027221528348, "clip_ratio/low_min": 4.407746109791333e-05, "clip_ratio/region_mean": 0.0016440723229607102, "epoch": 0.07475981310046725, "grad_norm": 0.11633311212062836, "learning_rate": 2e-07, "loss": 0.0648, "step": 801 }, { "clip_ratio/high_max": 0.0019917547833756544, "clip_ratio/high_mean": 0.0008821331575745717, "clip_ratio/low_mean": 0.0008060858781391289, "clip_ratio/low_min": 5.2474158110271674e-05, "clip_ratio/region_mean": 0.0016882190029718913, "epoch": 0.07485314620046783, "grad_norm": 0.11978299915790558, "learning_rate": 2e-07, "loss": 0.0397, "step": 802 }, { "clip_ratio/high_max": 0.002210826482041739, "clip_ratio/high_mean": 0.0008793110673650517, "clip_ratio/low_mean": 0.0008752111971261911, "clip_ratio/low_min": 3.7206449633231387e-05, "clip_ratio/region_mean": 0.0017545222435728647, "epoch": 0.07494647930046841, "grad_norm": 0.12210392951965332, "learning_rate": 2e-07, "loss": 0.0455, "step": 803 }, { "clip_ratio/high_max": 0.0022734067533747293, "clip_ratio/high_mean": 0.0008890612298273481, "clip_ratio/low_mean": 0.000864874069520738, "clip_ratio/low_min": 5.874089674762217e-05, "clip_ratio/region_mean": 0.0017539352847961709, "epoch": 0.075039812400469, "grad_norm": 0.1219240128993988, "learning_rate": 2e-07, "loss": -0.0051, "step": 804 }, { "clip_ratio/high_max": 0.002201729585067369, "clip_ratio/high_mean": 0.0007600494409416569, "clip_ratio/low_mean": 0.0009157030181086157, "clip_ratio/low_min": 9.428187649973552e-05, "clip_ratio/region_mean": 0.0016757524354034103, "epoch": 0.07513314550046958, "grad_norm": 0.11391404271125793, "learning_rate": 2e-07, "loss": 0.0514, "step": 805 }, { "clip_ratio/high_max": 0.0020251438472769223, "clip_ratio/high_mean": 0.0009449685567233246, "clip_ratio/low_mean": 0.0009324367620138219, "clip_ratio/low_min": 9.895572475215886e-05, "clip_ratio/region_mean": 0.0018774053387460299, "epoch": 0.07522647860047016, "grad_norm": 0.12327658385038376, "learning_rate": 2e-07, "loss": 0.0214, "step": 806 }, { "clip_ratio/high_max": 0.0019707472893060185, "clip_ratio/high_mean": 0.000925991240364965, "clip_ratio/low_mean": 0.0008850759259075858, "clip_ratio/low_min": 5.538283494388452e-05, "clip_ratio/region_mean": 0.001811067144444678, "epoch": 0.07531981170047075, "grad_norm": 0.11590573191642761, "learning_rate": 2e-07, "loss": -0.0184, "step": 807 }, { "clip_ratio/high_max": 0.0020089485369680915, "clip_ratio/high_mean": 0.000834725553431781, "clip_ratio/low_mean": 0.0009222548324032687, "clip_ratio/low_min": 0.0001571323728057905, "clip_ratio/region_mean": 0.0017569803821970709, "epoch": 0.07541314480047133, "grad_norm": 0.11885417252779007, "learning_rate": 2e-07, "loss": 0.0568, "step": 808 }, { "clip_ratio/high_max": 0.00207575828244444, "clip_ratio/high_mean": 0.0008897327006707201, "clip_ratio/low_mean": 0.0008757144987612264, "clip_ratio/low_min": 0.00011913617163372692, "clip_ratio/region_mean": 0.00176544718851801, "epoch": 0.07550647790047192, "grad_norm": 0.11395089328289032, "learning_rate": 2e-07, "loss": 0.0257, "step": 809 }, { "clip_ratio/high_max": 0.0022518398400279693, "clip_ratio/high_mean": 0.0009516576974419877, "clip_ratio/low_mean": 0.0009147005112026818, "clip_ratio/low_min": 6.148095235403161e-05, "clip_ratio/region_mean": 0.0018663581649889238, "epoch": 0.0755998110004725, "grad_norm": 0.121428482234478, "learning_rate": 2e-07, "loss": 0.0252, "step": 810 }, { "clip_ratio/high_max": 0.0020481559695326723, "clip_ratio/high_mean": 0.0008491357766615693, "clip_ratio/low_mean": 0.0009198384541377891, "clip_ratio/low_min": 7.827800982340705e-05, "clip_ratio/region_mean": 0.0017689742162474431, "epoch": 0.07569314410047308, "grad_norm": 0.1197175458073616, "learning_rate": 2e-07, "loss": 0.0198, "step": 811 }, { "clip_ratio/high_max": 0.0018028829035756644, "clip_ratio/high_mean": 0.0008212973898480413, "clip_ratio/low_mean": 0.0008151634901878424, "clip_ratio/low_min": 8.263806057584588e-05, "clip_ratio/region_mean": 0.0016364609109587036, "epoch": 0.07578647720047367, "grad_norm": 0.12057220935821533, "learning_rate": 2e-07, "loss": 0.0281, "step": 812 }, { "clip_ratio/high_max": 0.0018012533510045614, "clip_ratio/high_mean": 0.0006724153563482105, "clip_ratio/low_mean": 0.0009348849889647681, "clip_ratio/low_min": 8.79561084730085e-05, "clip_ratio/region_mean": 0.001607300353498431, "epoch": 0.07587981030047425, "grad_norm": 0.10819491744041443, "learning_rate": 2e-07, "loss": 0.0351, "step": 813 }, { "clip_ratio/high_max": 0.0019885458423232194, "clip_ratio/high_mean": 0.0008939470153563889, "clip_ratio/low_mean": 0.0007221258601930458, "clip_ratio/low_min": 6.840105379524175e-05, "clip_ratio/region_mean": 0.0016160728919203393, "epoch": 0.07597314340047483, "grad_norm": 0.11247130483388901, "learning_rate": 2e-07, "loss": 0.0128, "step": 814 }, { "clip_ratio/high_max": 0.0023813931038603187, "clip_ratio/high_mean": 0.0008267920384241734, "clip_ratio/low_mean": 0.0009095919558603782, "clip_ratio/low_min": 0.00013230991953605553, "clip_ratio/region_mean": 0.001736383987008594, "epoch": 0.07606647650047542, "grad_norm": 0.12277612835168839, "learning_rate": 2e-07, "loss": 0.058, "step": 815 }, { "clip_ratio/high_max": 0.0018914303291239776, "clip_ratio/high_mean": 0.0008524496588506736, "clip_ratio/low_mean": 0.0009592161623004358, "clip_ratio/low_min": 9.309589222539216e-05, "clip_ratio/region_mean": 0.001811665846616961, "epoch": 0.076159809600476, "grad_norm": 0.12231984734535217, "learning_rate": 2e-07, "loss": 0.0611, "step": 816 }, { "clip_ratio/high_max": 0.001822645357606234, "clip_ratio/high_mean": 0.0008658065416966565, "clip_ratio/low_mean": 0.0008335979291587137, "clip_ratio/low_min": 7.880553948780289e-05, "clip_ratio/region_mean": 0.0016994044963212218, "epoch": 0.07625314270047658, "grad_norm": 0.11026028543710709, "learning_rate": 2e-07, "loss": 0.0138, "step": 817 }, { "clip_ratio/high_max": 0.0021347676920413505, "clip_ratio/high_mean": 0.0009027673622767907, "clip_ratio/low_mean": 0.000806166986876633, "clip_ratio/low_min": 7.982353326951852e-05, "clip_ratio/region_mean": 0.0017089343455154449, "epoch": 0.07634647580047717, "grad_norm": 0.11254287511110306, "learning_rate": 2e-07, "loss": 0.0143, "step": 818 }, { "clip_ratio/high_max": 0.002188172897149343, "clip_ratio/high_mean": 0.0009822262381931068, "clip_ratio/low_mean": 0.0008530010854883585, "clip_ratio/low_min": 6.820563521614531e-05, "clip_ratio/region_mean": 0.0018352273109485395, "epoch": 0.07643980890047775, "grad_norm": 0.10810264945030212, "learning_rate": 2e-07, "loss": 0.0084, "step": 819 }, { "clip_ratio/high_max": 0.00202627872931771, "clip_ratio/high_mean": 0.0008325006219820352, "clip_ratio/low_mean": 0.0007411972528643673, "clip_ratio/low_min": 7.503960387111874e-05, "clip_ratio/region_mean": 0.001573697827552678, "epoch": 0.07653314200047834, "grad_norm": 0.10369493812322617, "learning_rate": 2e-07, "loss": 0.0134, "step": 820 }, { "clip_ratio/high_max": 0.0019521393769537099, "clip_ratio/high_mean": 0.0007577197466162033, "clip_ratio/low_mean": 0.0010085839167004451, "clip_ratio/low_min": 8.91615318323602e-05, "clip_ratio/region_mean": 0.001766303652402712, "epoch": 0.07662647510047892, "grad_norm": 0.11065830290317535, "learning_rate": 2e-07, "loss": 0.0492, "step": 821 }, { "clip_ratio/high_max": 0.002060710405203281, "clip_ratio/high_mean": 0.0008459494274575263, "clip_ratio/low_mean": 0.0008618019874120364, "clip_ratio/low_min": 0.00010607540343698929, "clip_ratio/region_mean": 0.0017077514276024885, "epoch": 0.0767198082004795, "grad_norm": 0.11574377864599228, "learning_rate": 2e-07, "loss": 0.0424, "step": 822 }, { "clip_ratio/high_max": 0.0018048021956929006, "clip_ratio/high_mean": 0.0007672194988117553, "clip_ratio/low_mean": 0.0008789924177108333, "clip_ratio/low_min": 5.627569680655142e-05, "clip_ratio/region_mean": 0.0016462118946947157, "epoch": 0.07681314130048009, "grad_norm": 0.1251182109117508, "learning_rate": 2e-07, "loss": 0.0496, "step": 823 }, { "clip_ratio/high_max": 0.002250038225611206, "clip_ratio/high_mean": 0.0009154693325399421, "clip_ratio/low_mean": 0.0007858142689656233, "clip_ratio/low_min": 3.786786510318052e-05, "clip_ratio/region_mean": 0.00170128361787647, "epoch": 0.07690647440048066, "grad_norm": 0.11992879956960678, "learning_rate": 2e-07, "loss": -0.0067, "step": 824 }, { "clip_ratio/high_max": 0.0021376510740083177, "clip_ratio/high_mean": 0.0008447336404060479, "clip_ratio/low_mean": 0.0009001328417070908, "clip_ratio/low_min": 0.00010302131568096229, "clip_ratio/region_mean": 0.001744866451190319, "epoch": 0.07699980750048124, "grad_norm": 0.12252639979124069, "learning_rate": 2e-07, "loss": 0.0179, "step": 825 }, { "clip_ratio/high_max": 0.0022197407379280776, "clip_ratio/high_mean": 0.0009219504536304157, "clip_ratio/low_mean": 0.0008650454656162765, "clip_ratio/low_min": 8.402550520258956e-05, "clip_ratio/region_mean": 0.0017869958974188194, "epoch": 0.07709314060048184, "grad_norm": 0.11647389084100723, "learning_rate": 2e-07, "loss": 0.0055, "step": 826 }, { "clip_ratio/high_max": 0.001958800246939063, "clip_ratio/high_mean": 0.0008809373266558396, "clip_ratio/low_mean": 0.0009099125927605201, "clip_ratio/low_min": 0.00010302225882696803, "clip_ratio/region_mean": 0.0017908498775796033, "epoch": 0.07718647370048241, "grad_norm": 0.11774373054504395, "learning_rate": 2e-07, "loss": 0.027, "step": 827 }, { "clip_ratio/high_max": 0.0024077695852611214, "clip_ratio/high_mean": 0.0009791178945306456, "clip_ratio/low_mean": 0.0007297373012988828, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.001708855212200433, "epoch": 0.07727980680048299, "grad_norm": 0.11540964245796204, "learning_rate": 2e-07, "loss": -0.0186, "step": 828 }, { "clip_ratio/high_max": 0.0019382004829822108, "clip_ratio/high_mean": 0.0008374913413717877, "clip_ratio/low_mean": 0.0008181532957678428, "clip_ratio/low_min": 9.262867206416558e-05, "clip_ratio/region_mean": 0.0016556446644244716, "epoch": 0.07737313990048358, "grad_norm": 0.11175844818353653, "learning_rate": 2e-07, "loss": -0.015, "step": 829 }, { "clip_ratio/high_max": 0.0017290142459387425, "clip_ratio/high_mean": 0.0007726519670541165, "clip_ratio/low_mean": 0.0008547711076971609, "clip_ratio/low_min": 0.00012042331582051702, "clip_ratio/region_mean": 0.0016274230511044152, "epoch": 0.07746647300048416, "grad_norm": 0.11575040221214294, "learning_rate": 2e-07, "loss": 0.0288, "step": 830 }, { "clip_ratio/high_max": 0.0022843038532300852, "clip_ratio/high_mean": 0.0008940826519392431, "clip_ratio/low_mean": 0.0006594453298021108, "clip_ratio/low_min": 2.7699252314050682e-05, "clip_ratio/region_mean": 0.0015535279817413539, "epoch": 0.07755980610048475, "grad_norm": 0.10554547607898712, "learning_rate": 2e-07, "loss": 0.0083, "step": 831 }, { "clip_ratio/high_max": 0.0020738437233376317, "clip_ratio/high_mean": 0.000906540781215881, "clip_ratio/low_mean": 0.0008279761605081148, "clip_ratio/low_min": 4.9889058573171496e-05, "clip_ratio/region_mean": 0.0017345169399050064, "epoch": 0.07765313920048533, "grad_norm": 0.11285263299942017, "learning_rate": 2e-07, "loss": 0.0474, "step": 832 }, { "clip_ratio/high_max": 0.0018290228290425148, "clip_ratio/high_mean": 0.0008261084731202573, "clip_ratio/low_mean": 0.0008738580690987874, "clip_ratio/low_min": 3.444614321779227e-05, "clip_ratio/region_mean": 0.0016999665313051082, "epoch": 0.07774647230048591, "grad_norm": 0.11581651121377945, "learning_rate": 2e-07, "loss": 0.0412, "step": 833 }, { "clip_ratio/high_max": 0.001994646205275785, "clip_ratio/high_mean": 0.0008670792485645507, "clip_ratio/low_mean": 0.0007960418115544599, "clip_ratio/low_min": 6.800799292250304e-05, "clip_ratio/region_mean": 0.00166312103101518, "epoch": 0.0778398054004865, "grad_norm": 0.1084277406334877, "learning_rate": 2e-07, "loss": 0.0039, "step": 834 }, { "clip_ratio/high_max": 0.0018941663329314906, "clip_ratio/high_mean": 0.0008794665009190794, "clip_ratio/low_mean": 0.0009355217716802144, "clip_ratio/low_min": 0.00015284758592315484, "clip_ratio/region_mean": 0.0018149882889701985, "epoch": 0.07793313850048708, "grad_norm": 0.10668100416660309, "learning_rate": 2e-07, "loss": 0.0344, "step": 835 }, { "clip_ratio/high_max": 0.0018539468037488405, "clip_ratio/high_mean": 0.0007754559883323964, "clip_ratio/low_mean": 0.0008293645114463288, "clip_ratio/low_min": 5.7782831390795764e-05, "clip_ratio/region_mean": 0.0016048204925027676, "epoch": 0.07802647160048766, "grad_norm": 0.11463084071874619, "learning_rate": 2e-07, "loss": 0.0257, "step": 836 }, { "clip_ratio/high_max": 0.001998334118979983, "clip_ratio/high_mean": 0.000766747663874412, "clip_ratio/low_mean": 0.0008621477136330213, "clip_ratio/low_min": 3.490594053801033e-05, "clip_ratio/region_mean": 0.0016288954066112638, "epoch": 0.07811980470048825, "grad_norm": 0.11016237735748291, "learning_rate": 2e-07, "loss": 0.0697, "step": 837 }, { "clip_ratio/high_max": 0.0016024340548028704, "clip_ratio/high_mean": 0.0007589341657876503, "clip_ratio/low_mean": 0.0008838661196932662, "clip_ratio/low_min": 3.351427267261897e-05, "clip_ratio/region_mean": 0.0016428002782049589, "epoch": 0.07821313780048883, "grad_norm": 0.1140173077583313, "learning_rate": 2e-07, "loss": 0.0289, "step": 838 }, { "clip_ratio/high_max": 0.0020428650532267056, "clip_ratio/high_mean": 0.0007943295404402306, "clip_ratio/low_mean": 0.0010124424243258545, "clip_ratio/low_min": 0.0002021675190917449, "clip_ratio/region_mean": 0.0018067719356622547, "epoch": 0.07830647090048942, "grad_norm": 0.11717087775468826, "learning_rate": 2e-07, "loss": 0.0387, "step": 839 }, { "clip_ratio/high_max": 0.002202466297603678, "clip_ratio/high_mean": 0.0008675922817928949, "clip_ratio/low_mean": 0.000806574200396426, "clip_ratio/low_min": 0.00010892111640714575, "clip_ratio/region_mean": 0.0016741664367145859, "epoch": 0.07839980400049, "grad_norm": 0.11594445258378983, "learning_rate": 2e-07, "loss": 0.013, "step": 840 }, { "clip_ratio/high_max": 0.0020431987213669345, "clip_ratio/high_mean": 0.0009041275243362179, "clip_ratio/low_mean": 0.0008589667449996341, "clip_ratio/low_min": 5.366946879803436e-05, "clip_ratio/region_mean": 0.0017630942675168626, "epoch": 0.07849313710049058, "grad_norm": 0.12500528991222382, "learning_rate": 2e-07, "loss": 0.0382, "step": 841 }, { "clip_ratio/high_max": 0.002097187261824729, "clip_ratio/high_mean": 0.0008882522215571953, "clip_ratio/low_mean": 0.000821704818008584, "clip_ratio/low_min": 7.116395045159152e-05, "clip_ratio/region_mean": 0.0017099570395657793, "epoch": 0.07858647020049117, "grad_norm": 0.1250203251838684, "learning_rate": 2e-07, "loss": 0.0173, "step": 842 }, { "clip_ratio/high_max": 0.0020374701962282415, "clip_ratio/high_mean": 0.0008369560800929321, "clip_ratio/low_mean": 0.0009016376352519728, "clip_ratio/low_min": 0.00015083842845342588, "clip_ratio/region_mean": 0.001738593724439852, "epoch": 0.07867980330049175, "grad_norm": 0.11403858661651611, "learning_rate": 2e-07, "loss": 0.0298, "step": 843 }, { "clip_ratio/high_max": 0.0019630739916465245, "clip_ratio/high_mean": 0.0008085092795226956, "clip_ratio/low_mean": 0.00093123019541963, "clip_ratio/low_min": 4.6451079469989054e-05, "clip_ratio/region_mean": 0.001739739476761315, "epoch": 0.07877313640049233, "grad_norm": 0.11661913990974426, "learning_rate": 2e-07, "loss": 0.0416, "step": 844 }, { "clip_ratio/high_max": 0.0019510698257363401, "clip_ratio/high_mean": 0.000811376210549497, "clip_ratio/low_mean": 0.0007822837887943024, "clip_ratio/low_min": 7.463270867447136e-05, "clip_ratio/region_mean": 0.0015936599666019902, "epoch": 0.07886646950049292, "grad_norm": 0.11432009190320969, "learning_rate": 2e-07, "loss": 0.0293, "step": 845 }, { "clip_ratio/high_max": 0.001964373637747485, "clip_ratio/high_mean": 0.0008648544953757664, "clip_ratio/low_mean": 0.0009044642101798672, "clip_ratio/low_min": 3.922053201677045e-05, "clip_ratio/region_mean": 0.0017693186600808986, "epoch": 0.0789598026004935, "grad_norm": 0.11986778676509857, "learning_rate": 2e-07, "loss": 0.0402, "step": 846 }, { "clip_ratio/high_max": 0.002131155641109217, "clip_ratio/high_mean": 0.0008118690730043454, "clip_ratio/low_mean": 0.000716558997737593, "clip_ratio/low_min": 5.617265105684055e-05, "clip_ratio/region_mean": 0.0015284280816558748, "epoch": 0.07905313570049408, "grad_norm": 0.10968732833862305, "learning_rate": 2e-07, "loss": -0.0186, "step": 847 }, { "clip_ratio/high_max": 0.002097861379297683, "clip_ratio/high_mean": 0.0008518869299223297, "clip_ratio/low_mean": 0.0009144793220912106, "clip_ratio/low_min": 5.3859293075220194e-05, "clip_ratio/region_mean": 0.0017663662110862788, "epoch": 0.07914646880049467, "grad_norm": 0.11068090051412582, "learning_rate": 2e-07, "loss": 0.0292, "step": 848 }, { "clip_ratio/high_max": 0.0018163008462579455, "clip_ratio/high_mean": 0.0008417613880737917, "clip_ratio/low_mean": 0.0008767534891376272, "clip_ratio/low_min": 4.1145489376503974e-05, "clip_ratio/region_mean": 0.0017185148753924295, "epoch": 0.07923980190049525, "grad_norm": 0.11685491353273392, "learning_rate": 2e-07, "loss": 0.0352, "step": 849 }, { "clip_ratio/high_max": 0.0019360077494638972, "clip_ratio/high_mean": 0.0007704757517785765, "clip_ratio/low_mean": 0.0008984834712464362, "clip_ratio/low_min": 8.914970021578483e-05, "clip_ratio/region_mean": 0.001668959179369267, "epoch": 0.07933313500049584, "grad_norm": 0.1745588183403015, "learning_rate": 2e-07, "loss": 0.0574, "step": 850 }, { "clip_ratio/high_max": 0.0021599106876237784, "clip_ratio/high_mean": 0.0008832753273964045, "clip_ratio/low_mean": 0.0008645042307762196, "clip_ratio/low_min": 2.242882601422025e-05, "clip_ratio/region_mean": 0.001747779519064352, "epoch": 0.07942646810049642, "grad_norm": 0.11549002677202225, "learning_rate": 2e-07, "loss": 0.0058, "step": 851 }, { "clip_ratio/high_max": 0.001960432688065339, "clip_ratio/high_mean": 0.0008217911272367928, "clip_ratio/low_mean": 0.0009330485845566727, "clip_ratio/low_min": 5.3144354751566425e-05, "clip_ratio/region_mean": 0.001754839664499741, "epoch": 0.079519801200497, "grad_norm": 0.10849033296108246, "learning_rate": 2e-07, "loss": 0.0418, "step": 852 }, { "clip_ratio/high_max": 0.0020198188358335756, "clip_ratio/high_mean": 0.0008318453137690085, "clip_ratio/low_mean": 0.0008052710309129907, "clip_ratio/low_min": 7.065302997943945e-05, "clip_ratio/region_mean": 0.0016371163401345257, "epoch": 0.07961313430049759, "grad_norm": 0.13017603754997253, "learning_rate": 2e-07, "loss": 0.0212, "step": 853 }, { "clip_ratio/high_max": 0.0018999883577635046, "clip_ratio/high_mean": 0.0008207933733501704, "clip_ratio/low_mean": 0.0009260458300559549, "clip_ratio/low_min": 0.00015258730127243325, "clip_ratio/region_mean": 0.0017468392543378286, "epoch": 0.07970646740049817, "grad_norm": 0.11225332319736481, "learning_rate": 2e-07, "loss": 0.0447, "step": 854 }, { "clip_ratio/high_max": 0.002196789049776271, "clip_ratio/high_mean": 0.0009522681411908707, "clip_ratio/low_mean": 0.0008119098874885822, "clip_ratio/low_min": 8.707637607585639e-05, "clip_ratio/region_mean": 0.0017641780359554105, "epoch": 0.07979980050049874, "grad_norm": 0.13699984550476074, "learning_rate": 2e-07, "loss": 0.0152, "step": 855 }, { "clip_ratio/high_max": 0.002096785457979422, "clip_ratio/high_mean": 0.0008688605194038246, "clip_ratio/low_mean": 0.0008006164025573526, "clip_ratio/low_min": 0.00013634201422974002, "clip_ratio/region_mean": 0.0016694769292371348, "epoch": 0.07989313360049934, "grad_norm": 0.11947979032993317, "learning_rate": 2e-07, "loss": 0.0101, "step": 856 }, { "clip_ratio/high_max": 0.0022515038690471556, "clip_ratio/high_mean": 0.0008531360435881652, "clip_ratio/low_mean": 0.0007404095231322572, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0015935455667204224, "epoch": 0.07998646670049991, "grad_norm": 0.1121777594089508, "learning_rate": 2e-07, "loss": 0.0213, "step": 857 }, { "clip_ratio/high_max": 0.0020023567449243274, "clip_ratio/high_mean": 0.000855905807839008, "clip_ratio/low_mean": 0.0007608406740473583, "clip_ratio/low_min": 1.7217922504642047e-05, "clip_ratio/region_mean": 0.001616746507352218, "epoch": 0.08007979980050049, "grad_norm": 0.10610252618789673, "learning_rate": 2e-07, "loss": 0.0231, "step": 858 }, { "clip_ratio/high_max": 0.0021039444545749575, "clip_ratio/high_mean": 0.0008074646630120696, "clip_ratio/low_mean": 0.0009658961025706958, "clip_ratio/low_min": 9.328449141321471e-05, "clip_ratio/region_mean": 0.0017733607528498396, "epoch": 0.08017313290050108, "grad_norm": 0.12367263436317444, "learning_rate": 2e-07, "loss": 0.0166, "step": 859 }, { "clip_ratio/high_max": 0.0020069144884473644, "clip_ratio/high_mean": 0.0007846043299650773, "clip_ratio/low_mean": 0.0008355021363968262, "clip_ratio/low_min": 7.897800787759479e-05, "clip_ratio/region_mean": 0.0016201064645429142, "epoch": 0.08026646600050166, "grad_norm": 0.11115848273038864, "learning_rate": 2e-07, "loss": 0.011, "step": 860 }, { "clip_ratio/high_max": 0.0019340567341714632, "clip_ratio/high_mean": 0.0008245551980508026, "clip_ratio/low_mean": 0.0009977112385968212, "clip_ratio/low_min": 0.00015124695346457884, "clip_ratio/region_mean": 0.001822266451199539, "epoch": 0.08035979910050225, "grad_norm": 0.12156204879283905, "learning_rate": 2e-07, "loss": 0.0433, "step": 861 }, { "clip_ratio/high_max": 0.0022457092272816226, "clip_ratio/high_mean": 0.0009067931277968455, "clip_ratio/low_mean": 0.0009122645133174956, "clip_ratio/low_min": 4.0038154111243784e-05, "clip_ratio/region_mean": 0.001819057604734553, "epoch": 0.08045313220050283, "grad_norm": 0.1250375360250473, "learning_rate": 2e-07, "loss": 0.016, "step": 862 }, { "clip_ratio/high_max": 0.002131820496288128, "clip_ratio/high_mean": 0.0009264678046747576, "clip_ratio/low_mean": 0.0009567226443323307, "clip_ratio/low_min": 0.0001037610763887642, "clip_ratio/region_mean": 0.0018831904526450671, "epoch": 0.08054646530050341, "grad_norm": 0.11784426867961884, "learning_rate": 2e-07, "loss": 0.0038, "step": 863 }, { "clip_ratio/high_max": 0.0020498053927440196, "clip_ratio/high_mean": 0.0008363905781152425, "clip_ratio/low_mean": 0.0009697305176814552, "clip_ratio/low_min": 0.00011386315327399643, "clip_ratio/region_mean": 0.0018061211303574964, "epoch": 0.080639798400504, "grad_norm": 0.12424205243587494, "learning_rate": 2e-07, "loss": 0.0432, "step": 864 }, { "clip_ratio/high_max": 0.0019944470113841817, "clip_ratio/high_mean": 0.0008256175060523674, "clip_ratio/low_mean": 0.0009339187381556258, "clip_ratio/low_min": 6.113740619184682e-05, "clip_ratio/region_mean": 0.0017595362514839508, "epoch": 0.08073313150050458, "grad_norm": 0.11761760711669922, "learning_rate": 2e-07, "loss": 0.0467, "step": 865 }, { "clip_ratio/high_max": 0.0017818830056057777, "clip_ratio/high_mean": 0.0008638606632302981, "clip_ratio/low_mean": 0.0008776586255407892, "clip_ratio/low_min": 4.779991195391631e-05, "clip_ratio/region_mean": 0.0017415192851331085, "epoch": 0.08082646460050516, "grad_norm": 0.10859088599681854, "learning_rate": 2e-07, "loss": 0.0356, "step": 866 }, { "clip_ratio/high_max": 0.0018029165221378207, "clip_ratio/high_mean": 0.0007920448661025148, "clip_ratio/low_mean": 0.0007731226833129767, "clip_ratio/low_min": 4.139177872275468e-05, "clip_ratio/region_mean": 0.0015651675494154915, "epoch": 0.08091979770050575, "grad_norm": 0.11384664475917816, "learning_rate": 2e-07, "loss": 0.0431, "step": 867 }, { "clip_ratio/high_max": 0.001969834767805878, "clip_ratio/high_mean": 0.0008501778556819772, "clip_ratio/low_mean": 0.0009673888271208853, "clip_ratio/low_min": 0.0001167666632682085, "clip_ratio/region_mean": 0.0018175666991737671, "epoch": 0.08101313080050633, "grad_norm": 0.12121117115020752, "learning_rate": 2e-07, "loss": 0.0533, "step": 868 }, { "clip_ratio/high_max": 0.0019424174715823028, "clip_ratio/high_mean": 0.0008343732697539963, "clip_ratio/low_mean": 0.0008565648404328385, "clip_ratio/low_min": 0.0001499726622569142, "clip_ratio/region_mean": 0.0016909381229197606, "epoch": 0.08110646390050691, "grad_norm": 0.1272365003824234, "learning_rate": 2e-07, "loss": 0.028, "step": 869 }, { "clip_ratio/high_max": 0.002419726450170856, "clip_ratio/high_mean": 0.0009976168148568831, "clip_ratio/low_mean": 0.0009186365114146611, "clip_ratio/low_min": 5.557616623264039e-05, "clip_ratio/region_mean": 0.0019162533135386184, "epoch": 0.0811997970005075, "grad_norm": 0.12106209248304367, "learning_rate": 2e-07, "loss": 0.0116, "step": 870 }, { "clip_ratio/high_max": 0.002204809985414613, "clip_ratio/high_mean": 0.0008635136546217836, "clip_ratio/low_mean": 0.0009179110329569085, "clip_ratio/low_min": 0.00010254782409901964, "clip_ratio/region_mean": 0.0017814247039495967, "epoch": 0.08129313010050808, "grad_norm": 0.11858925968408585, "learning_rate": 2e-07, "loss": 0.0153, "step": 871 }, { "clip_ratio/high_max": 0.0020446186063054483, "clip_ratio/high_mean": 0.000821780666228733, "clip_ratio/low_mean": 0.0008586461772210896, "clip_ratio/low_min": 8.591065125074238e-06, "clip_ratio/region_mean": 0.0016804268052510452, "epoch": 0.08138646320050867, "grad_norm": 0.10342464596033096, "learning_rate": 2e-07, "loss": 0.0275, "step": 872 }, { "clip_ratio/high_max": 0.0023051178359310143, "clip_ratio/high_mean": 0.0008783240355114685, "clip_ratio/low_mean": 0.0008666777357575484, "clip_ratio/low_min": 4.870078464591643e-05, "clip_ratio/region_mean": 0.0017450017840019427, "epoch": 0.08147979630050925, "grad_norm": 0.11449926346540451, "learning_rate": 2e-07, "loss": 0.0271, "step": 873 }, { "clip_ratio/high_max": 0.0021750144042016473, "clip_ratio/high_mean": 0.000939085375648574, "clip_ratio/low_mean": 0.0008441420905000996, "clip_ratio/low_min": 0.00010081344680656912, "clip_ratio/region_mean": 0.0017832274716056418, "epoch": 0.08157312940050983, "grad_norm": 0.10220494866371155, "learning_rate": 2e-07, "loss": 0.0235, "step": 874 }, { "clip_ratio/high_max": 0.0023619382409378886, "clip_ratio/high_mean": 0.0008909159987524617, "clip_ratio/low_mean": 0.0009391218336531892, "clip_ratio/low_min": 6.212108746694867e-05, "clip_ratio/region_mean": 0.0018300378069397993, "epoch": 0.08166646250051042, "grad_norm": 0.11200816184282303, "learning_rate": 2e-07, "loss": 0.0308, "step": 875 }, { "clip_ratio/high_max": 0.0023630687792319804, "clip_ratio/high_mean": 0.000964456330621033, "clip_ratio/low_mean": 0.0008920752643462038, "clip_ratio/low_min": 0.0001292768038183567, "clip_ratio/region_mean": 0.0018565316204330884, "epoch": 0.081759795600511, "grad_norm": 0.11393171548843384, "learning_rate": 2e-07, "loss": 0.0174, "step": 876 }, { "clip_ratio/high_max": 0.0022815628035459667, "clip_ratio/high_mean": 0.0009169753848254913, "clip_ratio/low_mean": 0.0009521250103716739, "clip_ratio/low_min": 0.0001140278072853107, "clip_ratio/region_mean": 0.0018691004297579639, "epoch": 0.08185312870051158, "grad_norm": 0.12352942675352097, "learning_rate": 2e-07, "loss": 0.0426, "step": 877 }, { "clip_ratio/high_max": 0.00209259594703326, "clip_ratio/high_mean": 0.0008454976978100603, "clip_ratio/low_mean": 0.0009140108368228539, "clip_ratio/low_min": 8.487772856824449e-05, "clip_ratio/region_mean": 0.0017595085228094831, "epoch": 0.08194646180051217, "grad_norm": 0.11961931735277176, "learning_rate": 2e-07, "loss": 0.0217, "step": 878 }, { "clip_ratio/high_max": 0.0020301751319493633, "clip_ratio/high_mean": 0.0009181723726214841, "clip_ratio/low_mean": 0.0008950343981268816, "clip_ratio/low_min": 0.00013385956663114484, "clip_ratio/region_mean": 0.0018132067998521961, "epoch": 0.08203979490051275, "grad_norm": 0.11827986687421799, "learning_rate": 2e-07, "loss": 0.015, "step": 879 }, { "clip_ratio/high_max": 0.002399175940809073, "clip_ratio/high_mean": 0.0008318445143231656, "clip_ratio/low_mean": 0.0009716146414575633, "clip_ratio/low_min": 8.073976823652629e-05, "clip_ratio/region_mean": 0.001803459133952856, "epoch": 0.08213312800051333, "grad_norm": 0.119765505194664, "learning_rate": 2e-07, "loss": 0.0442, "step": 880 }, { "clip_ratio/high_max": 0.002387790307693649, "clip_ratio/high_mean": 0.0009293005441577407, "clip_ratio/low_mean": 0.0008951399358920753, "clip_ratio/low_min": 0.00013323382427188335, "clip_ratio/region_mean": 0.0018244404345750809, "epoch": 0.08222646110051392, "grad_norm": 0.11568864434957504, "learning_rate": 2e-07, "loss": -0.0004, "step": 881 }, { "clip_ratio/high_max": 0.0022156382001412567, "clip_ratio/high_mean": 0.0009404894772160333, "clip_ratio/low_mean": 0.0008771842258283868, "clip_ratio/low_min": 5.5137741583166644e-05, "clip_ratio/region_mean": 0.0018176737285102718, "epoch": 0.0823197942005145, "grad_norm": 0.11203434318304062, "learning_rate": 2e-07, "loss": -0.0002, "step": 882 }, { "clip_ratio/high_max": 0.0020574462832883, "clip_ratio/high_mean": 0.0007554463791166199, "clip_ratio/low_mean": 0.000940479764722113, "clip_ratio/low_min": 6.0541056882357225e-05, "clip_ratio/region_mean": 0.001695926155662164, "epoch": 0.08241312730051509, "grad_norm": 0.1065397709608078, "learning_rate": 2e-07, "loss": 0.0174, "step": 883 }, { "clip_ratio/high_max": 0.0019534163729986176, "clip_ratio/high_mean": 0.0008670921142766019, "clip_ratio/low_mean": 0.0008861019305186346, "clip_ratio/low_min": 1.3935339666204527e-05, "clip_ratio/region_mean": 0.0017531940175103955, "epoch": 0.08250646040051567, "grad_norm": 0.11947846412658691, "learning_rate": 2e-07, "loss": 0.0288, "step": 884 }, { "clip_ratio/high_max": 0.002271034743898781, "clip_ratio/high_mean": 0.0008737468942854321, "clip_ratio/low_mean": 0.0008831299564917572, "clip_ratio/low_min": 9.324590610049199e-05, "clip_ratio/region_mean": 0.0017568768525961787, "epoch": 0.08259979350051624, "grad_norm": 0.11321040242910385, "learning_rate": 2e-07, "loss": 0.0166, "step": 885 }, { "clip_ratio/high_max": 0.0020306627920945175, "clip_ratio/high_mean": 0.000770256832765881, "clip_ratio/low_mean": 0.0009700578320916975, "clip_ratio/low_min": 7.050455133139621e-05, "clip_ratio/region_mean": 0.0017403146412107162, "epoch": 0.08269312660051684, "grad_norm": 0.1118687316775322, "learning_rate": 2e-07, "loss": 0.0057, "step": 886 }, { "clip_ratio/high_max": 0.001880112016806379, "clip_ratio/high_mean": 0.0008832221519696759, "clip_ratio/low_mean": 0.0009546936489641666, "clip_ratio/low_min": 4.9851501898956485e-05, "clip_ratio/region_mean": 0.0018379157700110227, "epoch": 0.08278645970051741, "grad_norm": 0.12087177485227585, "learning_rate": 2e-07, "loss": 0.0183, "step": 887 }, { "clip_ratio/high_max": 0.001974722123122774, "clip_ratio/high_mean": 0.0008303438971779542, "clip_ratio/low_mean": 0.0009517904691165313, "clip_ratio/low_min": 5.022104051022325e-05, "clip_ratio/region_mean": 0.0017821343571995385, "epoch": 0.08287979280051799, "grad_norm": 0.1101384162902832, "learning_rate": 2e-07, "loss": 0.0322, "step": 888 }, { "clip_ratio/high_max": 0.0023476662099710666, "clip_ratio/high_mean": 0.0010228882692899788, "clip_ratio/low_mean": 0.0008413346295128576, "clip_ratio/low_min": 4.152257952227956e-05, "clip_ratio/region_mean": 0.0018642228678800166, "epoch": 0.08297312590051859, "grad_norm": 0.11497638374567032, "learning_rate": 2e-07, "loss": -0.0239, "step": 889 }, { "clip_ratio/high_max": 0.0017871092022687662, "clip_ratio/high_mean": 0.0008639523712190567, "clip_ratio/low_mean": 0.0009225734738720348, "clip_ratio/low_min": 9.810910250962479e-05, "clip_ratio/region_mean": 0.0017865258414531127, "epoch": 0.08306645900051916, "grad_norm": 0.1248597651720047, "learning_rate": 2e-07, "loss": 0.0697, "step": 890 }, { "clip_ratio/high_max": 0.0020408479940670077, "clip_ratio/high_mean": 0.0007691061164223356, "clip_ratio/low_mean": 0.00086121924505278, "clip_ratio/low_min": 3.6258114960219245e-05, "clip_ratio/region_mean": 0.001630325372389052, "epoch": 0.08315979210051976, "grad_norm": 0.12337683886289597, "learning_rate": 2e-07, "loss": 0.0393, "step": 891 }, { "clip_ratio/high_max": 0.0017209156649187207, "clip_ratio/high_mean": 0.0007117234508768888, "clip_ratio/low_mean": 0.0009266066081181634, "clip_ratio/low_min": 6.840476271463558e-05, "clip_ratio/region_mean": 0.0016383300680899993, "epoch": 0.08325312520052033, "grad_norm": 0.11849468946456909, "learning_rate": 2e-07, "loss": 0.0191, "step": 892 }, { "clip_ratio/high_max": 0.002107576103298925, "clip_ratio/high_mean": 0.000852651372042601, "clip_ratio/low_mean": 0.0008518492741131922, "clip_ratio/low_min": 6.255854714254383e-05, "clip_ratio/region_mean": 0.0017045006461557932, "epoch": 0.08334645830052091, "grad_norm": 0.123601533472538, "learning_rate": 2e-07, "loss": 0.0141, "step": 893 }, { "clip_ratio/high_max": 0.0017648997272772249, "clip_ratio/high_mean": 0.0007755604892736301, "clip_ratio/low_mean": 0.0008379606133530615, "clip_ratio/low_min": 0.000113152645099035, "clip_ratio/region_mean": 0.0016135211080836598, "epoch": 0.0834397914005215, "grad_norm": 0.11255298554897308, "learning_rate": 2e-07, "loss": 0.0393, "step": 894 }, { "clip_ratio/high_max": 0.0021342843465390615, "clip_ratio/high_mean": 0.0009118295747612137, "clip_ratio/low_mean": 0.0009437077751499601, "clip_ratio/low_min": 5.5717297072988003e-05, "clip_ratio/region_mean": 0.001855537364463089, "epoch": 0.08353312450052208, "grad_norm": 0.12703007459640503, "learning_rate": 2e-07, "loss": 0.0066, "step": 895 }, { "clip_ratio/high_max": 0.0021259242566884495, "clip_ratio/high_mean": 0.0008717195778444875, "clip_ratio/low_mean": 0.0009662341544753872, "clip_ratio/low_min": 5.353550841391552e-05, "clip_ratio/region_mean": 0.001837953706854023, "epoch": 0.08362645760052266, "grad_norm": 0.110402412712574, "learning_rate": 2e-07, "loss": 0.0378, "step": 896 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.01409912109375, "completions/max_length": 4096.0, "completions/max_terminated_length": 4087.0, "completions/mean_length": 613.0856323242188, "completions/mean_terminated_length": 563.27734375, "completions/min_length": 3.0, "completions/min_terminated_length": 3.0, "epoch": 0.08371979070052325, "grad_norm": 0.12162449210882187, "learning_rate": 2e-07, "loss": -0.0045, "num_tokens": 652469314.0, "reward": 0.567513644695282, "reward_std": 0.20693106949329376, "rewards/simpleverify_reward/mean": 0.5675135850906372, "rewards/simpleverify_reward/std": 0.4954230785369873, "step": 897 }, { "clip_ratio/high_max": 0.0018112511315848678, "clip_ratio/high_mean": 0.0008163897473423276, "clip_ratio/low_mean": 0.0005542654935197788, "clip_ratio/low_min": 1.227415577886859e-05, "clip_ratio/region_mean": 0.0013706552599614952, "epoch": 0.08381312380052383, "grad_norm": 0.12288690358400345, "learning_rate": 2e-07, "loss": 0.0516, "step": 898 }, { "clip_ratio/high_max": 0.0020576967217493802, "clip_ratio/high_mean": 0.0007747524377919035, "clip_ratio/low_mean": 0.0006511052870337153, "clip_ratio/low_min": 5.7001117056643125e-05, "clip_ratio/region_mean": 0.0014258577066357248, "epoch": 0.08390645690052441, "grad_norm": 0.1210097074508667, "learning_rate": 2e-07, "loss": 0.022, "step": 899 }, { "clip_ratio/high_max": 0.0016279331684927456, "clip_ratio/high_mean": 0.0007152366470108973, "clip_ratio/low_mean": 0.0005978735853204853, "clip_ratio/low_min": 1.5570503819617443e-05, "clip_ratio/region_mean": 0.0013131102241459303, "epoch": 0.083999790000525, "grad_norm": 0.1158841997385025, "learning_rate": 2e-07, "loss": 0.0236, "step": 900 }, { "clip_ratio/high_max": 0.002052200525213266, "clip_ratio/high_mean": 0.0008301850302814273, "clip_ratio/low_mean": 0.0005943389642197872, "clip_ratio/low_min": 6.800342725910014e-05, "clip_ratio/region_mean": 0.0014245240272430237, "epoch": 0.08409312310052558, "grad_norm": 0.11771244555711746, "learning_rate": 2e-07, "loss": 0.0431, "step": 901 }, { "clip_ratio/high_max": 0.0017894144948513713, "clip_ratio/high_mean": 0.0008076579415501328, "clip_ratio/low_mean": 0.0005177047241886612, "clip_ratio/low_min": 1.636982779018581e-05, "clip_ratio/region_mean": 0.001325362693023635, "epoch": 0.08418645620052617, "grad_norm": 0.12184035032987595, "learning_rate": 2e-07, "loss": 0.0336, "step": 902 }, { "clip_ratio/high_max": 0.0021417176139948424, "clip_ratio/high_mean": 0.0008567755485273665, "clip_ratio/low_mean": 0.000586350288358517, "clip_ratio/low_min": 5.038973358750809e-05, "clip_ratio/region_mean": 0.0014431258387048729, "epoch": 0.08427978930052675, "grad_norm": 0.11789008975028992, "learning_rate": 2e-07, "loss": 0.0285, "step": 903 }, { "clip_ratio/high_max": 0.001982196539756842, "clip_ratio/high_mean": 0.0008022846213862067, "clip_ratio/low_mean": 0.0005833629938933882, "clip_ratio/low_min": 8.178356529242592e-05, "clip_ratio/region_mean": 0.001385647618008079, "epoch": 0.08437312240052733, "grad_norm": 0.11251118779182434, "learning_rate": 2e-07, "loss": 0.0203, "step": 904 }, { "clip_ratio/high_max": 0.001968657725228695, "clip_ratio/high_mean": 0.0006951486739126267, "clip_ratio/low_mean": 0.0006485604608315043, "clip_ratio/low_min": 2.9024657123954967e-05, "clip_ratio/region_mean": 0.0013437091038213111, "epoch": 0.08446645550052792, "grad_norm": 0.10889243334531784, "learning_rate": 2e-07, "loss": 0.0493, "step": 905 }, { "clip_ratio/high_max": 0.0022171865493874066, "clip_ratio/high_mean": 0.0008838489738991484, "clip_ratio/low_mean": 0.0006033356248735799, "clip_ratio/low_min": 4.4095952034695074e-05, "clip_ratio/region_mean": 0.0014871845742163714, "epoch": 0.0845597886005285, "grad_norm": 0.11601719260215759, "learning_rate": 2e-07, "loss": -0.02, "step": 906 }, { "clip_ratio/high_max": 0.0019106171166640706, "clip_ratio/high_mean": 0.0008115542987070512, "clip_ratio/low_mean": 0.0006392508712451672, "clip_ratio/low_min": 5.486358168127481e-05, "clip_ratio/region_mean": 0.0014508051608572714, "epoch": 0.08465312170052908, "grad_norm": 0.11521967500448227, "learning_rate": 2e-07, "loss": 0.0216, "step": 907 }, { "clip_ratio/high_max": 0.0022556756375706755, "clip_ratio/high_mean": 0.0009922235913109034, "clip_ratio/low_mean": 0.0006621750399062876, "clip_ratio/low_min": 2.4872084395610727e-05, "clip_ratio/region_mean": 0.001654398649407085, "epoch": 0.08474645480052967, "grad_norm": 0.12133180350065231, "learning_rate": 2e-07, "loss": 0.0155, "step": 908 }, { "clip_ratio/high_max": 0.0018382212801952846, "clip_ratio/high_mean": 0.0007134501483960776, "clip_ratio/low_mean": 0.0005804501379316207, "clip_ratio/low_min": 2.909769318648614e-05, "clip_ratio/region_mean": 0.00129390028087073, "epoch": 0.08483978790053025, "grad_norm": 0.1057668924331665, "learning_rate": 2e-07, "loss": 0.0401, "step": 909 }, { "clip_ratio/high_max": 0.00180272100988077, "clip_ratio/high_mean": 0.0007555153497378342, "clip_ratio/low_mean": 0.0006065388570277719, "clip_ratio/low_min": 2.6427924240124412e-05, "clip_ratio/region_mean": 0.001362054197670659, "epoch": 0.08493312100053083, "grad_norm": 0.11370846629142761, "learning_rate": 2e-07, "loss": 0.046, "step": 910 }, { "clip_ratio/high_max": 0.002161943026294466, "clip_ratio/high_mean": 0.0009072519933397416, "clip_ratio/low_mean": 0.0006787254933442455, "clip_ratio/low_min": 4.366896610008553e-05, "clip_ratio/region_mean": 0.0015859774648561142, "epoch": 0.08502645410053142, "grad_norm": 0.11793677508831024, "learning_rate": 2e-07, "loss": 0.0047, "step": 911 }, { "clip_ratio/high_max": 0.0015450228747795336, "clip_ratio/high_mean": 0.0006537077142638736, "clip_ratio/low_mean": 0.0006339934134302894, "clip_ratio/low_min": 2.498501089576166e-05, "clip_ratio/region_mean": 0.0012877011286036577, "epoch": 0.085119787200532, "grad_norm": 0.11759548634290695, "learning_rate": 2e-07, "loss": 0.0835, "step": 912 }, { "clip_ratio/high_max": 0.0019005588837899268, "clip_ratio/high_mean": 0.0008523499345756136, "clip_ratio/low_mean": 0.0006931839270691853, "clip_ratio/low_min": 3.243231003580149e-05, "clip_ratio/region_mean": 0.0015455338543688413, "epoch": 0.08521312030053259, "grad_norm": 0.12224702537059784, "learning_rate": 2e-07, "loss": 0.0271, "step": 913 }, { "clip_ratio/high_max": 0.002013933008129243, "clip_ratio/high_mean": 0.0006861950678285211, "clip_ratio/low_mean": 0.0006104234525992069, "clip_ratio/low_min": 2.5240056857001036e-05, "clip_ratio/region_mean": 0.001296618502237834, "epoch": 0.08530645340053317, "grad_norm": 0.11139517277479172, "learning_rate": 2e-07, "loss": 0.0119, "step": 914 }, { "clip_ratio/high_max": 0.0017724530407576822, "clip_ratio/high_mean": 0.000858788760524476, "clip_ratio/low_mean": 0.0007118752237147419, "clip_ratio/low_min": 3.753434339159867e-05, "clip_ratio/region_mean": 0.0015706639605923556, "epoch": 0.08539978650053374, "grad_norm": 0.11773455142974854, "learning_rate": 2e-07, "loss": 0.0022, "step": 915 }, { "clip_ratio/high_max": 0.002184279750508722, "clip_ratio/high_mean": 0.0008765644579398213, "clip_ratio/low_mean": 0.0006635896297666477, "clip_ratio/low_min": 1.2124150998715777e-05, "clip_ratio/region_mean": 0.0015401540949824266, "epoch": 0.08549311960053434, "grad_norm": 0.12331472337245941, "learning_rate": 2e-07, "loss": 0.0608, "step": 916 }, { "clip_ratio/high_max": 0.0020577519353537355, "clip_ratio/high_mean": 0.0008414249550696695, "clip_ratio/low_mean": 0.0006563262486452004, "clip_ratio/low_min": 3.9569691580254585e-05, "clip_ratio/region_mean": 0.0014977512473706156, "epoch": 0.08558645270053492, "grad_norm": 0.11278630793094635, "learning_rate": 2e-07, "loss": 0.0004, "step": 917 }, { "clip_ratio/high_max": 0.0019813824765151367, "clip_ratio/high_mean": 0.00086567283324257, "clip_ratio/low_mean": 0.0007036796514512389, "clip_ratio/low_min": 5.2408238843781874e-05, "clip_ratio/region_mean": 0.0015693524474045262, "epoch": 0.0856797858005355, "grad_norm": 0.12220539152622223, "learning_rate": 2e-07, "loss": 0.0315, "step": 918 }, { "clip_ratio/high_max": 0.002388926935964264, "clip_ratio/high_mean": 0.0008990698697743937, "clip_ratio/low_mean": 0.000677353227729327, "clip_ratio/low_min": 1.3012700037506875e-05, "clip_ratio/region_mean": 0.0015764231320645195, "epoch": 0.08577311890053609, "grad_norm": 0.12273003160953522, "learning_rate": 2e-07, "loss": 0.0097, "step": 919 }, { "clip_ratio/high_max": 0.0018908923448179848, "clip_ratio/high_mean": 0.0007378340014838614, "clip_ratio/low_mean": 0.0007001546127867186, "clip_ratio/low_min": 4.040355088363867e-05, "clip_ratio/region_mean": 0.0014379886306414846, "epoch": 0.08586645200053666, "grad_norm": 0.11449079215526581, "learning_rate": 2e-07, "loss": 0.0389, "step": 920 }, { "clip_ratio/high_max": 0.002017174403590616, "clip_ratio/high_mean": 0.0008725191764824558, "clip_ratio/low_mean": 0.0007863672344683437, "clip_ratio/low_min": 6.224476146599045e-05, "clip_ratio/region_mean": 0.0016588863618380856, "epoch": 0.08595978510053724, "grad_norm": 0.1231214702129364, "learning_rate": 2e-07, "loss": 0.0207, "step": 921 }, { "clip_ratio/high_max": 0.0021106831991346553, "clip_ratio/high_mean": 0.0008220247109420598, "clip_ratio/low_mean": 0.0007833340187062277, "clip_ratio/low_min": 6.12956491750083e-05, "clip_ratio/region_mean": 0.0016053587714850437, "epoch": 0.08605311820053783, "grad_norm": 0.1185522973537445, "learning_rate": 2e-07, "loss": 0.0307, "step": 922 }, { "clip_ratio/high_max": 0.001878073591797147, "clip_ratio/high_mean": 0.0008282860217150301, "clip_ratio/low_mean": 0.0007637700273335213, "clip_ratio/low_min": 4.9278947699349374e-05, "clip_ratio/region_mean": 0.0015920560108497739, "epoch": 0.08614645130053841, "grad_norm": 0.11243151873350143, "learning_rate": 2e-07, "loss": 0.0252, "step": 923 }, { "clip_ratio/high_max": 0.0016648050950607285, "clip_ratio/high_mean": 0.000784222911534016, "clip_ratio/low_mean": 0.0006318370633380255, "clip_ratio/low_min": 2.6227444323012605e-05, "clip_ratio/region_mean": 0.0014160599494061898, "epoch": 0.086239784400539, "grad_norm": 0.11436755210161209, "learning_rate": 2e-07, "loss": 0.0114, "step": 924 }, { "clip_ratio/high_max": 0.0021438626645249315, "clip_ratio/high_mean": 0.0009502341399638681, "clip_ratio/low_mean": 0.0007864092440286186, "clip_ratio/low_min": 5.119885281601455e-05, "clip_ratio/region_mean": 0.0017366433894494548, "epoch": 0.08633311750053958, "grad_norm": 0.1177460253238678, "learning_rate": 2e-07, "loss": 0.0048, "step": 925 }, { "clip_ratio/high_max": 0.0018546308201621287, "clip_ratio/high_mean": 0.0007976996439538198, "clip_ratio/low_mean": 0.0008232041564042447, "clip_ratio/low_min": 0.0001256245641343412, "clip_ratio/region_mean": 0.0016209037930821069, "epoch": 0.08642645060054016, "grad_norm": 0.1133279874920845, "learning_rate": 2e-07, "loss": 0.0389, "step": 926 }, { "clip_ratio/high_max": 0.002005259295401629, "clip_ratio/high_mean": 0.0008612799210823141, "clip_ratio/low_mean": 0.0007214718443719903, "clip_ratio/low_min": 4.7352654291898943e-05, "clip_ratio/region_mean": 0.0015827517563593574, "epoch": 0.08651978370054075, "grad_norm": 0.13077805936336517, "learning_rate": 2e-07, "loss": 0.0178, "step": 927 }, { "clip_ratio/high_max": 0.0019897491729352623, "clip_ratio/high_mean": 0.0008163117918229545, "clip_ratio/low_mean": 0.0008165552717400715, "clip_ratio/low_min": 7.056026879581623e-05, "clip_ratio/region_mean": 0.0016328670753864571, "epoch": 0.08661311680054133, "grad_norm": 0.11461208015680313, "learning_rate": 2e-07, "loss": 0.0341, "step": 928 }, { "clip_ratio/high_max": 0.00191262239968637, "clip_ratio/high_mean": 0.0009016308467835188, "clip_ratio/low_mean": 0.0007832888713892316, "clip_ratio/low_min": 3.441614353505429e-05, "clip_ratio/region_mean": 0.0016849196872499306, "epoch": 0.08670644990054191, "grad_norm": 0.1089409813284874, "learning_rate": 2e-07, "loss": 0.0162, "step": 929 }, { "clip_ratio/high_max": 0.0019098342309007421, "clip_ratio/high_mean": 0.0008114214615488891, "clip_ratio/low_mean": 0.0007405589203699492, "clip_ratio/low_min": 9.251988376490772e-05, "clip_ratio/region_mean": 0.0015519803928327747, "epoch": 0.0867997830005425, "grad_norm": 0.11598870903253555, "learning_rate": 2e-07, "loss": 0.041, "step": 930 }, { "clip_ratio/high_max": 0.0017543869435030501, "clip_ratio/high_mean": 0.000739471481210785, "clip_ratio/low_mean": 0.0008223292315960862, "clip_ratio/low_min": 3.6769027246918995e-05, "clip_ratio/region_mean": 0.0015618007237208076, "epoch": 0.08689311610054308, "grad_norm": 0.10901755839586258, "learning_rate": 2e-07, "loss": 0.0514, "step": 931 }, { "clip_ratio/high_max": 0.0018613182837725617, "clip_ratio/high_mean": 0.0007458259678969625, "clip_ratio/low_mean": 0.0009024664395838045, "clip_ratio/low_min": 0.00010434735304443166, "clip_ratio/region_mean": 0.0016482924038427882, "epoch": 0.08698644920054366, "grad_norm": 0.11705763638019562, "learning_rate": 2e-07, "loss": 0.0672, "step": 932 }, { "clip_ratio/high_max": 0.002030564395681722, "clip_ratio/high_mean": 0.0008195288701244863, "clip_ratio/low_mean": 0.0008193046214728383, "clip_ratio/low_min": 5.855677773070056e-05, "clip_ratio/region_mean": 0.0016388334915973246, "epoch": 0.08707978230054425, "grad_norm": 0.1096845343708992, "learning_rate": 2e-07, "loss": 0.0317, "step": 933 }, { "clip_ratio/high_max": 0.002046170164248906, "clip_ratio/high_mean": 0.0008752874382480513, "clip_ratio/low_mean": 0.0008919659048842732, "clip_ratio/low_min": 5.395487096393481e-05, "clip_ratio/region_mean": 0.001767253335856367, "epoch": 0.08717311540054483, "grad_norm": 0.1310867816209793, "learning_rate": 2e-07, "loss": 0.0261, "step": 934 }, { "clip_ratio/high_max": 0.0019501530405250378, "clip_ratio/high_mean": 0.0008152059635904152, "clip_ratio/low_mean": 0.0008583470626035705, "clip_ratio/low_min": 0.00012287273966649082, "clip_ratio/region_mean": 0.001673553000728134, "epoch": 0.08726644850054542, "grad_norm": 0.17055778205394745, "learning_rate": 2e-07, "loss": 0.034, "step": 935 }, { "clip_ratio/high_max": 0.002291861492267344, "clip_ratio/high_mean": 0.000919654641620582, "clip_ratio/low_mean": 0.0007677253706788179, "clip_ratio/low_min": 2.5183428078889847e-05, "clip_ratio/region_mean": 0.0016873800559551455, "epoch": 0.087359781600546, "grad_norm": 0.12035069614648819, "learning_rate": 2e-07, "loss": 0.0093, "step": 936 }, { "clip_ratio/high_max": 0.0020925548815284856, "clip_ratio/high_mean": 0.0008404631262237672, "clip_ratio/low_mean": 0.0008868924269336276, "clip_ratio/low_min": 0.00010809292780322721, "clip_ratio/region_mean": 0.0017273555895371828, "epoch": 0.08745311470054658, "grad_norm": 0.12469220161437988, "learning_rate": 2e-07, "loss": 0.0543, "step": 937 }, { "clip_ratio/high_max": 0.002034360441030003, "clip_ratio/high_mean": 0.0008725235202291515, "clip_ratio/low_mean": 0.0007693826246395474, "clip_ratio/low_min": 1.2562813935801387e-05, "clip_ratio/region_mean": 0.0016419061503256671, "epoch": 0.08754644780054717, "grad_norm": 0.11948986351490021, "learning_rate": 2e-07, "loss": 0.0317, "step": 938 }, { "clip_ratio/high_max": 0.0022533698356710374, "clip_ratio/high_mean": 0.000901546940440312, "clip_ratio/low_mean": 0.0008149975365085993, "clip_ratio/low_min": 7.090882627380779e-05, "clip_ratio/region_mean": 0.0017165445169666782, "epoch": 0.08763978090054775, "grad_norm": 0.10130567103624344, "learning_rate": 2e-07, "loss": 0.0302, "step": 939 }, { "clip_ratio/high_max": 0.002076921555271838, "clip_ratio/high_mean": 0.0008431170026597101, "clip_ratio/low_mean": 0.0008643443361506797, "clip_ratio/low_min": 9.085899819183396e-05, "clip_ratio/region_mean": 0.001707461357000284, "epoch": 0.08773311400054833, "grad_norm": 0.11579747498035431, "learning_rate": 2e-07, "loss": 0.0335, "step": 940 }, { "clip_ratio/high_max": 0.0020242117534507997, "clip_ratio/high_mean": 0.0008476191305817338, "clip_ratio/low_mean": 0.0008681526815053076, "clip_ratio/low_min": 7.699066190980375e-05, "clip_ratio/region_mean": 0.001715771810268052, "epoch": 0.08782644710054892, "grad_norm": 0.11279744654893875, "learning_rate": 2e-07, "loss": 0.0421, "step": 941 }, { "clip_ratio/high_max": 0.002041839514276944, "clip_ratio/high_mean": 0.0009012126192828873, "clip_ratio/low_mean": 0.0008445609109912766, "clip_ratio/low_min": 3.9047647987899836e-05, "clip_ratio/region_mean": 0.001745773530274164, "epoch": 0.0879197802005495, "grad_norm": 0.11809305846691132, "learning_rate": 2e-07, "loss": -0.0215, "step": 942 }, { "clip_ratio/high_max": 0.0016858389935805462, "clip_ratio/high_mean": 0.00079108682621154, "clip_ratio/low_mean": 0.0007168900474425755, "clip_ratio/low_min": 9.11174611246679e-05, "clip_ratio/region_mean": 0.0015079768636496738, "epoch": 0.08801311330055009, "grad_norm": 0.11560371518135071, "learning_rate": 2e-07, "loss": 0.037, "step": 943 }, { "clip_ratio/high_max": 0.00236108490753395, "clip_ratio/high_mean": 0.0009472165602346649, "clip_ratio/low_mean": 0.0007802465843269601, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0017274631682084873, "epoch": 0.08810644640055067, "grad_norm": 0.12202728539705276, "learning_rate": 2e-07, "loss": 0.0232, "step": 944 }, { "clip_ratio/high_max": 0.001921471739478875, "clip_ratio/high_mean": 0.0008335469210578594, "clip_ratio/low_mean": 0.0008223636341426754, "clip_ratio/low_min": 9.087680882657878e-05, "clip_ratio/region_mean": 0.0016559105497435667, "epoch": 0.08819977950055125, "grad_norm": 0.10965220630168915, "learning_rate": 2e-07, "loss": 0.0439, "step": 945 }, { "clip_ratio/high_max": 0.002313583761861082, "clip_ratio/high_mean": 0.0010062177807412809, "clip_ratio/low_mean": 0.000809705999927246, "clip_ratio/low_min": 6.776536793040577e-06, "clip_ratio/region_mean": 0.0018159237952204421, "epoch": 0.08829311260055184, "grad_norm": 0.1171477660536766, "learning_rate": 2e-07, "loss": -0.0243, "step": 946 }, { "clip_ratio/high_max": 0.002093440489261411, "clip_ratio/high_mean": 0.000878754144650884, "clip_ratio/low_mean": 0.0008670026891195448, "clip_ratio/low_min": 0.00017789201592677273, "clip_ratio/region_mean": 0.0017457568901591003, "epoch": 0.08838644570055242, "grad_norm": 0.11711817979812622, "learning_rate": 2e-07, "loss": 0.031, "step": 947 }, { "clip_ratio/high_max": 0.0019138724965159781, "clip_ratio/high_mean": 0.0007966125303937588, "clip_ratio/low_mean": 0.0007924304645712255, "clip_ratio/low_min": 4.5359948217083e-05, "clip_ratio/region_mean": 0.0015890430113358889, "epoch": 0.088479778800553, "grad_norm": 0.11546622216701508, "learning_rate": 2e-07, "loss": 0.0526, "step": 948 }, { "clip_ratio/high_max": 0.002295453494298272, "clip_ratio/high_mean": 0.0010069425279652933, "clip_ratio/low_mean": 0.0008885426013875986, "clip_ratio/low_min": 8.437967608188046e-05, "clip_ratio/region_mean": 0.001895485089335125, "epoch": 0.08857311190055359, "grad_norm": 0.1301276683807373, "learning_rate": 2e-07, "loss": 0.01, "step": 949 }, { "clip_ratio/high_max": 0.0018856589413189795, "clip_ratio/high_mean": 0.0008266574859590037, "clip_ratio/low_mean": 0.0008140431564243045, "clip_ratio/low_min": 0.00010384570941823767, "clip_ratio/region_mean": 0.0016407006260124035, "epoch": 0.08866644500055416, "grad_norm": 0.12614940106868744, "learning_rate": 2e-07, "loss": 0.0195, "step": 950 }, { "clip_ratio/high_max": 0.0021159039752092212, "clip_ratio/high_mean": 0.0008462677269562846, "clip_ratio/low_mean": 0.0008240963288699277, "clip_ratio/low_min": 5.575320847128751e-05, "clip_ratio/region_mean": 0.0016703640576452017, "epoch": 0.08875977810055474, "grad_norm": 0.12276522815227509, "learning_rate": 2e-07, "loss": -0.0034, "step": 951 }, { "clip_ratio/high_max": 0.0019863678026013076, "clip_ratio/high_mean": 0.000858555073136813, "clip_ratio/low_mean": 0.0009153956052614376, "clip_ratio/low_min": 0.00013255642261356115, "clip_ratio/region_mean": 0.0017739506874931976, "epoch": 0.08885311120055533, "grad_norm": 0.10823127627372742, "learning_rate": 2e-07, "loss": 0.0252, "step": 952 }, { "clip_ratio/high_max": 0.002332548850972671, "clip_ratio/high_mean": 0.0009975165121431928, "clip_ratio/low_mean": 0.0008832455096126068, "clip_ratio/low_min": 8.306824020110071e-05, "clip_ratio/region_mean": 0.0018807620581355877, "epoch": 0.08894644430055591, "grad_norm": 0.11643475294113159, "learning_rate": 2e-07, "loss": 0.014, "step": 953 }, { "clip_ratio/high_max": 0.0018594835601106752, "clip_ratio/high_mean": 0.0007775677095196443, "clip_ratio/low_mean": 0.0008015284965949832, "clip_ratio/low_min": 7.283348895725794e-05, "clip_ratio/region_mean": 0.0015790962206665426, "epoch": 0.0890397774005565, "grad_norm": 0.11232029646635056, "learning_rate": 2e-07, "loss": 0.0095, "step": 954 }, { "clip_ratio/high_max": 0.0017830657889135182, "clip_ratio/high_mean": 0.0007708430512138875, "clip_ratio/low_mean": 0.000925613843719475, "clip_ratio/low_min": 6.687655968562467e-05, "clip_ratio/region_mean": 0.001696456893114373, "epoch": 0.08913311050055708, "grad_norm": 0.10987037420272827, "learning_rate": 2e-07, "loss": 0.0254, "step": 955 }, { "clip_ratio/high_max": 0.0020257518372091, "clip_ratio/high_mean": 0.0008076957274170127, "clip_ratio/low_mean": 0.0009689747166703455, "clip_ratio/low_min": 9.391971707373159e-05, "clip_ratio/region_mean": 0.0017766704258974642, "epoch": 0.08922644360055766, "grad_norm": 0.13589760661125183, "learning_rate": 2e-07, "loss": 0.0634, "step": 956 }, { "clip_ratio/high_max": 0.0024122320755850524, "clip_ratio/high_mean": 0.0008989317502710037, "clip_ratio/low_mean": 0.0008413095092691947, "clip_ratio/low_min": 3.076743905694457e-05, "clip_ratio/region_mean": 0.0017402412631781772, "epoch": 0.08931977670055825, "grad_norm": 0.11439386010169983, "learning_rate": 2e-07, "loss": 0.0137, "step": 957 }, { "clip_ratio/high_max": 0.0023550021323899273, "clip_ratio/high_mean": 0.0008650238451082259, "clip_ratio/low_mean": 0.0008620612325103139, "clip_ratio/low_min": 7.331076449190732e-05, "clip_ratio/region_mean": 0.0017270850948989391, "epoch": 0.08941310980055883, "grad_norm": 0.11734023690223694, "learning_rate": 2e-07, "loss": 0.0092, "step": 958 }, { "clip_ratio/high_max": 0.0019581940323405433, "clip_ratio/high_mean": 0.0007858424269215902, "clip_ratio/low_mean": 0.0008579355526308063, "clip_ratio/low_min": 4.8267926558764884e-05, "clip_ratio/region_mean": 0.0016437779959233012, "epoch": 0.08950644290055941, "grad_norm": 0.11336815357208252, "learning_rate": 2e-07, "loss": 0.0143, "step": 959 }, { "clip_ratio/high_max": 0.0018540622113505378, "clip_ratio/high_mean": 0.0007637033941136906, "clip_ratio/low_mean": 0.0007706349424552172, "clip_ratio/low_min": 5.44963777429075e-05, "clip_ratio/region_mean": 0.0015343383347499184, "epoch": 0.08959977600056, "grad_norm": 0.11859084665775299, "learning_rate": 2e-07, "loss": 0.0157, "step": 960 }, { "clip_ratio/high_max": 0.0019286093884147704, "clip_ratio/high_mean": 0.0008351902633876307, "clip_ratio/low_mean": 0.0008590877878305037, "clip_ratio/low_min": 4.528342105913907e-05, "clip_ratio/region_mean": 0.0016942781148827635, "epoch": 0.08969310910056058, "grad_norm": 0.12416113913059235, "learning_rate": 2e-07, "loss": 0.0192, "step": 961 }, { "clip_ratio/high_max": 0.0024747895877226256, "clip_ratio/high_mean": 0.0009779722859093454, "clip_ratio/low_mean": 0.0008579803579777945, "clip_ratio/low_min": 3.0215937840694096e-05, "clip_ratio/region_mean": 0.001835952658439055, "epoch": 0.08978644220056116, "grad_norm": 0.10516249388456345, "learning_rate": 2e-07, "loss": -0.0232, "step": 962 }, { "clip_ratio/high_max": 0.0019244435461587273, "clip_ratio/high_mean": 0.0008635844442324014, "clip_ratio/low_mean": 0.0008423518775089178, "clip_ratio/low_min": 1.2344459719315637e-05, "clip_ratio/region_mean": 0.0017059362871805206, "epoch": 0.08987977530056175, "grad_norm": 0.11149899661540985, "learning_rate": 2e-07, "loss": 0.025, "step": 963 }, { "clip_ratio/high_max": 0.0021665901294909418, "clip_ratio/high_mean": 0.00097296190506313, "clip_ratio/low_mean": 0.0006637404785578838, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0016367023599741515, "epoch": 0.08997310840056233, "grad_norm": 0.107357457280159, "learning_rate": 2e-07, "loss": -0.0238, "step": 964 }, { "clip_ratio/high_max": 0.002055946875771042, "clip_ratio/high_mean": 0.0008675349254190223, "clip_ratio/low_mean": 0.0010152770373679232, "clip_ratio/low_min": 0.00015040939797472674, "clip_ratio/region_mean": 0.0018828120082616806, "epoch": 0.09006644150056292, "grad_norm": 0.11596270650625229, "learning_rate": 2e-07, "loss": 0.0401, "step": 965 }, { "clip_ratio/high_max": 0.0018330240363866324, "clip_ratio/high_mean": 0.0007851546160964062, "clip_ratio/low_mean": 0.0008707594697625609, "clip_ratio/low_min": 7.75835496824584e-05, "clip_ratio/region_mean": 0.0016559140931349248, "epoch": 0.0901597746005635, "grad_norm": 0.1132001057267189, "learning_rate": 2e-07, "loss": 0.0541, "step": 966 }, { "clip_ratio/high_max": 0.0018118869375030044, "clip_ratio/high_mean": 0.0008117737361317268, "clip_ratio/low_mean": 0.0009556810673529981, "clip_ratio/low_min": 5.418737873696955e-05, "clip_ratio/region_mean": 0.001767454836226534, "epoch": 0.09025310770056408, "grad_norm": 0.12437739223241806, "learning_rate": 2e-07, "loss": 0.0671, "step": 967 }, { "clip_ratio/high_max": 0.002003908397455234, "clip_ratio/high_mean": 0.0008942763815866783, "clip_ratio/low_mean": 0.0009594810235284967, "clip_ratio/low_min": 0.00019052210609515896, "clip_ratio/region_mean": 0.0018537573996582069, "epoch": 0.09034644080056467, "grad_norm": 0.12926779687404633, "learning_rate": 2e-07, "loss": 0.0395, "step": 968 }, { "clip_ratio/high_max": 0.0017841601729742251, "clip_ratio/high_mean": 0.0008013698879949516, "clip_ratio/low_mean": 0.0008834136096993461, "clip_ratio/low_min": 8.871262252796441e-05, "clip_ratio/region_mean": 0.0016847835067892447, "epoch": 0.09043977390056525, "grad_norm": 0.1251688301563263, "learning_rate": 2e-07, "loss": 0.0876, "step": 969 }, { "clip_ratio/high_max": 0.0023219510330818594, "clip_ratio/high_mean": 0.0009198222833219916, "clip_ratio/low_mean": 0.0009581765534676379, "clip_ratio/low_min": 0.00013087765273667173, "clip_ratio/region_mean": 0.0018779988677124493, "epoch": 0.09053310700056583, "grad_norm": 0.10932859033346176, "learning_rate": 2e-07, "loss": 0.0096, "step": 970 }, { "clip_ratio/high_max": 0.002132044788595522, "clip_ratio/high_mean": 0.0009358852075820323, "clip_ratio/low_mean": 0.000817614954939927, "clip_ratio/low_min": 6.469332311098697e-05, "clip_ratio/region_mean": 0.0017535001825308427, "epoch": 0.09062644010056642, "grad_norm": 0.1037466898560524, "learning_rate": 2e-07, "loss": -0.0083, "step": 971 }, { "clip_ratio/high_max": 0.002072294180834433, "clip_ratio/high_mean": 0.0009490374741289997, "clip_ratio/low_mean": 0.0010738928613136522, "clip_ratio/low_min": 0.00022222782081371406, "clip_ratio/region_mean": 0.0020229303336236626, "epoch": 0.090719773200567, "grad_norm": 0.11123389005661011, "learning_rate": 2e-07, "loss": 0.0237, "step": 972 }, { "clip_ratio/high_max": 0.002361332473810762, "clip_ratio/high_mean": 0.0008936092999647371, "clip_ratio/low_mean": 0.0009090846269828035, "clip_ratio/low_min": 6.882975230837474e-05, "clip_ratio/region_mean": 0.0018026939142146148, "epoch": 0.09081310630056758, "grad_norm": 0.11967220157384872, "learning_rate": 2e-07, "loss": 0.0112, "step": 973 }, { "clip_ratio/high_max": 0.002203014009865001, "clip_ratio/high_mean": 0.0008650745039631147, "clip_ratio/low_mean": 0.0007681401039008051, "clip_ratio/low_min": 6.3989977206802e-05, "clip_ratio/region_mean": 0.0016332145751221105, "epoch": 0.09090643940056817, "grad_norm": 0.10897765308618546, "learning_rate": 2e-07, "loss": 0.0041, "step": 974 }, { "clip_ratio/high_max": 0.0019967908738180995, "clip_ratio/high_mean": 0.0008973964613687713, "clip_ratio/low_mean": 0.0008402748062508181, "clip_ratio/low_min": 8.001156857062597e-05, "clip_ratio/region_mean": 0.0017376712639816105, "epoch": 0.09099977250056875, "grad_norm": 0.12271881103515625, "learning_rate": 2e-07, "loss": -0.0029, "step": 975 }, { "clip_ratio/high_max": 0.002196803383412771, "clip_ratio/high_mean": 0.0009303459955845028, "clip_ratio/low_mean": 0.0008683754294906976, "clip_ratio/low_min": 3.2912177630350925e-05, "clip_ratio/region_mean": 0.0017987214305321686, "epoch": 0.09109310560056934, "grad_norm": 0.11869372427463531, "learning_rate": 2e-07, "loss": -0.002, "step": 976 }, { "clip_ratio/high_max": 0.0018257142801303416, "clip_ratio/high_mean": 0.0007538001009379514, "clip_ratio/low_mean": 0.0009255762124666944, "clip_ratio/low_min": 2.9875778636778705e-05, "clip_ratio/region_mean": 0.0016793763134046458, "epoch": 0.09118643870056992, "grad_norm": 0.11280801892280579, "learning_rate": 2e-07, "loss": 0.0852, "step": 977 }, { "clip_ratio/high_max": 0.0020910201346850954, "clip_ratio/high_mean": 0.0008601889985584421, "clip_ratio/low_mean": 0.0008726039595785551, "clip_ratio/low_min": 7.63088228268316e-05, "clip_ratio/region_mean": 0.0017327929381281137, "epoch": 0.0912797718005705, "grad_norm": 0.11719376593828201, "learning_rate": 2e-07, "loss": 0.0413, "step": 978 }, { "clip_ratio/high_max": 0.0020004201651318, "clip_ratio/high_mean": 0.0008818800506560365, "clip_ratio/low_mean": 0.0009966871693904977, "clip_ratio/low_min": 2.1776619178126566e-05, "clip_ratio/region_mean": 0.0018785671927616931, "epoch": 0.09137310490057109, "grad_norm": 0.12042779475450516, "learning_rate": 2e-07, "loss": 0.0447, "step": 979 }, { "clip_ratio/high_max": 0.0020042865944560617, "clip_ratio/high_mean": 0.0008000141133379657, "clip_ratio/low_mean": 0.0009567451525072102, "clip_ratio/low_min": 0.0001877875229183701, "clip_ratio/region_mean": 0.0017567592731211334, "epoch": 0.09146643800057166, "grad_norm": 0.12119458615779877, "learning_rate": 2e-07, "loss": 0.0395, "step": 980 }, { "clip_ratio/high_max": 0.001993588884943165, "clip_ratio/high_mean": 0.0008360182036994956, "clip_ratio/low_mean": 0.000900883240319672, "clip_ratio/low_min": 8.681547205924289e-05, "clip_ratio/region_mean": 0.0017369014713040087, "epoch": 0.09155977110057224, "grad_norm": 0.11315525323152542, "learning_rate": 2e-07, "loss": 0.0345, "step": 981 }, { "clip_ratio/high_max": 0.0021334458215278573, "clip_ratio/high_mean": 0.0008581919355492573, "clip_ratio/low_mean": 0.0008236867288360372, "clip_ratio/low_min": 6.683915671601426e-05, "clip_ratio/region_mean": 0.0016818786607473157, "epoch": 0.09165310420057284, "grad_norm": 0.11125931888818741, "learning_rate": 2e-07, "loss": 0.0291, "step": 982 }, { "clip_ratio/high_max": 0.0024736154155107215, "clip_ratio/high_mean": 0.0009020390607474837, "clip_ratio/low_mean": 0.000821926452772459, "clip_ratio/low_min": 0.00019632312751127756, "clip_ratio/region_mean": 0.00172396549169207, "epoch": 0.09174643730057341, "grad_norm": 0.12084562331438065, "learning_rate": 2e-07, "loss": 0.0233, "step": 983 }, { "clip_ratio/high_max": 0.00187194837781135, "clip_ratio/high_mean": 0.0007703531646257034, "clip_ratio/low_mean": 0.0008461422694381326, "clip_ratio/low_min": 3.258036667830311e-05, "clip_ratio/region_mean": 0.0016164954286068678, "epoch": 0.09183977040057399, "grad_norm": 0.10466741770505905, "learning_rate": 2e-07, "loss": 0.0361, "step": 984 }, { "clip_ratio/high_max": 0.001791259230230935, "clip_ratio/high_mean": 0.0007597864196213777, "clip_ratio/low_mean": 0.0008684928288857918, "clip_ratio/low_min": 8.072165655903518e-05, "clip_ratio/region_mean": 0.0016282792057609186, "epoch": 0.09193310350057458, "grad_norm": 0.10636524856090546, "learning_rate": 2e-07, "loss": 0.0474, "step": 985 }, { "clip_ratio/high_max": 0.002009421863476746, "clip_ratio/high_mean": 0.0008232108502852498, "clip_ratio/low_mean": 0.0008072093278315151, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.001630420156288892, "epoch": 0.09202643660057516, "grad_norm": 0.1134420856833458, "learning_rate": 2e-07, "loss": 0.0155, "step": 986 }, { "clip_ratio/high_max": 0.0018274192625540309, "clip_ratio/high_mean": 0.0007767710067128064, "clip_ratio/low_mean": 0.000820938554170425, "clip_ratio/low_min": 6.44837818981614e-05, "clip_ratio/region_mean": 0.0015977095099515282, "epoch": 0.09211976970057575, "grad_norm": 0.2671923041343689, "learning_rate": 2e-07, "loss": 0.0272, "step": 987 }, { "clip_ratio/high_max": 0.0024588367668911815, "clip_ratio/high_mean": 0.0010189931417698972, "clip_ratio/low_mean": 0.0009727282777021173, "clip_ratio/low_min": 6.512393338198308e-05, "clip_ratio/region_mean": 0.0019917214158340357, "epoch": 0.09221310280057633, "grad_norm": 0.1211543083190918, "learning_rate": 2e-07, "loss": 0.0077, "step": 988 }, { "clip_ratio/high_max": 0.0021852910285815597, "clip_ratio/high_mean": 0.0009293494840676431, "clip_ratio/low_mean": 0.0008635377707832959, "clip_ratio/low_min": 5.683523522748146e-05, "clip_ratio/region_mean": 0.001792887254850939, "epoch": 0.09230643590057691, "grad_norm": 0.1211959719657898, "learning_rate": 2e-07, "loss": 0.0272, "step": 989 }, { "clip_ratio/high_max": 0.001791674760170281, "clip_ratio/high_mean": 0.0007268133949764888, "clip_ratio/low_mean": 0.0008831236846162938, "clip_ratio/low_min": 0.00010805446709127864, "clip_ratio/region_mean": 0.0016099370768642984, "epoch": 0.0923997690005775, "grad_norm": 0.11524740606546402, "learning_rate": 2e-07, "loss": 0.0649, "step": 990 }, { "clip_ratio/high_max": 0.002256779662275221, "clip_ratio/high_mean": 0.0008427663924521767, "clip_ratio/low_mean": 0.0008623797530162847, "clip_ratio/low_min": 5.661984050675528e-05, "clip_ratio/region_mean": 0.0017051461836672388, "epoch": 0.09249310210057808, "grad_norm": 0.10698087513446808, "learning_rate": 2e-07, "loss": 0.0636, "step": 991 }, { "clip_ratio/high_max": 0.0021723976969951764, "clip_ratio/high_mean": 0.0008339583873748779, "clip_ratio/low_mean": 0.000844788235554006, "clip_ratio/low_min": 8.170138607965782e-05, "clip_ratio/region_mean": 0.0016787466374807991, "epoch": 0.09258643520057866, "grad_norm": 0.11497218906879425, "learning_rate": 2e-07, "loss": 0.0198, "step": 992 }, { "clip_ratio/high_max": 0.0023466148413717747, "clip_ratio/high_mean": 0.0009220513402397046, "clip_ratio/low_mean": 0.0009673230961197987, "clip_ratio/low_min": 0.00013091791879560333, "clip_ratio/region_mean": 0.0018893744854722172, "epoch": 0.09267976830057925, "grad_norm": 0.1168917715549469, "learning_rate": 2e-07, "loss": 0.0556, "step": 993 }, { "clip_ratio/high_max": 0.002069155641947873, "clip_ratio/high_mean": 0.0008533294039807515, "clip_ratio/low_mean": 0.0008307002026413102, "clip_ratio/low_min": 4.3277378608763684e-05, "clip_ratio/region_mean": 0.0016840295793372206, "epoch": 0.09277310140057983, "grad_norm": 0.12683254480361938, "learning_rate": 2e-07, "loss": 0.0244, "step": 994 }, { "clip_ratio/high_max": 0.0019231456026318483, "clip_ratio/high_mean": 0.0008257195895566838, "clip_ratio/low_mean": 0.0008599707171015325, "clip_ratio/low_min": 8.868014174368e-05, "clip_ratio/region_mean": 0.0016856903457664885, "epoch": 0.09286643450058042, "grad_norm": 0.11973443627357483, "learning_rate": 2e-07, "loss": 0.0328, "step": 995 }, { "clip_ratio/high_max": 0.0022378537905751728, "clip_ratio/high_mean": 0.0009615243743610336, "clip_ratio/low_mean": 0.0008887166641216027, "clip_ratio/low_min": 0.00016375274390156846, "clip_ratio/region_mean": 0.0018502410748624243, "epoch": 0.092959767600581, "grad_norm": 0.1267317831516266, "learning_rate": 2e-07, "loss": -0.0261, "step": 996 }, { "clip_ratio/high_max": 0.002005895621550735, "clip_ratio/high_mean": 0.0008810547551547643, "clip_ratio/low_mean": 0.0008940059997257777, "clip_ratio/low_min": 4.1510569644742645e-05, "clip_ratio/region_mean": 0.0017750607512425631, "epoch": 0.09305310070058158, "grad_norm": 0.10944966971874237, "learning_rate": 2e-07, "loss": 0.023, "step": 997 }, { "clip_ratio/high_max": 0.002037375954387244, "clip_ratio/high_mean": 0.000861705768329557, "clip_ratio/low_mean": 0.0008990853420982603, "clip_ratio/low_min": 8.570147747377632e-05, "clip_ratio/region_mean": 0.0017607911213417538, "epoch": 0.09314643380058217, "grad_norm": 0.10956969112157822, "learning_rate": 2e-07, "loss": 0.0111, "step": 998 }, { "clip_ratio/high_max": 0.0017950280962395482, "clip_ratio/high_mean": 0.0008521399158780696, "clip_ratio/low_mean": 0.0009003007435239851, "clip_ratio/low_min": 0.00011540521882125176, "clip_ratio/region_mean": 0.001752440646669129, "epoch": 0.09323976690058275, "grad_norm": 0.11849506944417953, "learning_rate": 2e-07, "loss": -0.0055, "step": 999 }, { "clip_ratio/high_max": 0.0021616601807181723, "clip_ratio/high_mean": 0.0008717874879948795, "clip_ratio/low_mean": 0.0008567062905058265, "clip_ratio/low_min": 6.136550928204088e-05, "clip_ratio/region_mean": 0.0017284938221564516, "epoch": 0.09333310000058333, "grad_norm": 0.10934802889823914, "learning_rate": 2e-07, "loss": 0.0398, "step": 1000 }, { "clip_ratio/high_max": 0.0020906590143567882, "clip_ratio/high_mean": 0.0008639007155579748, "clip_ratio/low_mean": 0.0009225610137946205, "clip_ratio/low_min": 9.850160313362721e-05, "clip_ratio/region_mean": 0.0017864617657323834, "epoch": 0.09342643310058392, "grad_norm": 0.11452668160200119, "learning_rate": 2e-07, "loss": 0.0425, "step": 1001 }, { "clip_ratio/high_max": 0.002146396283933427, "clip_ratio/high_mean": 0.0008341445773112355, "clip_ratio/low_mean": 0.0009327636234957026, "clip_ratio/low_min": 4.049407743877964e-05, "clip_ratio/region_mean": 0.0017669081862550229, "epoch": 0.0935197662005845, "grad_norm": 0.11556244641542435, "learning_rate": 2e-07, "loss": -0.0012, "step": 1002 }, { "clip_ratio/high_max": 0.0020002389246656094, "clip_ratio/high_mean": 0.0008471804849250475, "clip_ratio/low_mean": 0.0008568522680434398, "clip_ratio/low_min": 6.098800713516539e-05, "clip_ratio/region_mean": 0.0017040327365975827, "epoch": 0.09361309930058508, "grad_norm": 0.11908892542123795, "learning_rate": 2e-07, "loss": 0.0207, "step": 1003 }, { "clip_ratio/high_max": 0.002064168147626333, "clip_ratio/high_mean": 0.0008712071639820351, "clip_ratio/low_mean": 0.0009583357405062998, "clip_ratio/low_min": 7.76968181526172e-05, "clip_ratio/region_mean": 0.0018295429181307554, "epoch": 0.09370643240058567, "grad_norm": 0.13336260616779327, "learning_rate": 2e-07, "loss": 0.0522, "step": 1004 }, { "clip_ratio/high_max": 0.0020985850715078413, "clip_ratio/high_mean": 0.0009526226567686535, "clip_ratio/low_mean": 0.0007868906177463941, "clip_ratio/low_min": 6.733665759384166e-05, "clip_ratio/region_mean": 0.0017395133036188781, "epoch": 0.09379976550058625, "grad_norm": 0.1192016676068306, "learning_rate": 2e-07, "loss": -0.0117, "step": 1005 }, { "clip_ratio/high_max": 0.0019675765215652063, "clip_ratio/high_mean": 0.0007772126773488708, "clip_ratio/low_mean": 0.0007840984944778029, "clip_ratio/low_min": 6.602033681701869e-05, "clip_ratio/region_mean": 0.001561311128170928, "epoch": 0.09389309860058684, "grad_norm": 0.11258529126644135, "learning_rate": 2e-07, "loss": 0.0123, "step": 1006 }, { "clip_ratio/high_max": 0.0019282072134956252, "clip_ratio/high_mean": 0.0008211592539737467, "clip_ratio/low_mean": 0.0008041220316954423, "clip_ratio/low_min": 4.0883094698074274e-05, "clip_ratio/region_mean": 0.0016252812783932313, "epoch": 0.09398643170058742, "grad_norm": 0.10717396438121796, "learning_rate": 2e-07, "loss": -0.0275, "step": 1007 }, { "clip_ratio/high_max": 0.001854359477874823, "clip_ratio/high_mean": 0.0007320370732486481, "clip_ratio/low_mean": 0.0008720583646208979, "clip_ratio/low_min": 6.503721124317963e-05, "clip_ratio/region_mean": 0.001604095428774599, "epoch": 0.094079764800588, "grad_norm": 0.11644408106803894, "learning_rate": 2e-07, "loss": 0.029, "step": 1008 }, { "clip_ratio/high_max": 0.0021990323293721303, "clip_ratio/high_mean": 0.0008968757192633348, "clip_ratio/low_mean": 0.0008929435225581983, "clip_ratio/low_min": 4.568906570057152e-05, "clip_ratio/region_mean": 0.0017898192454595119, "epoch": 0.09417309790058859, "grad_norm": 0.13738375902175903, "learning_rate": 2e-07, "loss": 0.0306, "step": 1009 }, { "clip_ratio/high_max": 0.0024352449836442247, "clip_ratio/high_mean": 0.0009713883118820377, "clip_ratio/low_mean": 0.0009145517869910691, "clip_ratio/low_min": 3.2470941732754e-05, "clip_ratio/region_mean": 0.0018859401534427889, "epoch": 0.09426643100058917, "grad_norm": 0.11485923826694489, "learning_rate": 2e-07, "loss": 0.0033, "step": 1010 }, { "clip_ratio/high_max": 0.002140145792509429, "clip_ratio/high_mean": 0.0008622380992164835, "clip_ratio/low_mean": 0.0010366331534896744, "clip_ratio/low_min": 0.0001207550030812854, "clip_ratio/region_mean": 0.0018988712727150414, "epoch": 0.09435976410058974, "grad_norm": 0.12227575480937958, "learning_rate": 2e-07, "loss": 0.0347, "step": 1011 }, { "clip_ratio/high_max": 0.0020840392826357856, "clip_ratio/high_mean": 0.000865648384205997, "clip_ratio/low_mean": 0.0008360022820852464, "clip_ratio/low_min": 0.00012096665886929259, "clip_ratio/region_mean": 0.0017016506608342752, "epoch": 0.09445309720059034, "grad_norm": 0.12027329206466675, "learning_rate": 2e-07, "loss": 0.0107, "step": 1012 }, { "clip_ratio/high_max": 0.0019310668649268337, "clip_ratio/high_mean": 0.000824711452878546, "clip_ratio/low_mean": 0.0008870713281794451, "clip_ratio/low_min": 0.00013021745689911768, "clip_ratio/region_mean": 0.0017117827956099063, "epoch": 0.09454643030059091, "grad_norm": 0.12233252823352814, "learning_rate": 2e-07, "loss": 0.048, "step": 1013 }, { "clip_ratio/high_max": 0.001979655760806054, "clip_ratio/high_mean": 0.0009054432375705801, "clip_ratio/low_mean": 0.0008655234923935495, "clip_ratio/low_min": 1.725565925880801e-05, "clip_ratio/region_mean": 0.0017709667372400872, "epoch": 0.09463976340059149, "grad_norm": 0.11256289482116699, "learning_rate": 2e-07, "loss": 0.005, "step": 1014 }, { "clip_ratio/high_max": 0.002051736955763772, "clip_ratio/high_mean": 0.0007575205891043879, "clip_ratio/low_mean": 0.001004393341645482, "clip_ratio/low_min": 8.749662902118871e-05, "clip_ratio/region_mean": 0.0017619139325688593, "epoch": 0.09473309650059208, "grad_norm": 0.132577583193779, "learning_rate": 2e-07, "loss": 0.0481, "step": 1015 }, { "clip_ratio/high_max": 0.001996080951357726, "clip_ratio/high_mean": 0.0008625501650385559, "clip_ratio/low_mean": 0.0009059396234079031, "clip_ratio/low_min": 0.00014188603290676838, "clip_ratio/region_mean": 0.0017684898048173636, "epoch": 0.09482642960059266, "grad_norm": 0.12402306497097015, "learning_rate": 2e-07, "loss": 0.0386, "step": 1016 }, { "clip_ratio/high_max": 0.0019890289440809283, "clip_ratio/high_mean": 0.000892858712177258, "clip_ratio/low_mean": 0.0007998637229320593, "clip_ratio/low_min": 2.5860126697807573e-05, "clip_ratio/region_mean": 0.001692722420557402, "epoch": 0.09491976270059325, "grad_norm": 0.11991361528635025, "learning_rate": 2e-07, "loss": 0.0068, "step": 1017 }, { "clip_ratio/high_max": 0.0020844308091909625, "clip_ratio/high_mean": 0.0008315276281791739, "clip_ratio/low_mean": 0.0009131267706834478, "clip_ratio/low_min": 0.00010666692833183333, "clip_ratio/region_mean": 0.0017446544370613992, "epoch": 0.09501309580059383, "grad_norm": 0.11610961705446243, "learning_rate": 2e-07, "loss": 0.0206, "step": 1018 }, { "clip_ratio/high_max": 0.00225478078937158, "clip_ratio/high_mean": 0.0008971553525043419, "clip_ratio/low_mean": 0.0009153171304205898, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0018124724811059423, "epoch": 0.09510642890059441, "grad_norm": 0.12555032968521118, "learning_rate": 2e-07, "loss": 0.0287, "step": 1019 }, { "clip_ratio/high_max": 0.002217986562754959, "clip_ratio/high_mean": 0.0008098206453723833, "clip_ratio/low_mean": 0.0008464433522021864, "clip_ratio/low_min": 0.0001041021660057595, "clip_ratio/region_mean": 0.0016562639284529723, "epoch": 0.095199762000595, "grad_norm": 0.11540576815605164, "learning_rate": 2e-07, "loss": 0.0015, "step": 1020 }, { "clip_ratio/high_max": 0.0024876170718926005, "clip_ratio/high_mean": 0.000947672324400628, "clip_ratio/low_mean": 0.0010449639084981754, "clip_ratio/low_min": 5.6488809605070855e-05, "clip_ratio/region_mean": 0.001992636258364655, "epoch": 0.09529309510059558, "grad_norm": 0.12486743927001953, "learning_rate": 2e-07, "loss": 0.0047, "step": 1021 }, { "clip_ratio/high_max": 0.0018987356270372402, "clip_ratio/high_mean": 0.0007894445116107818, "clip_ratio/low_mean": 0.00100619234945043, "clip_ratio/low_min": 0.00013737818426307058, "clip_ratio/region_mean": 0.001795636853785254, "epoch": 0.09538642820059616, "grad_norm": 0.11219488829374313, "learning_rate": 2e-07, "loss": 0.0023, "step": 1022 }, { "clip_ratio/high_max": 0.0022074135413276963, "clip_ratio/high_mean": 0.0008982023991848109, "clip_ratio/low_mean": 0.0008508882874593837, "clip_ratio/low_min": 0.00014223130710888654, "clip_ratio/region_mean": 0.001749090697558131, "epoch": 0.09547976130059675, "grad_norm": 0.11575962603092194, "learning_rate": 2e-07, "loss": 0.0154, "step": 1023 }, { "clip_ratio/high_max": 0.0018066917546093464, "clip_ratio/high_mean": 0.0007693958177696913, "clip_ratio/low_mean": 0.0010509676940273494, "clip_ratio/low_min": 0.00017019441838783678, "clip_ratio/region_mean": 0.001820363504521083, "epoch": 0.09557309440059733, "grad_norm": 0.11805713176727295, "learning_rate": 2e-07, "loss": 0.0601, "step": 1024 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.015398297991071397, "completions/max_length": 4096.0, "completions/max_terminated_length": 4082.0, "completions/mean_length": 619.4093627929688, "completions/mean_terminated_length": 565.0384521484375, "completions/min_length": 4.0, "completions/min_terminated_length": 4.0, "epoch": 0.09566642750059791, "grad_norm": 0.10612509399652481, "learning_rate": 2e-07, "loss": 0.0404, "num_tokens": 735075230.0, "reward": 0.568551242351532, "reward_std": 0.20006971061229706, "rewards/simpleverify_reward/mean": 0.5685511827468872, "rewards/simpleverify_reward/std": 0.49528056383132935, "step": 1025 }, { "clip_ratio/high_max": 0.00200909937848337, "clip_ratio/high_mean": 0.0008687268345966004, "clip_ratio/low_mean": 0.0005489155187206052, "clip_ratio/low_min": 4.169086105321185e-05, "clip_ratio/region_mean": 0.0014176423392200377, "epoch": 0.0957597606005985, "grad_norm": 0.11542902141809464, "learning_rate": 2e-07, "loss": 0.0303, "step": 1026 }, { "clip_ratio/high_max": 0.00221441725443583, "clip_ratio/high_mean": 0.0008715675467101391, "clip_ratio/low_mean": 0.0005372579744289396, "clip_ratio/low_min": 2.2664639800495934e-05, "clip_ratio/region_mean": 0.0014088255556998774, "epoch": 0.09585309370059908, "grad_norm": 0.12312428653240204, "learning_rate": 2e-07, "loss": 0.0209, "step": 1027 }, { "clip_ratio/high_max": 0.0019153052162437234, "clip_ratio/high_mean": 0.0009056340240931604, "clip_ratio/low_mean": 0.0005892724821023876, "clip_ratio/low_min": 9.31029353523627e-06, "clip_ratio/region_mean": 0.0014949065480323043, "epoch": 0.09594642680059967, "grad_norm": 0.11696968227624893, "learning_rate": 2e-07, "loss": 0.019, "step": 1028 }, { "clip_ratio/high_max": 0.0020166482026979793, "clip_ratio/high_mean": 0.0007799352551955963, "clip_ratio/low_mean": 0.0006383797335729469, "clip_ratio/low_min": 7.189817915786989e-05, "clip_ratio/region_mean": 0.0014183149651216809, "epoch": 0.09603975990060025, "grad_norm": 0.10812655836343765, "learning_rate": 2e-07, "loss": 0.0827, "step": 1029 }, { "clip_ratio/high_max": 0.0018582608354336116, "clip_ratio/high_mean": 0.0008466122862955672, "clip_ratio/low_mean": 0.0005671514718414983, "clip_ratio/low_min": 4.651596009352943e-05, "clip_ratio/region_mean": 0.001413763762684539, "epoch": 0.09613309300060083, "grad_norm": 0.12490763515233994, "learning_rate": 2e-07, "loss": -0.0094, "step": 1030 }, { "clip_ratio/high_max": 0.0018109347656718455, "clip_ratio/high_mean": 0.0006978304190852214, "clip_ratio/low_mean": 0.000630987026852381, "clip_ratio/low_min": 1.7016063793562353e-05, "clip_ratio/region_mean": 0.0013288174704939593, "epoch": 0.09622642610060142, "grad_norm": 0.1300068348646164, "learning_rate": 2e-07, "loss": 0.0482, "step": 1031 }, { "clip_ratio/high_max": 0.002211858969531022, "clip_ratio/high_mean": 0.0008658963306515943, "clip_ratio/low_mean": 0.0005230009046499617, "clip_ratio/low_min": 3.1061657864484005e-05, "clip_ratio/region_mean": 0.0013888972207496408, "epoch": 0.096319759200602, "grad_norm": 0.11759167909622192, "learning_rate": 2e-07, "loss": 0.0099, "step": 1032 }, { "clip_ratio/high_max": 0.0020253094189683907, "clip_ratio/high_mean": 0.0007893627589510288, "clip_ratio/low_mean": 0.000528521579781227, "clip_ratio/low_min": 3.862824996758718e-05, "clip_ratio/region_mean": 0.0013178843873902224, "epoch": 0.09641309230060258, "grad_norm": 0.1104261577129364, "learning_rate": 2e-07, "loss": 0.0263, "step": 1033 }, { "clip_ratio/high_max": 0.002103252638335107, "clip_ratio/high_mean": 0.0008204953510357882, "clip_ratio/low_mean": 0.0005232537387200864, "clip_ratio/low_min": 1.569169035064988e-05, "clip_ratio/region_mean": 0.0013437490997603163, "epoch": 0.09650642540060317, "grad_norm": 0.10767585039138794, "learning_rate": 2e-07, "loss": 0.0191, "step": 1034 }, { "clip_ratio/high_max": 0.0021298135798133444, "clip_ratio/high_mean": 0.0008127565497488831, "clip_ratio/low_mean": 0.0006266660693654558, "clip_ratio/low_min": 1.5798786989762448e-05, "clip_ratio/region_mean": 0.0014394226018339396, "epoch": 0.09659975850060375, "grad_norm": 0.12416986376047134, "learning_rate": 2e-07, "loss": 0.0448, "step": 1035 }, { "clip_ratio/high_max": 0.0018184005457442254, "clip_ratio/high_mean": 0.0007904096182755893, "clip_ratio/low_mean": 0.0005866300980414962, "clip_ratio/low_min": 2.15846748687909e-05, "clip_ratio/region_mean": 0.0013770396762993187, "epoch": 0.09669309160060433, "grad_norm": 0.11928658932447433, "learning_rate": 2e-07, "loss": 0.0363, "step": 1036 }, { "clip_ratio/high_max": 0.002093279756081756, "clip_ratio/high_mean": 0.0007995607047632802, "clip_ratio/low_mean": 0.0005888536543352529, "clip_ratio/low_min": 4.548974811768858e-05, "clip_ratio/region_mean": 0.0013884143590985332, "epoch": 0.09678642470060492, "grad_norm": 0.1095636710524559, "learning_rate": 2e-07, "loss": 0.0338, "step": 1037 }, { "clip_ratio/high_max": 0.0017970094522752333, "clip_ratio/high_mean": 0.0006786877420381643, "clip_ratio/low_mean": 0.0005995274714223342, "clip_ratio/low_min": 1.1050212378904689e-05, "clip_ratio/region_mean": 0.0012782152007275727, "epoch": 0.0968797578006055, "grad_norm": 0.12018336355686188, "learning_rate": 2e-07, "loss": 0.0144, "step": 1038 }, { "clip_ratio/high_max": 0.0018620755799929611, "clip_ratio/high_mean": 0.0007562834798591211, "clip_ratio/low_mean": 0.0005498287246155087, "clip_ratio/low_min": 4.623696986527648e-05, "clip_ratio/region_mean": 0.0013061121935606934, "epoch": 0.09697309090060609, "grad_norm": 0.11076406389474869, "learning_rate": 2e-07, "loss": 0.013, "step": 1039 }, { "clip_ratio/high_max": 0.001813300754292868, "clip_ratio/high_mean": 0.0006771729895262979, "clip_ratio/low_mean": 0.0006753592906534323, "clip_ratio/low_min": 6.330964833978214e-05, "clip_ratio/region_mean": 0.0013525322538043838, "epoch": 0.09706642400060667, "grad_norm": 0.10745476931333542, "learning_rate": 2e-07, "loss": 0.0383, "step": 1040 }, { "clip_ratio/high_max": 0.0018643237490323372, "clip_ratio/high_mean": 0.0008069909235928208, "clip_ratio/low_mean": 0.0005738788713642862, "clip_ratio/low_min": 6.147780550236348e-05, "clip_ratio/region_mean": 0.0013808698022330645, "epoch": 0.09715975710060724, "grad_norm": 0.11222362518310547, "learning_rate": 2e-07, "loss": 0.0208, "step": 1041 }, { "clip_ratio/high_max": 0.002037535967247095, "clip_ratio/high_mean": 0.0008209636889660032, "clip_ratio/low_mean": 0.0007089836344675859, "clip_ratio/low_min": 4.360807088232832e-05, "clip_ratio/region_mean": 0.0015299473197956104, "epoch": 0.09725309020060784, "grad_norm": 0.13237662613391876, "learning_rate": 2e-07, "loss": 0.0473, "step": 1042 }, { "clip_ratio/high_max": 0.0019452841588645242, "clip_ratio/high_mean": 0.0008072995260590687, "clip_ratio/low_mean": 0.0005725833470933139, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0013798828513245098, "epoch": 0.09734642330060841, "grad_norm": 0.11559829115867615, "learning_rate": 2e-07, "loss": -0.0031, "step": 1043 }, { "clip_ratio/high_max": 0.0020842577650910243, "clip_ratio/high_mean": 0.0009226381371263415, "clip_ratio/low_mean": 0.0006014705904817674, "clip_ratio/low_min": 5.5758075177436695e-05, "clip_ratio/region_mean": 0.0015241086803143844, "epoch": 0.09743975640060899, "grad_norm": 0.11245186626911163, "learning_rate": 2e-07, "loss": 0.0169, "step": 1044 }, { "clip_ratio/high_max": 0.001956108237209264, "clip_ratio/high_mean": 0.000859139756357763, "clip_ratio/low_mean": 0.000626116694547818, "clip_ratio/low_min": 5.559574219660135e-05, "clip_ratio/region_mean": 0.0014852564490865916, "epoch": 0.09753308950060958, "grad_norm": 0.11967827379703522, "learning_rate": 2e-07, "loss": 0.0238, "step": 1045 }, { "clip_ratio/high_max": 0.0019159843668603571, "clip_ratio/high_mean": 0.0007228265940284473, "clip_ratio/low_mean": 0.00066216304730915, "clip_ratio/low_min": 4.909236031380715e-05, "clip_ratio/region_mean": 0.0013849896495230496, "epoch": 0.09762642260061016, "grad_norm": 0.11571131646633148, "learning_rate": 2e-07, "loss": 0.0173, "step": 1046 }, { "clip_ratio/high_max": 0.002013220902881585, "clip_ratio/high_mean": 0.0008193629182642326, "clip_ratio/low_mean": 0.0007448258984368294, "clip_ratio/low_min": 4.7649728003307246e-05, "clip_ratio/region_mean": 0.001564188780321274, "epoch": 0.09771975570061076, "grad_norm": 0.11303745955228806, "learning_rate": 2e-07, "loss": 0.0255, "step": 1047 }, { "clip_ratio/high_max": 0.0016550441905565094, "clip_ratio/high_mean": 0.0007180012653407175, "clip_ratio/low_mean": 0.0007260254005814204, "clip_ratio/low_min": 0.0001159520315923146, "clip_ratio/region_mean": 0.0014440266859310213, "epoch": 0.09781308880061133, "grad_norm": 0.11802028119564056, "learning_rate": 2e-07, "loss": 0.0465, "step": 1048 }, { "clip_ratio/high_max": 0.0021046784859208856, "clip_ratio/high_mean": 0.0008069247014645953, "clip_ratio/low_mean": 0.0006705772957502631, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0014775020099477842, "epoch": 0.09790642190061191, "grad_norm": 0.1254933923482895, "learning_rate": 2e-07, "loss": 0.0164, "step": 1049 }, { "clip_ratio/high_max": 0.001635778786294395, "clip_ratio/high_mean": 0.0006478861969299032, "clip_ratio/low_mean": 0.0008029379077925114, "clip_ratio/low_min": 6.546891199832316e-05, "clip_ratio/region_mean": 0.0014508241147268564, "epoch": 0.0979997550006125, "grad_norm": 0.11035629361867905, "learning_rate": 2e-07, "loss": 0.09, "step": 1050 }, { "clip_ratio/high_max": 0.0019566735754779074, "clip_ratio/high_mean": 0.0007161116300267167, "clip_ratio/low_mean": 0.0007278470675373683, "clip_ratio/low_min": 6.76014833516092e-05, "clip_ratio/region_mean": 0.0014439587175729685, "epoch": 0.09809308810061308, "grad_norm": 0.12333068996667862, "learning_rate": 2e-07, "loss": 0.0791, "step": 1051 }, { "clip_ratio/high_max": 0.0020421241970325354, "clip_ratio/high_mean": 0.0008152516020345502, "clip_ratio/low_mean": 0.0007355098532570992, "clip_ratio/low_min": 0.00010034862225438701, "clip_ratio/region_mean": 0.00155076142254984, "epoch": 0.09818642120061366, "grad_norm": 0.12062771618366241, "learning_rate": 2e-07, "loss": 0.0326, "step": 1052 }, { "clip_ratio/high_max": 0.0021323332039173692, "clip_ratio/high_mean": 0.0009559003010508604, "clip_ratio/low_mean": 0.0007342600292759016, "clip_ratio/low_min": 4.302698107494507e-05, "clip_ratio/region_mean": 0.0016901603157748468, "epoch": 0.09827975430061425, "grad_norm": 0.11315330862998962, "learning_rate": 2e-07, "loss": 0.0065, "step": 1053 }, { "clip_ratio/high_max": 0.002306951500941068, "clip_ratio/high_mean": 0.0009268999874620931, "clip_ratio/low_mean": 0.0006443302336265333, "clip_ratio/low_min": 4.9266970563621726e-05, "clip_ratio/region_mean": 0.001571230219269637, "epoch": 0.09837308740061483, "grad_norm": 0.11879207193851471, "learning_rate": 2e-07, "loss": -0.0087, "step": 1054 }, { "clip_ratio/high_max": 0.0019880685649695806, "clip_ratio/high_mean": 0.0007960067523526959, "clip_ratio/low_mean": 0.000778449065364839, "clip_ratio/low_min": 7.420547808578704e-05, "clip_ratio/region_mean": 0.001574455829540966, "epoch": 0.09846642050061541, "grad_norm": 0.1177000030875206, "learning_rate": 2e-07, "loss": 0.0372, "step": 1055 }, { "clip_ratio/high_max": 0.0020156319260422606, "clip_ratio/high_mean": 0.0008593644051870797, "clip_ratio/low_mean": 0.0007748235839244444, "clip_ratio/low_min": 0.00012247606628079666, "clip_ratio/region_mean": 0.0016341879963874817, "epoch": 0.098559753600616, "grad_norm": 0.11429823189973831, "learning_rate": 2e-07, "loss": 0.0426, "step": 1056 }, { "clip_ratio/high_max": 0.0024814455173327588, "clip_ratio/high_mean": 0.0009049328909895848, "clip_ratio/low_mean": 0.0007363257927863742, "clip_ratio/low_min": 2.036559544649208e-05, "clip_ratio/region_mean": 0.0016412586883234326, "epoch": 0.09865308670061658, "grad_norm": 0.11523015797138214, "learning_rate": 2e-07, "loss": 0.0038, "step": 1057 }, { "clip_ratio/high_max": 0.0021379570389399305, "clip_ratio/high_mean": 0.0008549280082661426, "clip_ratio/low_mean": 0.0007272395978361601, "clip_ratio/low_min": 4.373304000182543e-05, "clip_ratio/region_mean": 0.0015821675915503874, "epoch": 0.09874641980061717, "grad_norm": 0.11110664159059525, "learning_rate": 2e-07, "loss": 0.0214, "step": 1058 }, { "clip_ratio/high_max": 0.002366235727095045, "clip_ratio/high_mean": 0.0008457103140244726, "clip_ratio/low_mean": 0.0007364335797319654, "clip_ratio/low_min": 2.8895968171127606e-05, "clip_ratio/region_mean": 0.0015821438719285652, "epoch": 0.09883975290061775, "grad_norm": 0.11646465212106705, "learning_rate": 2e-07, "loss": 0.0268, "step": 1059 }, { "clip_ratio/high_max": 0.002042945681751007, "clip_ratio/high_mean": 0.0008221959596994566, "clip_ratio/low_mean": 0.0008916161368688336, "clip_ratio/low_min": 0.00016732110634620767, "clip_ratio/region_mean": 0.001713812100206269, "epoch": 0.09893308600061833, "grad_norm": 0.12157513946294785, "learning_rate": 2e-07, "loss": 0.037, "step": 1060 }, { "clip_ratio/high_max": 0.0018318782131245825, "clip_ratio/high_mean": 0.0007447359967045486, "clip_ratio/low_mean": 0.0007199955321084417, "clip_ratio/low_min": 4.930352224619128e-05, "clip_ratio/region_mean": 0.0014647315729234833, "epoch": 0.09902641910061892, "grad_norm": 0.10849598050117493, "learning_rate": 2e-07, "loss": 0.007, "step": 1061 }, { "clip_ratio/high_max": 0.0016698007566446904, "clip_ratio/high_mean": 0.0007013490230747266, "clip_ratio/low_mean": 0.0008168893473339267, "clip_ratio/low_min": 4.719498519989429e-05, "clip_ratio/region_mean": 0.001518238386779558, "epoch": 0.0991197522006195, "grad_norm": 0.10390421003103256, "learning_rate": 2e-07, "loss": 0.0349, "step": 1062 }, { "clip_ratio/high_max": 0.0018767394176393282, "clip_ratio/high_mean": 0.0008249612037616316, "clip_ratio/low_mean": 0.0007666630517633166, "clip_ratio/low_min": 8.77899510669522e-05, "clip_ratio/region_mean": 0.001591624204593245, "epoch": 0.09921308530062008, "grad_norm": 0.12781000137329102, "learning_rate": 2e-07, "loss": 0.0361, "step": 1063 }, { "clip_ratio/high_max": 0.0017819565546233207, "clip_ratio/high_mean": 0.0008160048655554419, "clip_ratio/low_mean": 0.000698604006174719, "clip_ratio/low_min": 1.4331575584947132e-05, "clip_ratio/region_mean": 0.0015146088480832987, "epoch": 0.09930641840062067, "grad_norm": 0.12184551358222961, "learning_rate": 2e-07, "loss": 0.0187, "step": 1064 }, { "clip_ratio/high_max": 0.001829377950343769, "clip_ratio/high_mean": 0.0007921309534140164, "clip_ratio/low_mean": 0.0007184045061876532, "clip_ratio/low_min": 7.475746497220825e-05, "clip_ratio/region_mean": 0.0015105354395927861, "epoch": 0.09939975150062125, "grad_norm": 0.12417765706777573, "learning_rate": 2e-07, "loss": 0.0272, "step": 1065 }, { "clip_ratio/high_max": 0.0018722661479841918, "clip_ratio/high_mean": 0.0007263788229465717, "clip_ratio/low_mean": 0.0006154481943667633, "clip_ratio/low_min": 4.9115525143861305e-05, "clip_ratio/region_mean": 0.0013418270136753563, "epoch": 0.09949308460062183, "grad_norm": 0.10719404369592667, "learning_rate": 2e-07, "loss": 0.0046, "step": 1066 }, { "clip_ratio/high_max": 0.001996098639210686, "clip_ratio/high_mean": 0.0008819526356091956, "clip_ratio/low_mean": 0.000784837060564314, "clip_ratio/low_min": 1.589117709954735e-05, "clip_ratio/region_mean": 0.0016667896634317003, "epoch": 0.09958641770062242, "grad_norm": 0.1103110983967781, "learning_rate": 2e-07, "loss": 0.0035, "step": 1067 }, { "clip_ratio/high_max": 0.0018349019956076518, "clip_ratio/high_mean": 0.0007514952612837078, "clip_ratio/low_mean": 0.0008402582607232034, "clip_ratio/low_min": 0.00010443256360304076, "clip_ratio/region_mean": 0.001591753498360049, "epoch": 0.099679750800623, "grad_norm": 0.11763601750135422, "learning_rate": 2e-07, "loss": 0.0298, "step": 1068 }, { "clip_ratio/high_max": 0.0018825083679985255, "clip_ratio/high_mean": 0.0006604894442716613, "clip_ratio/low_mean": 0.0007511981639254373, "clip_ratio/low_min": 3.6491422179096844e-05, "clip_ratio/region_mean": 0.0014116876227490138, "epoch": 0.09977308390062359, "grad_norm": 0.11118053644895554, "learning_rate": 2e-07, "loss": 0.0262, "step": 1069 }, { "clip_ratio/high_max": 0.001727916627714876, "clip_ratio/high_mean": 0.0007680283069930738, "clip_ratio/low_mean": 0.0009504074441792909, "clip_ratio/low_min": 0.00016193270948861027, "clip_ratio/region_mean": 0.001718435756629333, "epoch": 0.09986641700062417, "grad_norm": 0.12723352015018463, "learning_rate": 2e-07, "loss": 0.0973, "step": 1070 }, { "clip_ratio/high_max": 0.0022111690195742995, "clip_ratio/high_mean": 0.0008360342490050243, "clip_ratio/low_mean": 0.0008783506782492623, "clip_ratio/low_min": 9.841723749559605e-05, "clip_ratio/region_mean": 0.0017143849545391276, "epoch": 0.09995975010062474, "grad_norm": 0.1087203323841095, "learning_rate": 2e-07, "loss": 0.0328, "step": 1071 }, { "clip_ratio/high_max": 0.0024032819201238453, "clip_ratio/high_mean": 0.0009821057792578358, "clip_ratio/low_mean": 0.0008250527607742697, "clip_ratio/low_min": 8.333040113939205e-05, "clip_ratio/region_mean": 0.0018071585436700843, "epoch": 0.10005308320062534, "grad_norm": 0.11916292458772659, "learning_rate": 2e-07, "loss": -0.0041, "step": 1072 }, { "clip_ratio/high_max": 0.0019411818684602622, "clip_ratio/high_mean": 0.0008123722800519317, "clip_ratio/low_mean": 0.0007953064177854685, "clip_ratio/low_min": 0.00010040878441941459, "clip_ratio/region_mean": 0.0016076786996563897, "epoch": 0.10014641630062592, "grad_norm": 0.12069952487945557, "learning_rate": 2e-07, "loss": 0.0245, "step": 1073 }, { "clip_ratio/high_max": 0.0018460884130035993, "clip_ratio/high_mean": 0.0007424151808663737, "clip_ratio/low_mean": 0.000792841543443501, "clip_ratio/low_min": 5.472223165270407e-05, "clip_ratio/region_mean": 0.0015352567133959383, "epoch": 0.1002397494006265, "grad_norm": 0.1334504783153534, "learning_rate": 2e-07, "loss": 0.0304, "step": 1074 }, { "clip_ratio/high_max": 0.002016742786508985, "clip_ratio/high_mean": 0.0008146014770318288, "clip_ratio/low_mean": 0.0008282469361802214, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.00164284845959628, "epoch": 0.10033308250062709, "grad_norm": 0.11254438757896423, "learning_rate": 2e-07, "loss": 0.0173, "step": 1075 }, { "clip_ratio/high_max": 0.001995411850657547, "clip_ratio/high_mean": 0.0008796934052952565, "clip_ratio/low_mean": 0.000744623752325424, "clip_ratio/low_min": 6.59671450193855e-05, "clip_ratio/region_mean": 0.0016243171448877547, "epoch": 0.10042641560062766, "grad_norm": 0.10862419009208679, "learning_rate": 2e-07, "loss": 0.0171, "step": 1076 }, { "clip_ratio/high_max": 0.00225502470129868, "clip_ratio/high_mean": 0.0009365297482872847, "clip_ratio/low_mean": 0.0007325530432353844, "clip_ratio/low_min": 6.544880216097226e-05, "clip_ratio/region_mean": 0.0016690827833372168, "epoch": 0.10051974870062824, "grad_norm": 0.11361183971166611, "learning_rate": 2e-07, "loss": 0.0206, "step": 1077 }, { "clip_ratio/high_max": 0.0020471842217375524, "clip_ratio/high_mean": 0.0008454867893306073, "clip_ratio/low_mean": 0.0009161932430288289, "clip_ratio/low_min": 9.062401204573689e-05, "clip_ratio/region_mean": 0.0017616800250834785, "epoch": 0.10061308180062883, "grad_norm": 0.11313845217227936, "learning_rate": 2e-07, "loss": 0.0468, "step": 1078 }, { "clip_ratio/high_max": 0.0018490948459657375, "clip_ratio/high_mean": 0.0008132376005960396, "clip_ratio/low_mean": 0.0007983236755535472, "clip_ratio/low_min": 6.570025470864493e-05, "clip_ratio/region_mean": 0.0016115612597786821, "epoch": 0.10070641490062941, "grad_norm": 0.12399954348802567, "learning_rate": 2e-07, "loss": 0.0442, "step": 1079 }, { "clip_ratio/high_max": 0.0019192113504686859, "clip_ratio/high_mean": 0.0007545054832007736, "clip_ratio/low_mean": 0.0008420489466516301, "clip_ratio/low_min": 3.072040362894768e-05, "clip_ratio/region_mean": 0.001596554444404319, "epoch": 0.10079974800063, "grad_norm": 0.11172471940517426, "learning_rate": 2e-07, "loss": 0.0593, "step": 1080 }, { "clip_ratio/high_max": 0.0019154816181981005, "clip_ratio/high_mean": 0.0007603476024087286, "clip_ratio/low_mean": 0.0007633390086994041, "clip_ratio/low_min": 4.91468144900864e-05, "clip_ratio/region_mean": 0.0015236866020131856, "epoch": 0.10089308110063058, "grad_norm": 0.10909705609083176, "learning_rate": 2e-07, "loss": 0.0132, "step": 1081 }, { "clip_ratio/high_max": 0.0023609171621501446, "clip_ratio/high_mean": 0.000854767655255273, "clip_ratio/low_mean": 0.0008780776843195781, "clip_ratio/low_min": 0.00010604064482322428, "clip_ratio/region_mean": 0.0017328453250229359, "epoch": 0.10098641420063116, "grad_norm": 0.11832371354103088, "learning_rate": 2e-07, "loss": 0.0231, "step": 1082 }, { "clip_ratio/high_max": 0.0022351345178321935, "clip_ratio/high_mean": 0.0009177069478027988, "clip_ratio/low_mean": 0.0008693587587913498, "clip_ratio/low_min": 4.0491150684829336e-05, "clip_ratio/region_mean": 0.0017870657029561698, "epoch": 0.10107974730063175, "grad_norm": 0.11290975660085678, "learning_rate": 2e-07, "loss": 0.003, "step": 1083 }, { "clip_ratio/high_max": 0.0017265301903535146, "clip_ratio/high_mean": 0.0008462908808724023, "clip_ratio/low_mean": 0.0007203924842542619, "clip_ratio/low_min": 6.00441626374959e-05, "clip_ratio/region_mean": 0.0015666833678551484, "epoch": 0.10117308040063233, "grad_norm": 0.12059751898050308, "learning_rate": 2e-07, "loss": -0.0045, "step": 1084 }, { "clip_ratio/high_max": 0.0021807513694511726, "clip_ratio/high_mean": 0.0009053893791133305, "clip_ratio/low_mean": 0.000797509883341263, "clip_ratio/low_min": 6.250067599467002e-05, "clip_ratio/region_mean": 0.001702899236988742, "epoch": 0.10126641350063291, "grad_norm": 0.11631078273057938, "learning_rate": 2e-07, "loss": 0.0047, "step": 1085 }, { "clip_ratio/high_max": 0.002077118817396695, "clip_ratio/high_mean": 0.0008382392843486741, "clip_ratio/low_mean": 0.0007583996539324289, "clip_ratio/low_min": 5.860773217136739e-05, "clip_ratio/region_mean": 0.0015966389364621136, "epoch": 0.1013597466006335, "grad_norm": 0.12410097569227219, "learning_rate": 2e-07, "loss": 0.0029, "step": 1086 }, { "clip_ratio/high_max": 0.0017220151967194397, "clip_ratio/high_mean": 0.000719004645361565, "clip_ratio/low_mean": 0.0008417512872256339, "clip_ratio/low_min": 2.7354638859833358e-05, "clip_ratio/region_mean": 0.001560755932587199, "epoch": 0.10145307970063408, "grad_norm": 0.11336301267147064, "learning_rate": 2e-07, "loss": 0.0627, "step": 1087 }, { "clip_ratio/high_max": 0.002099617544445209, "clip_ratio/high_mean": 0.0009771045952220447, "clip_ratio/low_mean": 0.0009149752095254371, "clip_ratio/low_min": 3.9397866203216836e-05, "clip_ratio/region_mean": 0.0018920798029284924, "epoch": 0.10154641280063466, "grad_norm": 0.11746526509523392, "learning_rate": 2e-07, "loss": 0.0354, "step": 1088 }, { "clip_ratio/high_max": 0.0019658932797028683, "clip_ratio/high_mean": 0.000778603702201508, "clip_ratio/low_mean": 0.0008007173983060056, "clip_ratio/low_min": 4.578670996124856e-05, "clip_ratio/region_mean": 0.0015793211568961851, "epoch": 0.10163974590063525, "grad_norm": 0.11328791826963425, "learning_rate": 2e-07, "loss": 0.0452, "step": 1089 }, { "clip_ratio/high_max": 0.0021752080938313156, "clip_ratio/high_mean": 0.0008506809244863689, "clip_ratio/low_mean": 0.0007326957493205555, "clip_ratio/low_min": 7.076767269609263e-05, "clip_ratio/region_mean": 0.0015833766410651151, "epoch": 0.10173307900063583, "grad_norm": 0.10923239588737488, "learning_rate": 2e-07, "loss": 0.0174, "step": 1090 }, { "clip_ratio/high_max": 0.001614278975466732, "clip_ratio/high_mean": 0.000705878122971626, "clip_ratio/low_mean": 0.0007754426842438988, "clip_ratio/low_min": 3.842758269456681e-05, "clip_ratio/region_mean": 0.001481320785387652, "epoch": 0.10182641210063642, "grad_norm": 0.1076093539595604, "learning_rate": 2e-07, "loss": 0.0266, "step": 1091 }, { "clip_ratio/high_max": 0.002261327921587508, "clip_ratio/high_mean": 0.0008584322258684551, "clip_ratio/low_mean": 0.0007846187509130687, "clip_ratio/low_min": 4.919822640658822e-05, "clip_ratio/region_mean": 0.0016430509713245556, "epoch": 0.101919745200637, "grad_norm": 0.11794722080230713, "learning_rate": 2e-07, "loss": 0.0599, "step": 1092 }, { "clip_ratio/high_max": 0.0021251750622468535, "clip_ratio/high_mean": 0.000815811894426588, "clip_ratio/low_mean": 0.0007784433782944689, "clip_ratio/low_min": 9.144111572823022e-06, "clip_ratio/region_mean": 0.0015942552745400462, "epoch": 0.10201307830063758, "grad_norm": 0.11315100640058517, "learning_rate": 2e-07, "loss": 0.04, "step": 1093 }, { "clip_ratio/high_max": 0.002073282317724079, "clip_ratio/high_mean": 0.0009544330405333312, "clip_ratio/low_mean": 0.0008388463429582771, "clip_ratio/low_min": 0.0001354926971544046, "clip_ratio/region_mean": 0.0017932793307409156, "epoch": 0.10210641140063817, "grad_norm": 0.11916402727365494, "learning_rate": 2e-07, "loss": 0.0256, "step": 1094 }, { "clip_ratio/high_max": 0.002155423746444285, "clip_ratio/high_mean": 0.0007569857325506746, "clip_ratio/low_mean": 0.0009109617858484853, "clip_ratio/low_min": 8.427258853771491e-05, "clip_ratio/region_mean": 0.001667947530222591, "epoch": 0.10219974450063875, "grad_norm": 0.11849229782819748, "learning_rate": 2e-07, "loss": 0.0853, "step": 1095 }, { "clip_ratio/high_max": 0.001994823949644342, "clip_ratio/high_mean": 0.0008184825273929164, "clip_ratio/low_mean": 0.0009306589745392557, "clip_ratio/low_min": 0.00010842217216122663, "clip_ratio/region_mean": 0.0017491415128461085, "epoch": 0.10229307760063933, "grad_norm": 0.12253943085670471, "learning_rate": 2e-07, "loss": 0.0873, "step": 1096 }, { "clip_ratio/high_max": 0.0021545973941101693, "clip_ratio/high_mean": 0.0008954573440860258, "clip_ratio/low_mean": 0.0008735132596484618, "clip_ratio/low_min": 7.369538525381358e-05, "clip_ratio/region_mean": 0.001768970636476297, "epoch": 0.10238641070063992, "grad_norm": 0.11572254449129105, "learning_rate": 2e-07, "loss": -0.0185, "step": 1097 }, { "clip_ratio/high_max": 0.0017969388281926513, "clip_ratio/high_mean": 0.0007034912741801236, "clip_ratio/low_mean": 0.00084436800898402, "clip_ratio/low_min": 2.633242002048064e-05, "clip_ratio/region_mean": 0.0015478592504223343, "epoch": 0.1024797438006405, "grad_norm": 0.10648554563522339, "learning_rate": 2e-07, "loss": 0.0395, "step": 1098 }, { "clip_ratio/high_max": 0.0019292561773909256, "clip_ratio/high_mean": 0.0007359561932389624, "clip_ratio/low_mean": 0.0008914447607821785, "clip_ratio/low_min": 0.0001390475736116059, "clip_ratio/region_mean": 0.0016274009685730562, "epoch": 0.10257307690064109, "grad_norm": 0.12148498743772507, "learning_rate": 2e-07, "loss": 0.0441, "step": 1099 }, { "clip_ratio/high_max": 0.001723540324746864, "clip_ratio/high_mean": 0.0007289462173503125, "clip_ratio/low_mean": 0.0008931817719712853, "clip_ratio/low_min": 0.00010042834674095502, "clip_ratio/region_mean": 0.001622127994778566, "epoch": 0.10266641000064167, "grad_norm": 0.11375328153371811, "learning_rate": 2e-07, "loss": 0.0569, "step": 1100 }, { "clip_ratio/high_max": 0.002119248347298708, "clip_ratio/high_mean": 0.0008900709926820127, "clip_ratio/low_mean": 0.0007716899108345388, "clip_ratio/low_min": 0.00010984358277710271, "clip_ratio/region_mean": 0.0016617609362583607, "epoch": 0.10275974310064225, "grad_norm": 0.1113136038184166, "learning_rate": 2e-07, "loss": 0.0084, "step": 1101 }, { "clip_ratio/high_max": 0.0020283608719182666, "clip_ratio/high_mean": 0.0008413325958827045, "clip_ratio/low_mean": 0.0009567802117089741, "clip_ratio/low_min": 9.349070387543179e-05, "clip_ratio/region_mean": 0.0017981128112296574, "epoch": 0.10285307620064284, "grad_norm": 0.12160176038742065, "learning_rate": 2e-07, "loss": 0.0989, "step": 1102 }, { "clip_ratio/high_max": 0.0022197196230990812, "clip_ratio/high_mean": 0.0007876326981204329, "clip_ratio/low_mean": 0.0006906549378982163, "clip_ratio/low_min": 3.766714598896215e-05, "clip_ratio/region_mean": 0.0014782876351091545, "epoch": 0.10294640930064342, "grad_norm": 0.11059887707233429, "learning_rate": 2e-07, "loss": -0.0393, "step": 1103 }, { "clip_ratio/high_max": 0.001964307619346073, "clip_ratio/high_mean": 0.0007930527499411255, "clip_ratio/low_mean": 0.0007491178021155065, "clip_ratio/low_min": 3.4556951959530124e-05, "clip_ratio/region_mean": 0.001542170561151579, "epoch": 0.103039742400644, "grad_norm": 0.11319715529680252, "learning_rate": 2e-07, "loss": 0.0052, "step": 1104 }, { "clip_ratio/high_max": 0.0019591390519053675, "clip_ratio/high_mean": 0.0007469331721949857, "clip_ratio/low_mean": 0.0008855506912368583, "clip_ratio/low_min": 0.0001102419892049511, "clip_ratio/region_mean": 0.0016324838434229605, "epoch": 0.10313307550064459, "grad_norm": 0.11341693252325058, "learning_rate": 2e-07, "loss": 0.0093, "step": 1105 }, { "clip_ratio/high_max": 0.0017568017065059394, "clip_ratio/high_mean": 0.0007546131946583046, "clip_ratio/low_mean": 0.0008069149516813923, "clip_ratio/low_min": 3.5863718039763626e-05, "clip_ratio/region_mean": 0.0015615281481586862, "epoch": 0.10322640860064516, "grad_norm": 0.10901373624801636, "learning_rate": 2e-07, "loss": 0.0469, "step": 1106 }, { "clip_ratio/high_max": 0.001485999582655495, "clip_ratio/high_mean": 0.0006948374993953621, "clip_ratio/low_mean": 0.000807143625934259, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0015019811289676, "epoch": 0.10331974170064574, "grad_norm": 0.10426880419254303, "learning_rate": 2e-07, "loss": 0.0179, "step": 1107 }, { "clip_ratio/high_max": 0.001955616789928172, "clip_ratio/high_mean": 0.0008533026866643922, "clip_ratio/low_mean": 0.0007920500029285904, "clip_ratio/low_min": 4.137967607675819e-05, "clip_ratio/region_mean": 0.001645352691411972, "epoch": 0.10341307480064633, "grad_norm": 0.1212708055973053, "learning_rate": 2e-07, "loss": 0.0142, "step": 1108 }, { "clip_ratio/high_max": 0.0018582081138447393, "clip_ratio/high_mean": 0.0007425123112625442, "clip_ratio/low_mean": 0.0008275588079413865, "clip_ratio/low_min": 9.259584112442099e-05, "clip_ratio/region_mean": 0.0015700711301178671, "epoch": 0.10350640790064691, "grad_norm": 0.11190538108348846, "learning_rate": 2e-07, "loss": 0.0232, "step": 1109 }, { "clip_ratio/high_max": 0.0024843899154802784, "clip_ratio/high_mean": 0.0009926175771397538, "clip_ratio/low_mean": 0.0008856208460201742, "clip_ratio/low_min": 5.9152535868634004e-05, "clip_ratio/region_mean": 0.0018782384358928539, "epoch": 0.1035997410006475, "grad_norm": 0.11843601614236832, "learning_rate": 2e-07, "loss": 0.013, "step": 1110 }, { "clip_ratio/high_max": 0.0021362017214414664, "clip_ratio/high_mean": 0.0008731988800718682, "clip_ratio/low_mean": 0.0007880772609496489, "clip_ratio/low_min": 6.004100760037545e-05, "clip_ratio/region_mean": 0.001661276153754443, "epoch": 0.10369307410064808, "grad_norm": 0.11400327831506729, "learning_rate": 2e-07, "loss": 0.0202, "step": 1111 }, { "clip_ratio/high_max": 0.002435993272229098, "clip_ratio/high_mean": 0.0009255400836991612, "clip_ratio/low_mean": 0.0008060041964199627, "clip_ratio/low_min": 3.1354175007436424e-05, "clip_ratio/region_mean": 0.0017315442164544947, "epoch": 0.10378640720064866, "grad_norm": 0.11254655569791794, "learning_rate": 2e-07, "loss": 0.023, "step": 1112 }, { "clip_ratio/high_max": 0.0018898217167588882, "clip_ratio/high_mean": 0.0009461856934649404, "clip_ratio/low_mean": 0.0008216769729187945, "clip_ratio/low_min": 3.1727216992294416e-05, "clip_ratio/region_mean": 0.0017678626645647455, "epoch": 0.10387974030064925, "grad_norm": 0.1092531606554985, "learning_rate": 2e-07, "loss": -0.0034, "step": 1113 }, { "clip_ratio/high_max": 0.0023776433190505486, "clip_ratio/high_mean": 0.0009607675565348472, "clip_ratio/low_mean": 0.0007999022836884251, "clip_ratio/low_min": 2.5491858650639188e-05, "clip_ratio/region_mean": 0.0017606698602321558, "epoch": 0.10397307340064983, "grad_norm": 0.11789583414793015, "learning_rate": 2e-07, "loss": -0.0079, "step": 1114 }, { "clip_ratio/high_max": 0.002123565565852914, "clip_ratio/high_mean": 0.0008442826474492904, "clip_ratio/low_mean": 0.00085145919729257, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0016957418120000511, "epoch": 0.10406640650065041, "grad_norm": 0.11386961489915848, "learning_rate": 2e-07, "loss": 0.0132, "step": 1115 }, { "clip_ratio/high_max": 0.0019518846638675313, "clip_ratio/high_mean": 0.0007517185185861308, "clip_ratio/low_mean": 0.0008811710595182376, "clip_ratio/low_min": 8.791580330580473e-05, "clip_ratio/region_mean": 0.001632889558095485, "epoch": 0.104159739600651, "grad_norm": 0.11639447510242462, "learning_rate": 2e-07, "loss": 0.0505, "step": 1116 }, { "clip_ratio/high_max": 0.0019146030099363998, "clip_ratio/high_mean": 0.0007663730830245186, "clip_ratio/low_mean": 0.000903773423488019, "clip_ratio/low_min": 0.00010537352136452682, "clip_ratio/region_mean": 0.0016701464701327495, "epoch": 0.10425307270065158, "grad_norm": 0.11998254060745239, "learning_rate": 2e-07, "loss": 0.0706, "step": 1117 }, { "clip_ratio/high_max": 0.002060027814877685, "clip_ratio/high_mean": 0.0007911094908195082, "clip_ratio/low_mean": 0.0008561759641452227, "clip_ratio/low_min": 3.8407549254770856e-05, "clip_ratio/region_mean": 0.0016472854476887733, "epoch": 0.10434640580065216, "grad_norm": 0.10776705294847488, "learning_rate": 2e-07, "loss": 0.0417, "step": 1118 }, { "clip_ratio/high_max": 0.0023762541022733785, "clip_ratio/high_mean": 0.0008951831259764731, "clip_ratio/low_mean": 0.0009972692641895264, "clip_ratio/low_min": 0.00018105510616805987, "clip_ratio/region_mean": 0.0018924524410977028, "epoch": 0.10443973890065275, "grad_norm": 0.11696118861436844, "learning_rate": 2e-07, "loss": 0.0537, "step": 1119 }, { "clip_ratio/high_max": 0.0019373905743123032, "clip_ratio/high_mean": 0.0007854196737753227, "clip_ratio/low_mean": 0.0007882638055889402, "clip_ratio/low_min": 5.97609387114062e-05, "clip_ratio/region_mean": 0.0015736834830022417, "epoch": 0.10453307200065333, "grad_norm": 0.11502838879823685, "learning_rate": 2e-07, "loss": 0.0164, "step": 1120 }, { "clip_ratio/high_max": 0.00196491542737931, "clip_ratio/high_mean": 0.0007803541957400739, "clip_ratio/low_mean": 0.0009862065544439247, "clip_ratio/low_min": 0.00016101685196190374, "clip_ratio/region_mean": 0.0017665607228991576, "epoch": 0.10462640510065392, "grad_norm": 0.10364340245723724, "learning_rate": 2e-07, "loss": 0.0502, "step": 1121 }, { "clip_ratio/high_max": 0.0021214132284512743, "clip_ratio/high_mean": 0.0008876967622200027, "clip_ratio/low_mean": 0.0006826360040577129, "clip_ratio/low_min": 4.5663475248147734e-05, "clip_ratio/region_mean": 0.0015703327517258003, "epoch": 0.1047197382006545, "grad_norm": 0.11766502261161804, "learning_rate": 2e-07, "loss": -0.0365, "step": 1122 }, { "clip_ratio/high_max": 0.001993548503378406, "clip_ratio/high_mean": 0.0008586051881138701, "clip_ratio/low_mean": 0.0007542029716205434, "clip_ratio/low_min": 1.2510007763921749e-05, "clip_ratio/region_mean": 0.001612808136997046, "epoch": 0.10481307130065508, "grad_norm": 0.11161106824874878, "learning_rate": 2e-07, "loss": 0.0119, "step": 1123 }, { "clip_ratio/high_max": 0.0020322481723269448, "clip_ratio/high_mean": 0.0009426568030903582, "clip_ratio/low_mean": 0.00084526019054465, "clip_ratio/low_min": 8.557700220990228e-05, "clip_ratio/region_mean": 0.001787917033652775, "epoch": 0.10490640440065567, "grad_norm": 0.1170584112405777, "learning_rate": 2e-07, "loss": -0.0459, "step": 1124 }, { "clip_ratio/high_max": 0.0020064402488060296, "clip_ratio/high_mean": 0.0008623619414720451, "clip_ratio/low_mean": 0.0008255675866166712, "clip_ratio/low_min": 5.298409996612463e-05, "clip_ratio/region_mean": 0.001687929528998211, "epoch": 0.10499973750065625, "grad_norm": 0.1188339814543724, "learning_rate": 2e-07, "loss": 0.0443, "step": 1125 }, { "clip_ratio/high_max": 0.001964855386177078, "clip_ratio/high_mean": 0.0007491772466892144, "clip_ratio/low_mean": 0.0007843884268368129, "clip_ratio/low_min": 5.0382098379486706e-05, "clip_ratio/region_mean": 0.0015335656971728895, "epoch": 0.10509307060065683, "grad_norm": 0.09919366985559464, "learning_rate": 2e-07, "loss": 0.0169, "step": 1126 }, { "clip_ratio/high_max": 0.0022139290085760877, "clip_ratio/high_mean": 0.0009930781252478482, "clip_ratio/low_mean": 0.0007822934021533001, "clip_ratio/low_min": 8.812764463073108e-05, "clip_ratio/region_mean": 0.0017753715728758834, "epoch": 0.10518640370065742, "grad_norm": 0.10725989937782288, "learning_rate": 2e-07, "loss": -0.0389, "step": 1127 }, { "clip_ratio/high_max": 0.0019060509075643495, "clip_ratio/high_mean": 0.0008020602308533853, "clip_ratio/low_mean": 0.0008654398279759334, "clip_ratio/low_min": 3.916478272003587e-05, "clip_ratio/region_mean": 0.001667500073381234, "epoch": 0.105279736800658, "grad_norm": 0.11149710416793823, "learning_rate": 2e-07, "loss": 0.0254, "step": 1128 }, { "clip_ratio/high_max": 0.002058269274129998, "clip_ratio/high_mean": 0.000836152186820982, "clip_ratio/low_mean": 0.0007773707529850071, "clip_ratio/low_min": 7.954085685923928e-05, "clip_ratio/region_mean": 0.0016135229307110421, "epoch": 0.10537306990065858, "grad_norm": 0.11640170216560364, "learning_rate": 2e-07, "loss": 0.0266, "step": 1129 }, { "clip_ratio/high_max": 0.0019290172749606427, "clip_ratio/high_mean": 0.0008134646886901464, "clip_ratio/low_mean": 0.0008313503458339255, "clip_ratio/low_min": 7.45459856261732e-05, "clip_ratio/region_mean": 0.001644815034524072, "epoch": 0.10546640300065917, "grad_norm": 0.11858923733234406, "learning_rate": 2e-07, "loss": 0.0436, "step": 1130 }, { "clip_ratio/high_max": 0.002271311699587386, "clip_ratio/high_mean": 0.0008803390919638332, "clip_ratio/low_mean": 0.000953260936512379, "clip_ratio/low_min": 6.299695905909175e-05, "clip_ratio/region_mean": 0.0018335999993723817, "epoch": 0.10555973610065975, "grad_norm": 0.1107635572552681, "learning_rate": 2e-07, "loss": 0.0014, "step": 1131 }, { "clip_ratio/high_max": 0.0021464369419845752, "clip_ratio/high_mean": 0.0007732665053481469, "clip_ratio/low_mean": 0.0009778240309969988, "clip_ratio/low_min": 0.00014680325239169179, "clip_ratio/region_mean": 0.0017510905672679655, "epoch": 0.10565306920066034, "grad_norm": 0.11545167863368988, "learning_rate": 2e-07, "loss": 0.0534, "step": 1132 }, { "clip_ratio/high_max": 0.0020635016917367466, "clip_ratio/high_mean": 0.0007953010044730036, "clip_ratio/low_mean": 0.0007714597049925942, "clip_ratio/low_min": 5.726727977162227e-05, "clip_ratio/region_mean": 0.0015667607294744812, "epoch": 0.10574640230066092, "grad_norm": 0.11513207107782364, "learning_rate": 2e-07, "loss": -0.0055, "step": 1133 }, { "clip_ratio/high_max": 0.002458238377585076, "clip_ratio/high_mean": 0.0009145115636783885, "clip_ratio/low_mean": 0.0009321716752310749, "clip_ratio/low_min": 3.3603108022361994e-05, "clip_ratio/region_mean": 0.0018466832116246223, "epoch": 0.1058397354006615, "grad_norm": 0.11788010597229004, "learning_rate": 2e-07, "loss": 0.0393, "step": 1134 }, { "clip_ratio/high_max": 0.0018190643058915157, "clip_ratio/high_mean": 0.000730126548660337, "clip_ratio/low_mean": 0.0008839536913001211, "clip_ratio/low_min": 0.00013752832819591276, "clip_ratio/region_mean": 0.0016140802472364157, "epoch": 0.10593306850066209, "grad_norm": 0.10765480250120163, "learning_rate": 2e-07, "loss": 0.0448, "step": 1135 }, { "clip_ratio/high_max": 0.0019771008228417486, "clip_ratio/high_mean": 0.0008210890409827698, "clip_ratio/low_mean": 0.0006791227096982766, "clip_ratio/low_min": 0.00010360239957662998, "clip_ratio/region_mean": 0.0015002117615949828, "epoch": 0.10602640160066266, "grad_norm": 0.1010265126824379, "learning_rate": 2e-07, "loss": -0.0064, "step": 1136 }, { "clip_ratio/high_max": 0.0023271221871254966, "clip_ratio/high_mean": 0.0009044749094755389, "clip_ratio/low_mean": 0.000815372866782127, "clip_ratio/low_min": 9.613530346541665e-05, "clip_ratio/region_mean": 0.001719847772619687, "epoch": 0.10611973470066324, "grad_norm": 0.13308583199977875, "learning_rate": 2e-07, "loss": -0.0005, "step": 1137 }, { "clip_ratio/high_max": 0.0019794295949395746, "clip_ratio/high_mean": 0.0008731149209779687, "clip_ratio/low_mean": 0.0008726155574549921, "clip_ratio/low_min": 7.460645656465204e-05, "clip_ratio/region_mean": 0.0017457305184507277, "epoch": 0.10621306780066384, "grad_norm": 0.12127518653869629, "learning_rate": 2e-07, "loss": 0.0026, "step": 1138 }, { "clip_ratio/high_max": 0.001878964394563809, "clip_ratio/high_mean": 0.0008652834003441967, "clip_ratio/low_mean": 0.0007468720323231537, "clip_ratio/low_min": 6.369221227942035e-05, "clip_ratio/region_mean": 0.0016121554617711809, "epoch": 0.10630640090066441, "grad_norm": 0.12518629431724548, "learning_rate": 2e-07, "loss": 0.0177, "step": 1139 }, { "clip_ratio/high_max": 0.002306116384716006, "clip_ratio/high_mean": 0.0009400194103363901, "clip_ratio/low_mean": 0.0009537517271382967, "clip_ratio/low_min": 0.00016255638547590934, "clip_ratio/region_mean": 0.001893771142931655, "epoch": 0.10639973400066499, "grad_norm": 0.11931274086236954, "learning_rate": 2e-07, "loss": 0.0048, "step": 1140 }, { "clip_ratio/high_max": 0.0017165084354928695, "clip_ratio/high_mean": 0.0006907038568897406, "clip_ratio/low_mean": 0.0008570180252718274, "clip_ratio/low_min": 7.601393735967577e-05, "clip_ratio/region_mean": 0.001547721869428642, "epoch": 0.10649306710066558, "grad_norm": 0.11279512196779251, "learning_rate": 2e-07, "loss": 0.0352, "step": 1141 }, { "clip_ratio/high_max": 0.0019221193215344101, "clip_ratio/high_mean": 0.0007903558325779159, "clip_ratio/low_mean": 0.0009620098207960837, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.001752365642460063, "epoch": 0.10658640020066616, "grad_norm": 0.11947794258594513, "learning_rate": 2e-07, "loss": 0.0236, "step": 1142 }, { "clip_ratio/high_max": 0.0015755723288748413, "clip_ratio/high_mean": 0.000655124849799904, "clip_ratio/low_mean": 0.0008957450372690801, "clip_ratio/low_min": 8.161739151546499e-05, "clip_ratio/region_mean": 0.00155086989980191, "epoch": 0.10667973330066675, "grad_norm": 0.11713862419128418, "learning_rate": 2e-07, "loss": 0.0885, "step": 1143 }, { "clip_ratio/high_max": 0.0018858881885535084, "clip_ratio/high_mean": 0.0008289517463708762, "clip_ratio/low_mean": 0.0008811488642095355, "clip_ratio/low_min": 5.9594045978883514e-05, "clip_ratio/region_mean": 0.0017101006596931256, "epoch": 0.10677306640066733, "grad_norm": 0.11162342131137848, "learning_rate": 2e-07, "loss": 0.0392, "step": 1144 }, { "clip_ratio/high_max": 0.0026227020425722003, "clip_ratio/high_mean": 0.001007443321213941, "clip_ratio/low_mean": 0.0008193480080080917, "clip_ratio/low_min": 4.3744031245296355e-05, "clip_ratio/region_mean": 0.00182679130739416, "epoch": 0.10686639950066791, "grad_norm": 0.12195838987827301, "learning_rate": 2e-07, "loss": 0.0319, "step": 1145 }, { "clip_ratio/high_max": 0.001861441989603918, "clip_ratio/high_mean": 0.000848241808853345, "clip_ratio/low_mean": 0.0008853249128151219, "clip_ratio/low_min": 6.093463525758125e-05, "clip_ratio/region_mean": 0.0017335666852886789, "epoch": 0.1069597326006685, "grad_norm": 0.12574167549610138, "learning_rate": 2e-07, "loss": 0.0384, "step": 1146 }, { "clip_ratio/high_max": 0.0018904901116911788, "clip_ratio/high_mean": 0.000757511894335039, "clip_ratio/low_mean": 0.0010635354010446463, "clip_ratio/low_min": 0.00010545681379880989, "clip_ratio/region_mean": 0.0018210473062936217, "epoch": 0.10705306570066908, "grad_norm": 0.11610447615385056, "learning_rate": 2e-07, "loss": 0.0583, "step": 1147 }, { "clip_ratio/high_max": 0.0022015433132764883, "clip_ratio/high_mean": 0.0008801695385045605, "clip_ratio/low_mean": 0.0008953559645306086, "clip_ratio/low_min": 5.52388792129932e-05, "clip_ratio/region_mean": 0.0017755254448275082, "epoch": 0.10714639880066966, "grad_norm": 0.1057298555970192, "learning_rate": 2e-07, "loss": 0.0346, "step": 1148 }, { "clip_ratio/high_max": 0.002047515841695713, "clip_ratio/high_mean": 0.0008516731268173316, "clip_ratio/low_mean": 0.0009468160096730571, "clip_ratio/low_min": 7.918330265965778e-05, "clip_ratio/region_mean": 0.0017984891819651239, "epoch": 0.10723973190067025, "grad_norm": 0.11584507673978806, "learning_rate": 2e-07, "loss": 0.0413, "step": 1149 }, { "clip_ratio/high_max": 0.0021017427352489904, "clip_ratio/high_mean": 0.0008125445292535005, "clip_ratio/low_mean": 0.0008262821102107409, "clip_ratio/low_min": 9.536821926303674e-05, "clip_ratio/region_mean": 0.0016388266521971673, "epoch": 0.10733306500067083, "grad_norm": 0.12657034397125244, "learning_rate": 2e-07, "loss": -0.0087, "step": 1150 }, { "clip_ratio/high_max": 0.001750627692672424, "clip_ratio/high_mean": 0.000777348228439223, "clip_ratio/low_mean": 0.0010250919531245017, "clip_ratio/low_min": 5.6210994443972595e-05, "clip_ratio/region_mean": 0.0018024401942966506, "epoch": 0.10742639810067142, "grad_norm": 0.11520180106163025, "learning_rate": 2e-07, "loss": 0.0283, "step": 1151 }, { "clip_ratio/high_max": 0.0021279325883369893, "clip_ratio/high_mean": 0.0007706253491051029, "clip_ratio/low_mean": 0.0008342934379470535, "clip_ratio/low_min": 5.73432189412415e-05, "clip_ratio/region_mean": 0.0016049188270699233, "epoch": 0.107519731200672, "grad_norm": 0.12096858024597168, "learning_rate": 2e-07, "loss": 0.0319, "step": 1152 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.015485491071428603, "completions/max_length": 4096.0, "completions/max_terminated_length": 4096.0, "completions/mean_length": 614.3460693359375, "completions/mean_terminated_length": 559.5828857421875, "completions/min_length": 3.0, "completions/min_terminated_length": 3.0, "epoch": 0.10761306430067258, "grad_norm": 0.1160568818449974, "learning_rate": 2e-07, "loss": -0.0061, "num_tokens": 816859429.0, "reward": 0.5833391547203064, "reward_std": 0.19667354226112366, "rewards/simpleverify_reward/mean": 0.5833391547203064, "rewards/simpleverify_reward/std": 0.49300768971443176, "step": 1153 }, { "clip_ratio/high_max": 0.0019169123988831416, "clip_ratio/high_mean": 0.0008564926611143164, "clip_ratio/low_mean": 0.00048126526235137135, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0013377579125517514, "epoch": 0.10770639740067317, "grad_norm": 0.11682841926813126, "learning_rate": 2e-07, "loss": -0.0141, "step": 1154 }, { "clip_ratio/high_max": 0.0019670104811666533, "clip_ratio/high_mean": 0.00077349924686132, "clip_ratio/low_mean": 0.0005076172701592441, "clip_ratio/low_min": 4.773238470079377e-05, "clip_ratio/region_mean": 0.0012811165288439952, "epoch": 0.10779973050067375, "grad_norm": 0.11736146360635757, "learning_rate": 2e-07, "loss": 0.0125, "step": 1155 }, { "clip_ratio/high_max": 0.002156670092517743, "clip_ratio/high_mean": 0.0008013919778022682, "clip_ratio/low_mean": 0.0005886760918656364, "clip_ratio/low_min": 4.0733886635280214e-05, "clip_ratio/region_mean": 0.0013900680605729576, "epoch": 0.10789306360067433, "grad_norm": 0.11771664023399353, "learning_rate": 2e-07, "loss": 0.0168, "step": 1156 }, { "clip_ratio/high_max": 0.0017371336252836045, "clip_ratio/high_mean": 0.0007800079074513633, "clip_ratio/low_mean": 0.000612374702541274, "clip_ratio/low_min": 4.243132752890233e-05, "clip_ratio/region_mean": 0.0013923826663813088, "epoch": 0.10798639670067492, "grad_norm": 0.1343723088502884, "learning_rate": 2e-07, "loss": 0.0346, "step": 1157 }, { "clip_ratio/high_max": 0.00187909827218391, "clip_ratio/high_mean": 0.0007998681248864159, "clip_ratio/low_mean": 0.0006239180329430383, "clip_ratio/low_min": 2.607074839033885e-05, "clip_ratio/region_mean": 0.001423786161467433, "epoch": 0.1080797298006755, "grad_norm": 0.11986269056797028, "learning_rate": 2e-07, "loss": 0.0291, "step": 1158 }, { "clip_ratio/high_max": 0.0025008884440467227, "clip_ratio/high_mean": 0.0008782572058407823, "clip_ratio/low_mean": 0.0005666578172167647, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.001444915007596137, "epoch": 0.10817306290067608, "grad_norm": 0.12095480412244797, "learning_rate": 2e-07, "loss": -0.0002, "step": 1159 }, { "clip_ratio/high_max": 0.0019961771031375974, "clip_ratio/high_mean": 0.0008152804002747871, "clip_ratio/low_mean": 0.0006073411987017607, "clip_ratio/low_min": 2.481021329003852e-05, "clip_ratio/region_mean": 0.001422621604433516, "epoch": 0.10826639600067667, "grad_norm": 0.11017649620771408, "learning_rate": 2e-07, "loss": 0.0507, "step": 1160 }, { "clip_ratio/high_max": 0.0019432085173320957, "clip_ratio/high_mean": 0.0007215921432361938, "clip_ratio/low_mean": 0.0006896377508383011, "clip_ratio/low_min": 1.6094848888315028e-05, "clip_ratio/region_mean": 0.0014112299249973148, "epoch": 0.10835972910067725, "grad_norm": 0.13379618525505066, "learning_rate": 2e-07, "loss": 0.0507, "step": 1161 }, { "clip_ratio/high_max": 0.0018634473090060055, "clip_ratio/high_mean": 0.0007880788671172922, "clip_ratio/low_mean": 0.00048597215209156275, "clip_ratio/low_min": 2.084969946736237e-05, "clip_ratio/region_mean": 0.0012740510210278444, "epoch": 0.10845306220067784, "grad_norm": 0.11517704278230667, "learning_rate": 2e-07, "loss": 0.0143, "step": 1162 }, { "clip_ratio/high_max": 0.0020613764427253045, "clip_ratio/high_mean": 0.0008299237488245126, "clip_ratio/low_mean": 0.0005871897246834124, "clip_ratio/low_min": 1.0952422599075362e-05, "clip_ratio/region_mean": 0.0014171135226206388, "epoch": 0.10854639530067842, "grad_norm": 0.12492489069700241, "learning_rate": 2e-07, "loss": 0.0236, "step": 1163 }, { "clip_ratio/high_max": 0.0021904926034039818, "clip_ratio/high_mean": 0.0008724889667064417, "clip_ratio/low_mean": 0.0005500883307831828, "clip_ratio/low_min": 4.500663726503262e-05, "clip_ratio/region_mean": 0.0014225773156795185, "epoch": 0.108639728400679, "grad_norm": 0.13476698100566864, "learning_rate": 2e-07, "loss": -0.0069, "step": 1164 }, { "clip_ratio/high_max": 0.002182456912123598, "clip_ratio/high_mean": 0.0008935629884945229, "clip_ratio/low_mean": 0.0005632210577459773, "clip_ratio/low_min": 1.8590124454931356e-05, "clip_ratio/region_mean": 0.0014567840480594896, "epoch": 0.10873306150067959, "grad_norm": 0.1174546554684639, "learning_rate": 2e-07, "loss": 0.0437, "step": 1165 }, { "clip_ratio/high_max": 0.0020987595053156838, "clip_ratio/high_mean": 0.0008152350537784514, "clip_ratio/low_mean": 0.000653669891107711, "clip_ratio/low_min": 3.969934186898172e-05, "clip_ratio/region_mean": 0.0014689049530716147, "epoch": 0.10882639460068017, "grad_norm": 0.12381657212972641, "learning_rate": 2e-07, "loss": 0.0259, "step": 1166 }, { "clip_ratio/high_max": 0.0019331540679559112, "clip_ratio/high_mean": 0.0007569987756141927, "clip_ratio/low_mean": 0.0005940187456872081, "clip_ratio/low_min": 2.534651957830647e-05, "clip_ratio/region_mean": 0.0013510174940165598, "epoch": 0.10891972770068074, "grad_norm": 0.10602670907974243, "learning_rate": 2e-07, "loss": -0.0147, "step": 1167 }, { "clip_ratio/high_max": 0.0021925612782069948, "clip_ratio/high_mean": 0.0008483400670229457, "clip_ratio/low_mean": 0.0006754874666512478, "clip_ratio/low_min": 5.366726963984547e-05, "clip_ratio/region_mean": 0.0015238275482261088, "epoch": 0.10901306080068134, "grad_norm": 0.11531234532594681, "learning_rate": 2e-07, "loss": 0.036, "step": 1168 }, { "clip_ratio/high_max": 0.0016864828648976982, "clip_ratio/high_mean": 0.0006497343565570191, "clip_ratio/low_mean": 0.0007049825926515041, "clip_ratio/low_min": 2.9486224775610026e-05, "clip_ratio/region_mean": 0.001354716943751555, "epoch": 0.10910639390068191, "grad_norm": 0.12472192198038101, "learning_rate": 2e-07, "loss": 0.0673, "step": 1169 }, { "clip_ratio/high_max": 0.0017993573201238178, "clip_ratio/high_mean": 0.0008040061402425636, "clip_ratio/low_mean": 0.0005592716988758184, "clip_ratio/low_min": 2.8837846002716105e-05, "clip_ratio/region_mean": 0.0013632778354804032, "epoch": 0.10919972700068249, "grad_norm": 0.12474675476551056, "learning_rate": 2e-07, "loss": 0.0274, "step": 1170 }, { "clip_ratio/high_max": 0.0019246646043029614, "clip_ratio/high_mean": 0.0008153026283252984, "clip_ratio/low_mean": 0.0007104376463757944, "clip_ratio/low_min": 5.048953153163893e-05, "clip_ratio/region_mean": 0.0015257402847055346, "epoch": 0.10929306010068308, "grad_norm": 0.12403801828622818, "learning_rate": 2e-07, "loss": 0.0407, "step": 1171 }, { "clip_ratio/high_max": 0.0019398540098336525, "clip_ratio/high_mean": 0.0008247403020504862, "clip_ratio/low_mean": 0.0007010963818174787, "clip_ratio/low_min": 6.504519296868239e-05, "clip_ratio/region_mean": 0.0015258366693160497, "epoch": 0.10938639320068366, "grad_norm": 0.11764136701822281, "learning_rate": 2e-07, "loss": 0.0955, "step": 1172 }, { "clip_ratio/high_max": 0.0019484196382109076, "clip_ratio/high_mean": 0.0008372347856493434, "clip_ratio/low_mean": 0.0007686056105740136, "clip_ratio/low_min": 9.999172016250668e-05, "clip_ratio/region_mean": 0.0016058404107752722, "epoch": 0.10947972630068425, "grad_norm": 0.12035224586725235, "learning_rate": 2e-07, "loss": 0.0036, "step": 1173 }, { "clip_ratio/high_max": 0.0017932676819327753, "clip_ratio/high_mean": 0.0007719401273789117, "clip_ratio/low_mean": 0.0006990238034632057, "clip_ratio/low_min": 3.231880873499904e-05, "clip_ratio/region_mean": 0.001470963910833234, "epoch": 0.10957305940068483, "grad_norm": 0.11542928218841553, "learning_rate": 2e-07, "loss": 0.044, "step": 1174 }, { "clip_ratio/high_max": 0.0018528577784309164, "clip_ratio/high_mean": 0.0007469789434253471, "clip_ratio/low_mean": 0.0007874780039855978, "clip_ratio/low_min": 5.4546777391806245e-05, "clip_ratio/region_mean": 0.0015344569583248813, "epoch": 0.10966639250068541, "grad_norm": 0.12118572741746902, "learning_rate": 2e-07, "loss": 0.106, "step": 1175 }, { "clip_ratio/high_max": 0.0019193279586033896, "clip_ratio/high_mean": 0.0007498701488657389, "clip_ratio/low_mean": 0.0007427552063745679, "clip_ratio/low_min": 5.0132297474192455e-05, "clip_ratio/region_mean": 0.0014926253643352538, "epoch": 0.109759725600686, "grad_norm": 0.10780536383390427, "learning_rate": 2e-07, "loss": 0.0456, "step": 1176 }, { "clip_ratio/high_max": 0.0019665240215545055, "clip_ratio/high_mean": 0.0008728644515940687, "clip_ratio/low_mean": 0.0005660294882545713, "clip_ratio/low_min": 3.0269677154137753e-05, "clip_ratio/region_mean": 0.0014388939416676294, "epoch": 0.10985305870068658, "grad_norm": 0.10996058583259583, "learning_rate": 2e-07, "loss": -0.0332, "step": 1177 }, { "clip_ratio/high_max": 0.0018952702666865662, "clip_ratio/high_mean": 0.0007833548497728771, "clip_ratio/low_mean": 0.0006925992456672247, "clip_ratio/low_min": 6.992949329287512e-05, "clip_ratio/region_mean": 0.001475954042689409, "epoch": 0.10994639180068716, "grad_norm": 0.11363290250301361, "learning_rate": 2e-07, "loss": 0.0036, "step": 1178 }, { "clip_ratio/high_max": 0.001990711192775052, "clip_ratio/high_mean": 0.0009112081261264393, "clip_ratio/low_mean": 0.0008442802609351929, "clip_ratio/low_min": 2.433987901895307e-05, "clip_ratio/region_mean": 0.0017554883597767912, "epoch": 0.11003972490068775, "grad_norm": 0.1146884635090828, "learning_rate": 2e-07, "loss": 0.0245, "step": 1179 }, { "clip_ratio/high_max": 0.0019520042551448569, "clip_ratio/high_mean": 0.0008398876561841462, "clip_ratio/low_mean": 0.0007790342351654544, "clip_ratio/low_min": 8.77535312611144e-05, "clip_ratio/region_mean": 0.00161892192409141, "epoch": 0.11013305800068833, "grad_norm": 0.1171574667096138, "learning_rate": 2e-07, "loss": 0.0388, "step": 1180 }, { "clip_ratio/high_max": 0.0022093849365774076, "clip_ratio/high_mean": 0.0008202156514016679, "clip_ratio/low_mean": 0.0005785415651189396, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0013987572492624167, "epoch": 0.11022639110068891, "grad_norm": 0.11124298721551895, "learning_rate": 2e-07, "loss": -0.0162, "step": 1181 }, { "clip_ratio/high_max": 0.0019945314052165486, "clip_ratio/high_mean": 0.0008481447148369625, "clip_ratio/low_mean": 0.0006369259517668979, "clip_ratio/low_min": 6.987217693676939e-05, "clip_ratio/region_mean": 0.0014850707011646591, "epoch": 0.1103197242006895, "grad_norm": 0.1174883171916008, "learning_rate": 2e-07, "loss": 0.0196, "step": 1182 }, { "clip_ratio/high_max": 0.0021828490171174053, "clip_ratio/high_mean": 0.0008022232505027205, "clip_ratio/low_mean": 0.0008029562704905402, "clip_ratio/low_min": 4.004565744253341e-05, "clip_ratio/region_mean": 0.0016051795028033666, "epoch": 0.11041305730069008, "grad_norm": 0.18150027096271515, "learning_rate": 2e-07, "loss": 0.0156, "step": 1183 }, { "clip_ratio/high_max": 0.0019037793535972014, "clip_ratio/high_mean": 0.0007116621418390423, "clip_ratio/low_mean": 0.0007621612639923114, "clip_ratio/low_min": 5.1575255838542944e-05, "clip_ratio/region_mean": 0.0014738233876414597, "epoch": 0.11050639040069067, "grad_norm": 0.1087121069431305, "learning_rate": 2e-07, "loss": 0.0506, "step": 1184 }, { "clip_ratio/high_max": 0.0017710304764477769, "clip_ratio/high_mean": 0.0007795245683155372, "clip_ratio/low_mean": 0.0007834432581148576, "clip_ratio/low_min": 5.330464591679629e-05, "clip_ratio/region_mean": 0.0015629678018740378, "epoch": 0.11059972350069125, "grad_norm": 0.1128527820110321, "learning_rate": 2e-07, "loss": 0.0176, "step": 1185 }, { "clip_ratio/high_max": 0.0024984141637105495, "clip_ratio/high_mean": 0.0009966985853679944, "clip_ratio/low_mean": 0.0009169587719952688, "clip_ratio/low_min": 7.654900764464401e-05, "clip_ratio/region_mean": 0.0019136572809657082, "epoch": 0.11069305660069183, "grad_norm": 0.12492623180150986, "learning_rate": 2e-07, "loss": 0.0117, "step": 1186 }, { "clip_ratio/high_max": 0.001772872270521475, "clip_ratio/high_mean": 0.0007062738595777773, "clip_ratio/low_mean": 0.000910099095563055, "clip_ratio/low_min": 0.00015414242989209015, "clip_ratio/region_mean": 0.001616372956050327, "epoch": 0.11078638970069242, "grad_norm": 0.1232641339302063, "learning_rate": 2e-07, "loss": 0.1136, "step": 1187 }, { "clip_ratio/high_max": 0.0019422236837272067, "clip_ratio/high_mean": 0.0008002994400158059, "clip_ratio/low_mean": 0.000754012795368908, "clip_ratio/low_min": 2.9714957236137707e-05, "clip_ratio/region_mean": 0.0015543122353847139, "epoch": 0.110879722800693, "grad_norm": 0.12839746475219727, "learning_rate": 2e-07, "loss": 0.0192, "step": 1188 }, { "clip_ratio/high_max": 0.0017465170240029693, "clip_ratio/high_mean": 0.000802778700744966, "clip_ratio/low_mean": 0.0007932489770610118, "clip_ratio/low_min": 6.0512755226227455e-05, "clip_ratio/region_mean": 0.0015960277014528401, "epoch": 0.11097305590069358, "grad_norm": 0.12504327297210693, "learning_rate": 2e-07, "loss": 0.0446, "step": 1189 }, { "clip_ratio/high_max": 0.002352633724512998, "clip_ratio/high_mean": 0.0009217006318067433, "clip_ratio/low_mean": 0.0008952159241744084, "clip_ratio/low_min": 7.399133301078109e-05, "clip_ratio/region_mean": 0.0018169165632571094, "epoch": 0.11106638900069417, "grad_norm": 0.11342830210924149, "learning_rate": 2e-07, "loss": 0.0202, "step": 1190 }, { "clip_ratio/high_max": 0.00249566811544355, "clip_ratio/high_mean": 0.0010179015807807446, "clip_ratio/low_mean": 0.000696452178999607, "clip_ratio/low_min": 5.6053685511869844e-05, "clip_ratio/region_mean": 0.001714353813440539, "epoch": 0.11115972210069475, "grad_norm": 0.11984187364578247, "learning_rate": 2e-07, "loss": -0.0065, "step": 1191 }, { "clip_ratio/high_max": 0.0018396105806459673, "clip_ratio/high_mean": 0.0006802157577112666, "clip_ratio/low_mean": 0.0007860857422201661, "clip_ratio/low_min": 8.549891572329216e-05, "clip_ratio/region_mean": 0.001466301480832044, "epoch": 0.11125305520069532, "grad_norm": 0.11490648984909058, "learning_rate": 2e-07, "loss": 0.0487, "step": 1192 }, { "clip_ratio/high_max": 0.00193311082693981, "clip_ratio/high_mean": 0.0008310069370054407, "clip_ratio/low_mean": 0.0006997083110036328, "clip_ratio/low_min": 3.4047306598949945e-05, "clip_ratio/region_mean": 0.001530715249828063, "epoch": 0.11134638830069592, "grad_norm": 0.1359480917453766, "learning_rate": 2e-07, "loss": -0.0222, "step": 1193 }, { "clip_ratio/high_max": 0.0018432959441270214, "clip_ratio/high_mean": 0.0007472018041880801, "clip_ratio/low_mean": 0.00083012976210739, "clip_ratio/low_min": 9.060174761543749e-05, "clip_ratio/region_mean": 0.0015773315753904171, "epoch": 0.1114397214006965, "grad_norm": 0.10427822172641754, "learning_rate": 2e-07, "loss": 0.0706, "step": 1194 }, { "clip_ratio/high_max": 0.0021867651084903628, "clip_ratio/high_mean": 0.0008061830376391299, "clip_ratio/low_mean": 0.0007828877423889935, "clip_ratio/low_min": 4.988770160707645e-05, "clip_ratio/region_mean": 0.0015890707727521658, "epoch": 0.11153305450069709, "grad_norm": 0.11788173764944077, "learning_rate": 2e-07, "loss": 0.0379, "step": 1195 }, { "clip_ratio/high_max": 0.0017576654408912873, "clip_ratio/high_mean": 0.0007978930552781094, "clip_ratio/low_mean": 0.000846145638206508, "clip_ratio/low_min": 9.403496369486675e-05, "clip_ratio/region_mean": 0.0016440386898466386, "epoch": 0.11162638760069767, "grad_norm": 0.11406026035547256, "learning_rate": 2e-07, "loss": 0.0393, "step": 1196 }, { "clip_ratio/high_max": 0.0019311979958729353, "clip_ratio/high_mean": 0.0008237655638367869, "clip_ratio/low_mean": 0.0007275782882061321, "clip_ratio/low_min": 3.051213025173638e-05, "clip_ratio/region_mean": 0.001551343852042919, "epoch": 0.11171972070069824, "grad_norm": 0.10777253657579422, "learning_rate": 2e-07, "loss": 0.0217, "step": 1197 }, { "clip_ratio/high_max": 0.0022947357247176114, "clip_ratio/high_mean": 0.0008924265239329543, "clip_ratio/low_mean": 0.0007863756072765682, "clip_ratio/low_min": 3.124994691461325e-05, "clip_ratio/region_mean": 0.0016788021493994165, "epoch": 0.11181305380069884, "grad_norm": 0.12788107991218567, "learning_rate": 2e-07, "loss": 0.0229, "step": 1198 }, { "clip_ratio/high_max": 0.0020752979107783176, "clip_ratio/high_mean": 0.0008639029529149411, "clip_ratio/low_mean": 0.0008551260452804854, "clip_ratio/low_min": 4.765569156006677e-05, "clip_ratio/region_mean": 0.001719029045489151, "epoch": 0.11190638690069941, "grad_norm": 0.11600267142057419, "learning_rate": 2e-07, "loss": 0.0228, "step": 1199 }, { "clip_ratio/high_max": 0.0020669780496973544, "clip_ratio/high_mean": 0.0008292913735203911, "clip_ratio/low_mean": 0.0007420840938721085, "clip_ratio/low_min": 1.660467569308821e-05, "clip_ratio/region_mean": 0.0015713754655735102, "epoch": 0.11199972000069999, "grad_norm": 0.11781024932861328, "learning_rate": 2e-07, "loss": 0.0419, "step": 1200 }, { "clip_ratio/high_max": 0.002111534631694667, "clip_ratio/high_mean": 0.0009496090933680534, "clip_ratio/low_mean": 0.0007281413145392435, "clip_ratio/low_min": 6.176906663313275e-05, "clip_ratio/region_mean": 0.0016777504206402227, "epoch": 0.11209305310070058, "grad_norm": 0.11852071434259415, "learning_rate": 2e-07, "loss": -0.0496, "step": 1201 }, { "clip_ratio/high_max": 0.001932803810632322, "clip_ratio/high_mean": 0.0008238646278186934, "clip_ratio/low_mean": 0.0007732026533631142, "clip_ratio/low_min": 9.599760960554704e-05, "clip_ratio/region_mean": 0.001597067283000797, "epoch": 0.11218638620070116, "grad_norm": 0.11483114957809448, "learning_rate": 2e-07, "loss": 0.0114, "step": 1202 }, { "clip_ratio/high_max": 0.002115432929713279, "clip_ratio/high_mean": 0.0007764452129777055, "clip_ratio/low_mean": 0.000762305322496104, "clip_ratio/low_min": 0.00011534126133483369, "clip_ratio/region_mean": 0.0015387505773105659, "epoch": 0.11227971930070174, "grad_norm": 0.11859200894832611, "learning_rate": 2e-07, "loss": 0.0401, "step": 1203 }, { "clip_ratio/high_max": 0.002112038455379661, "clip_ratio/high_mean": 0.0008635458652861416, "clip_ratio/low_mean": 0.0006961665949347662, "clip_ratio/low_min": 3.740331521839835e-05, "clip_ratio/region_mean": 0.0015597124365740456, "epoch": 0.11237305240070233, "grad_norm": 0.10531630367040634, "learning_rate": 2e-07, "loss": -0.0046, "step": 1204 }, { "clip_ratio/high_max": 0.002204091757448623, "clip_ratio/high_mean": 0.000830211965876515, "clip_ratio/low_mean": 0.000871369486048934, "clip_ratio/low_min": 6.462169403675944e-05, "clip_ratio/region_mean": 0.0017015814082697034, "epoch": 0.11246638550070291, "grad_norm": 0.11408296227455139, "learning_rate": 2e-07, "loss": 0.0207, "step": 1205 }, { "clip_ratio/high_max": 0.0017554707228555344, "clip_ratio/high_mean": 0.0007931946820463054, "clip_ratio/low_mean": 0.0007716078835073858, "clip_ratio/low_min": 4.33665445598308e-05, "clip_ratio/region_mean": 0.0015648025437258184, "epoch": 0.1125597186007035, "grad_norm": 0.09365818649530411, "learning_rate": 2e-07, "loss": 0.0129, "step": 1206 }, { "clip_ratio/high_max": 0.0022533061637659557, "clip_ratio/high_mean": 0.0009474693124502664, "clip_ratio/low_mean": 0.0009492696426605107, "clip_ratio/low_min": 0.00015591148167004576, "clip_ratio/region_mean": 0.0018967389696626924, "epoch": 0.11265305170070408, "grad_norm": 0.13851717114448547, "learning_rate": 2e-07, "loss": 0.0406, "step": 1207 }, { "clip_ratio/high_max": 0.0020389800920384005, "clip_ratio/high_mean": 0.000793401149167039, "clip_ratio/low_mean": 0.0008588657055952353, "clip_ratio/low_min": 0.00011588213010327308, "clip_ratio/region_mean": 0.0016522668520337902, "epoch": 0.11274638480070466, "grad_norm": 0.108412966132164, "learning_rate": 2e-07, "loss": 0.0156, "step": 1208 }, { "clip_ratio/high_max": 0.0016904340118344408, "clip_ratio/high_mean": 0.0007059813679006766, "clip_ratio/low_mean": 0.0008582589980505873, "clip_ratio/low_min": 2.127638344973093e-05, "clip_ratio/region_mean": 0.0015642403304809704, "epoch": 0.11283971790070525, "grad_norm": 0.10778053104877472, "learning_rate": 2e-07, "loss": 0.0619, "step": 1209 }, { "clip_ratio/high_max": 0.001868135997938225, "clip_ratio/high_mean": 0.0007393834193862858, "clip_ratio/low_mean": 0.0009097276015381794, "clip_ratio/low_min": 9.324779966846108e-05, "clip_ratio/region_mean": 0.0016491109963681083, "epoch": 0.11293305100070583, "grad_norm": 0.10354004800319672, "learning_rate": 2e-07, "loss": 0.0217, "step": 1210 }, { "clip_ratio/high_max": 0.0020001848024548963, "clip_ratio/high_mean": 0.0007857140280975727, "clip_ratio/low_mean": 0.0007351571393883205, "clip_ratio/low_min": 6.782066338928416e-05, "clip_ratio/region_mean": 0.0015208711556624621, "epoch": 0.11302638410070641, "grad_norm": 0.11621309071779251, "learning_rate": 2e-07, "loss": 0.001, "step": 1211 }, { "clip_ratio/high_max": 0.0020490801907726564, "clip_ratio/high_mean": 0.0008738568358239718, "clip_ratio/low_mean": 0.0008715053427295061, "clip_ratio/low_min": 0.00010988885514962021, "clip_ratio/region_mean": 0.0017453621985623613, "epoch": 0.113119717200707, "grad_norm": 0.11413492262363434, "learning_rate": 2e-07, "loss": 0.003, "step": 1212 }, { "clip_ratio/high_max": 0.0020726569382532034, "clip_ratio/high_mean": 0.0007956870304042241, "clip_ratio/low_mean": 0.0008640593987365719, "clip_ratio/low_min": 3.67334287147969e-05, "clip_ratio/region_mean": 0.0016597464491496794, "epoch": 0.11321305030070758, "grad_norm": 0.1138414666056633, "learning_rate": 2e-07, "loss": 0.0524, "step": 1213 }, { "clip_ratio/high_max": 0.001865880643890705, "clip_ratio/high_mean": 0.0007615362956130411, "clip_ratio/low_mean": 0.0009168303731712513, "clip_ratio/low_min": 0.00011854500962726888, "clip_ratio/region_mean": 0.001678366657870356, "epoch": 0.11330638340070817, "grad_norm": 0.12223517894744873, "learning_rate": 2e-07, "loss": 0.0331, "step": 1214 }, { "clip_ratio/high_max": 0.001995548060222063, "clip_ratio/high_mean": 0.0007981050257512834, "clip_ratio/low_mean": 0.0007976561855684849, "clip_ratio/low_min": 6.560211113537662e-05, "clip_ratio/region_mean": 0.0015957612231431995, "epoch": 0.11339971650070875, "grad_norm": 0.11277613043785095, "learning_rate": 2e-07, "loss": 0.0496, "step": 1215 }, { "clip_ratio/high_max": 0.002083441569993738, "clip_ratio/high_mean": 0.0008352843960892642, "clip_ratio/low_mean": 0.0008326690731337294, "clip_ratio/low_min": 8.29732334750588e-05, "clip_ratio/region_mean": 0.0016679534746799618, "epoch": 0.11349304960070933, "grad_norm": 0.11591725051403046, "learning_rate": 2e-07, "loss": 0.0388, "step": 1216 }, { "clip_ratio/high_max": 0.002270214376039803, "clip_ratio/high_mean": 0.0009172108530037804, "clip_ratio/low_mean": 0.0008881935473254998, "clip_ratio/low_min": 8.657275520818075e-05, "clip_ratio/region_mean": 0.00180540432484122, "epoch": 0.11358638270070992, "grad_norm": 0.12421771883964539, "learning_rate": 2e-07, "loss": 0.0164, "step": 1217 }, { "clip_ratio/high_max": 0.0020374860214360524, "clip_ratio/high_mean": 0.0008294130730064353, "clip_ratio/low_mean": 0.0008619504751550267, "clip_ratio/low_min": 3.186044432368362e-05, "clip_ratio/region_mean": 0.001691363548161462, "epoch": 0.1136797158007105, "grad_norm": 0.11322672665119171, "learning_rate": 2e-07, "loss": 0.0195, "step": 1218 }, { "clip_ratio/high_max": 0.0022462502020061947, "clip_ratio/high_mean": 0.000882840311533073, "clip_ratio/low_mean": 0.0008962206593423616, "clip_ratio/low_min": 1.4977234968682751e-05, "clip_ratio/region_mean": 0.0017790609781513922, "epoch": 0.11377304890071108, "grad_norm": 0.1102449968457222, "learning_rate": 2e-07, "loss": -0.0037, "step": 1219 }, { "clip_ratio/high_max": 0.001908599238959141, "clip_ratio/high_mean": 0.0007807299298292492, "clip_ratio/low_mean": 0.00081813555516419, "clip_ratio/low_min": 6.076049521652749e-05, "clip_ratio/region_mean": 0.0015988655140972696, "epoch": 0.11386638200071167, "grad_norm": 0.10638296604156494, "learning_rate": 2e-07, "loss": 0.0481, "step": 1220 }, { "clip_ratio/high_max": 0.002443530276650563, "clip_ratio/high_mean": 0.000935048579776776, "clip_ratio/low_mean": 0.0008235428176703863, "clip_ratio/low_min": 2.9591305064968765e-05, "clip_ratio/region_mean": 0.0017585913810762577, "epoch": 0.11395971510071225, "grad_norm": 0.11245433241128922, "learning_rate": 2e-07, "loss": 0.0001, "step": 1221 }, { "clip_ratio/high_max": 0.001613102896953933, "clip_ratio/high_mean": 0.0008267928351415321, "clip_ratio/low_mean": 0.0009212252953147981, "clip_ratio/low_min": 0.00013178066365071572, "clip_ratio/region_mean": 0.0017480181122664362, "epoch": 0.11405304820071283, "grad_norm": 0.11638496816158295, "learning_rate": 2e-07, "loss": 0.0469, "step": 1222 }, { "clip_ratio/high_max": 0.0019148120263707824, "clip_ratio/high_mean": 0.0008064890771493083, "clip_ratio/low_mean": 0.0008693019208294572, "clip_ratio/low_min": 6.363917600538116e-05, "clip_ratio/region_mean": 0.0016757910016167443, "epoch": 0.11414638130071342, "grad_norm": 0.10747750103473663, "learning_rate": 2e-07, "loss": 0.0025, "step": 1223 }, { "clip_ratio/high_max": 0.0021657798606611323, "clip_ratio/high_mean": 0.0008227466141761397, "clip_ratio/low_mean": 0.0007386120159935672, "clip_ratio/low_min": 5.230808710621204e-05, "clip_ratio/region_mean": 0.0015613586401741486, "epoch": 0.114239714400714, "grad_norm": 0.10033287853002548, "learning_rate": 2e-07, "loss": -0.0017, "step": 1224 }, { "clip_ratio/high_max": 0.0016708233197277877, "clip_ratio/high_mean": 0.0008065455876931082, "clip_ratio/low_mean": 0.0006711288515361957, "clip_ratio/low_min": 3.706374400280765e-05, "clip_ratio/region_mean": 0.001477674457419198, "epoch": 0.11433304750071459, "grad_norm": 0.10920832306146622, "learning_rate": 2e-07, "loss": 0.038, "step": 1225 }, { "clip_ratio/high_max": 0.0018396891173324548, "clip_ratio/high_mean": 0.0006660056760665611, "clip_ratio/low_mean": 0.0008196005619538482, "clip_ratio/low_min": 4.479878680285765e-05, "clip_ratio/region_mean": 0.001485606193455169, "epoch": 0.11442638060071517, "grad_norm": 0.12292346358299255, "learning_rate": 2e-07, "loss": 0.0468, "step": 1226 }, { "clip_ratio/high_max": 0.0019379481600481085, "clip_ratio/high_mean": 0.0007798262795404298, "clip_ratio/low_mean": 0.0008681403596710879, "clip_ratio/low_min": 5.457082261273172e-05, "clip_ratio/region_mean": 0.0016479666519444436, "epoch": 0.11451971370071574, "grad_norm": 0.11060839891433716, "learning_rate": 2e-07, "loss": 0.021, "step": 1227 }, { "clip_ratio/high_max": 0.001950278445292497, "clip_ratio/high_mean": 0.0007084988519636681, "clip_ratio/low_mean": 0.0008055313737713732, "clip_ratio/low_min": 7.543660558440024e-05, "clip_ratio/region_mean": 0.0015140302675717976, "epoch": 0.11461304680071634, "grad_norm": 0.10495229810476303, "learning_rate": 2e-07, "loss": 0.0043, "step": 1228 }, { "clip_ratio/high_max": 0.0018927559940493666, "clip_ratio/high_mean": 0.0007947094727569493, "clip_ratio/low_mean": 0.0008430821917499998, "clip_ratio/low_min": 8.546850131097017e-05, "clip_ratio/region_mean": 0.001637791639950592, "epoch": 0.11470637990071691, "grad_norm": 0.10346551984548569, "learning_rate": 2e-07, "loss": -0.0028, "step": 1229 }, { "clip_ratio/high_max": 0.0019753634405788034, "clip_ratio/high_mean": 0.0007713105405855458, "clip_ratio/low_mean": 0.0007691345872444799, "clip_ratio/low_min": 9.41641128520132e-05, "clip_ratio/region_mean": 0.0015404451405629516, "epoch": 0.1147997130007175, "grad_norm": 0.11502096801996231, "learning_rate": 2e-07, "loss": 0.0342, "step": 1230 }, { "clip_ratio/high_max": 0.001879706029285444, "clip_ratio/high_mean": 0.0007299277713173069, "clip_ratio/low_mean": 0.0007254328338603955, "clip_ratio/low_min": 3.324135741422651e-05, "clip_ratio/region_mean": 0.001455360630643554, "epoch": 0.11489304610071809, "grad_norm": 0.11662667989730835, "learning_rate": 2e-07, "loss": -0.0251, "step": 1231 }, { "clip_ratio/high_max": 0.0020478001388255507, "clip_ratio/high_mean": 0.0007860343503125478, "clip_ratio/low_mean": 0.0008958977450674865, "clip_ratio/low_min": 0.00010175487113883719, "clip_ratio/region_mean": 0.0016819320881040767, "epoch": 0.11498637920071866, "grad_norm": 0.11087875068187714, "learning_rate": 2e-07, "loss": 0.0539, "step": 1232 }, { "clip_ratio/high_max": 0.0023131085763452575, "clip_ratio/high_mean": 0.0009578384524502326, "clip_ratio/low_mean": 0.0007182490844570566, "clip_ratio/low_min": 5.8581706980476156e-05, "clip_ratio/region_mean": 0.0016760875660111196, "epoch": 0.11507971230071924, "grad_norm": 0.1278061419725418, "learning_rate": 2e-07, "loss": -0.0046, "step": 1233 }, { "clip_ratio/high_max": 0.00219521337930928, "clip_ratio/high_mean": 0.0008923426757974084, "clip_ratio/low_mean": 0.0008511046144121792, "clip_ratio/low_min": 3.810725047515007e-05, "clip_ratio/region_mean": 0.001743447304761503, "epoch": 0.11517304540071983, "grad_norm": 0.10875792801380157, "learning_rate": 2e-07, "loss": 0.0119, "step": 1234 }, { "clip_ratio/high_max": 0.002423665479000192, "clip_ratio/high_mean": 0.0008994623185571982, "clip_ratio/low_mean": 0.0008991525191959227, "clip_ratio/low_min": 0.00011491538771224441, "clip_ratio/region_mean": 0.0017986148086492904, "epoch": 0.11526637850072041, "grad_norm": 0.11544710397720337, "learning_rate": 2e-07, "loss": -0.0081, "step": 1235 }, { "clip_ratio/high_max": 0.0017239671742572682, "clip_ratio/high_mean": 0.0006969740898057353, "clip_ratio/low_mean": 0.0008017204154384672, "clip_ratio/low_min": 7.44395883884863e-05, "clip_ratio/region_mean": 0.0014986944988777395, "epoch": 0.115359711600721, "grad_norm": 0.1294483244419098, "learning_rate": 2e-07, "loss": 0.0729, "step": 1236 }, { "clip_ratio/high_max": 0.002054000688076485, "clip_ratio/high_mean": 0.0008127877972583519, "clip_ratio/low_mean": 0.0009079644332814496, "clip_ratio/low_min": 8.182839519577101e-05, "clip_ratio/region_mean": 0.0017207522432727274, "epoch": 0.11545304470072158, "grad_norm": 0.12334328889846802, "learning_rate": 2e-07, "loss": 0.0434, "step": 1237 }, { "clip_ratio/high_max": 0.0019080756974290125, "clip_ratio/high_mean": 0.0008283273455162998, "clip_ratio/low_mean": 0.0008467517782264622, "clip_ratio/low_min": 1.131836324930191e-05, "clip_ratio/region_mean": 0.0016750791546655819, "epoch": 0.11554637780072216, "grad_norm": 0.10619993507862091, "learning_rate": 2e-07, "loss": 0.0244, "step": 1238 }, { "clip_ratio/high_max": 0.001827751701057423, "clip_ratio/high_mean": 0.0008342516703123692, "clip_ratio/low_mean": 0.0007992610699147917, "clip_ratio/low_min": 4.920940500596771e-05, "clip_ratio/region_mean": 0.001633512758417055, "epoch": 0.11563971090072275, "grad_norm": 0.11235214024782181, "learning_rate": 2e-07, "loss": 0.0397, "step": 1239 }, { "clip_ratio/high_max": 0.0019134866852255072, "clip_ratio/high_mean": 0.0007765542140987236, "clip_ratio/low_mean": 0.000753001899283845, "clip_ratio/low_min": 5.559531655308092e-05, "clip_ratio/region_mean": 0.0015295560806407593, "epoch": 0.11573304400072333, "grad_norm": 0.10510806739330292, "learning_rate": 2e-07, "loss": 0.0262, "step": 1240 }, { "clip_ratio/high_max": 0.002360225422307849, "clip_ratio/high_mean": 0.0009099936050915858, "clip_ratio/low_mean": 0.0008719120560272131, "clip_ratio/low_min": 7.648472001164919e-05, "clip_ratio/region_mean": 0.0017819056520238519, "epoch": 0.11582637710072391, "grad_norm": 0.11368588358163834, "learning_rate": 2e-07, "loss": -0.0212, "step": 1241 }, { "clip_ratio/high_max": 0.0017875433004519437, "clip_ratio/high_mean": 0.0007639376271981746, "clip_ratio/low_mean": 0.0008226685258705402, "clip_ratio/low_min": 4.9217871492146514e-05, "clip_ratio/region_mean": 0.0015866061075939797, "epoch": 0.1159197102007245, "grad_norm": 0.1118081733584404, "learning_rate": 2e-07, "loss": 0.0161, "step": 1242 }, { "clip_ratio/high_max": 0.002419930257019587, "clip_ratio/high_mean": 0.0009026735060615465, "clip_ratio/low_mean": 0.0009171222609438701, "clip_ratio/low_min": 0.00010606079013086855, "clip_ratio/region_mean": 0.0018197957542724907, "epoch": 0.11601304330072508, "grad_norm": 0.11847953498363495, "learning_rate": 2e-07, "loss": 0.0441, "step": 1243 }, { "clip_ratio/high_max": 0.0017746237208484672, "clip_ratio/high_mean": 0.0007691937480558408, "clip_ratio/low_mean": 0.0010152311115234625, "clip_ratio/low_min": 8.938203609432094e-05, "clip_ratio/region_mean": 0.001784424835932441, "epoch": 0.11610637640072566, "grad_norm": 0.11602036654949188, "learning_rate": 2e-07, "loss": 0.0904, "step": 1244 }, { "clip_ratio/high_max": 0.0018058280074910726, "clip_ratio/high_mean": 0.0007626161495863926, "clip_ratio/low_mean": 0.0008111793104035314, "clip_ratio/low_min": 0.00012743080378641025, "clip_ratio/region_mean": 0.001573795496369712, "epoch": 0.11619970950072625, "grad_norm": 0.11438401788473129, "learning_rate": 2e-07, "loss": 0.0416, "step": 1245 }, { "clip_ratio/high_max": 0.0019699835538631305, "clip_ratio/high_mean": 0.0008379699211218394, "clip_ratio/low_mean": 0.0007400125759886578, "clip_ratio/low_min": 1.1993859516223893e-05, "clip_ratio/region_mean": 0.0015779824607307091, "epoch": 0.11629304260072683, "grad_norm": 0.11323001980781555, "learning_rate": 2e-07, "loss": -0.0071, "step": 1246 }, { "clip_ratio/high_max": 0.002266485862492118, "clip_ratio/high_mean": 0.0009387195623276057, "clip_ratio/low_mean": 0.0008420690119237406, "clip_ratio/low_min": 5.7145622122334316e-05, "clip_ratio/region_mean": 0.0017807885451475158, "epoch": 0.11638637570072742, "grad_norm": 0.13581421971321106, "learning_rate": 2e-07, "loss": 0.0156, "step": 1247 }, { "clip_ratio/high_max": 0.0019202183539164253, "clip_ratio/high_mean": 0.0007860586301831063, "clip_ratio/low_mean": 0.0008332226007041754, "clip_ratio/low_min": 9.343978035758482e-05, "clip_ratio/region_mean": 0.0016192812508961651, "epoch": 0.116479708800728, "grad_norm": 0.10907955467700958, "learning_rate": 2e-07, "loss": 0.0044, "step": 1248 }, { "clip_ratio/high_max": 0.0023313688070629723, "clip_ratio/high_mean": 0.000847421440994367, "clip_ratio/low_mean": 0.0008927945455070585, "clip_ratio/low_min": 0.00011394355533411726, "clip_ratio/region_mean": 0.0017402160374331288, "epoch": 0.11657304190072858, "grad_norm": 0.11954310536384583, "learning_rate": 2e-07, "loss": 0.0173, "step": 1249 }, { "clip_ratio/high_max": 0.0021776166358904447, "clip_ratio/high_mean": 0.0008525486719008768, "clip_ratio/low_mean": 0.000859988071169937, "clip_ratio/low_min": 5.5955397328943945e-05, "clip_ratio/region_mean": 0.001712536730337888, "epoch": 0.11666637500072917, "grad_norm": 0.11375118792057037, "learning_rate": 2e-07, "loss": 0.0249, "step": 1250 }, { "clip_ratio/high_max": 0.0018622580537339672, "clip_ratio/high_mean": 0.0007105404729372822, "clip_ratio/low_mean": 0.0008734183829801623, "clip_ratio/low_min": 0.00010334390935895499, "clip_ratio/region_mean": 0.0015839588668313809, "epoch": 0.11675970810072975, "grad_norm": 0.10558773577213287, "learning_rate": 2e-07, "loss": 0.0843, "step": 1251 }, { "clip_ratio/high_max": 0.0018929272482637316, "clip_ratio/high_mean": 0.0007242157244036207, "clip_ratio/low_mean": 0.0008977099041658221, "clip_ratio/low_min": 5.905154557694914e-05, "clip_ratio/region_mean": 0.0016219256212934852, "epoch": 0.11685304120073033, "grad_norm": 0.1191813200712204, "learning_rate": 2e-07, "loss": 0.0606, "step": 1252 }, { "clip_ratio/high_max": 0.0019294920857646503, "clip_ratio/high_mean": 0.0007853019105823478, "clip_ratio/low_mean": 0.000721386204531882, "clip_ratio/low_min": 3.310584997961996e-05, "clip_ratio/region_mean": 0.0015066880951053463, "epoch": 0.11694637430073092, "grad_norm": 0.1070413887500763, "learning_rate": 2e-07, "loss": -0.0102, "step": 1253 }, { "clip_ratio/high_max": 0.0019341374645591713, "clip_ratio/high_mean": 0.0008035879673116142, "clip_ratio/low_mean": 0.0009537913283566013, "clip_ratio/low_min": 0.0001228183509738301, "clip_ratio/region_mean": 0.0017573793011251837, "epoch": 0.1170397074007315, "grad_norm": 0.11011584103107452, "learning_rate": 2e-07, "loss": 0.0485, "step": 1254 }, { "clip_ratio/high_max": 0.0020656913075072225, "clip_ratio/high_mean": 0.000839835543956724, "clip_ratio/low_mean": 0.0007645375662832521, "clip_ratio/low_min": 3.4989998312084936e-05, "clip_ratio/region_mean": 0.0016043731084209867, "epoch": 0.11713304050073207, "grad_norm": 0.12412241101264954, "learning_rate": 2e-07, "loss": 0.0227, "step": 1255 }, { "clip_ratio/high_max": 0.002056520570477005, "clip_ratio/high_mean": 0.0007989274399733404, "clip_ratio/low_mean": 0.0009076085952983703, "clip_ratio/low_min": 9.075580055650789e-05, "clip_ratio/region_mean": 0.0017065360661945306, "epoch": 0.11722637360073267, "grad_norm": 0.1196042150259018, "learning_rate": 2e-07, "loss": 0.0811, "step": 1256 }, { "clip_ratio/high_max": 0.0018036756191577297, "clip_ratio/high_mean": 0.0007927739006845513, "clip_ratio/low_mean": 0.0007583720707771135, "clip_ratio/low_min": 0.00010789481439132942, "clip_ratio/region_mean": 0.0015511459605477285, "epoch": 0.11731970670073325, "grad_norm": 0.12168120592832565, "learning_rate": 2e-07, "loss": 0.0372, "step": 1257 }, { "clip_ratio/high_max": 0.0017812302467064, "clip_ratio/high_mean": 0.0008989349335024599, "clip_ratio/low_mean": 0.0009040644727065228, "clip_ratio/low_min": 1.269551103177946e-05, "clip_ratio/region_mean": 0.0018029994171229191, "epoch": 0.11741303980073384, "grad_norm": 0.1223897859454155, "learning_rate": 2e-07, "loss": -0.0036, "step": 1258 }, { "clip_ratio/high_max": 0.002029828305239789, "clip_ratio/high_mean": 0.0008761010485613951, "clip_ratio/low_mean": 0.000835226315757609, "clip_ratio/low_min": 7.22292170394212e-05, "clip_ratio/region_mean": 0.0017113273534050677, "epoch": 0.11750637290073442, "grad_norm": 0.12463203072547913, "learning_rate": 2e-07, "loss": 0.0055, "step": 1259 }, { "clip_ratio/high_max": 0.0023080080827639904, "clip_ratio/high_mean": 0.0008742368008824997, "clip_ratio/low_mean": 0.0008573055656597717, "clip_ratio/low_min": 4.7253022785298526e-05, "clip_ratio/region_mean": 0.0017315423501713667, "epoch": 0.117599706000735, "grad_norm": 0.10717450827360153, "learning_rate": 2e-07, "loss": 0.036, "step": 1260 }, { "clip_ratio/high_max": 0.002051246599876322, "clip_ratio/high_mean": 0.0008882177753548604, "clip_ratio/low_mean": 0.000920922466320917, "clip_ratio/low_min": 5.8171653108729515e-05, "clip_ratio/region_mean": 0.0018091402598656714, "epoch": 0.11769303910073559, "grad_norm": 0.12884287536144257, "learning_rate": 2e-07, "loss": 0.0504, "step": 1261 }, { "clip_ratio/high_max": 0.001917469362524571, "clip_ratio/high_mean": 0.0007637278740730835, "clip_ratio/low_mean": 0.000919482594326837, "clip_ratio/low_min": 0.00014906526757840766, "clip_ratio/region_mean": 0.0016832105029607192, "epoch": 0.11778637220073616, "grad_norm": 0.11313272267580032, "learning_rate": 2e-07, "loss": 0.069, "step": 1262 }, { "clip_ratio/high_max": 0.0018638844740053173, "clip_ratio/high_mean": 0.0008398063509957865, "clip_ratio/low_mean": 0.0009204009984387085, "clip_ratio/low_min": 5.226992379903095e-05, "clip_ratio/region_mean": 0.0017602073712623678, "epoch": 0.11787970530073674, "grad_norm": 0.11856982111930847, "learning_rate": 2e-07, "loss": 0.0525, "step": 1263 }, { "clip_ratio/high_max": 0.002179149196308572, "clip_ratio/high_mean": 0.0008859064164425945, "clip_ratio/low_mean": 0.0006719771326970658, "clip_ratio/low_min": 3.1709791073808447e-05, "clip_ratio/region_mean": 0.0015578835518681444, "epoch": 0.11797303840073733, "grad_norm": 0.11060228198766708, "learning_rate": 2e-07, "loss": -0.0142, "step": 1264 }, { "clip_ratio/high_max": 0.0020856459777860437, "clip_ratio/high_mean": 0.0009041079429152887, "clip_ratio/low_mean": 0.0007919257222965825, "clip_ratio/low_min": 8.721704034542199e-05, "clip_ratio/region_mean": 0.0016960336652118713, "epoch": 0.11806637150073791, "grad_norm": 0.13098886609077454, "learning_rate": 2e-07, "loss": 0.0322, "step": 1265 }, { "clip_ratio/high_max": 0.002070820795779582, "clip_ratio/high_mean": 0.0008962347928900272, "clip_ratio/low_mean": 0.0007770225038257195, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0016732572476030327, "epoch": 0.1181597046007385, "grad_norm": 0.11110086739063263, "learning_rate": 2e-07, "loss": 0.0106, "step": 1266 }, { "clip_ratio/high_max": 0.002047376019618241, "clip_ratio/high_mean": 0.0008570518875785638, "clip_ratio/low_mean": 0.0010188540127273882, "clip_ratio/low_min": 5.829214296682039e-05, "clip_ratio/region_mean": 0.0018759059385047294, "epoch": 0.11825303770073908, "grad_norm": 0.11763789504766464, "learning_rate": 2e-07, "loss": 0.041, "step": 1267 }, { "clip_ratio/high_max": 0.002049378166702809, "clip_ratio/high_mean": 0.0008164798291545594, "clip_ratio/low_mean": 0.0008584502520534443, "clip_ratio/low_min": 6.599660264328122e-05, "clip_ratio/region_mean": 0.00167493009212194, "epoch": 0.11834637080073966, "grad_norm": 0.11030558496713638, "learning_rate": 2e-07, "loss": 0.0465, "step": 1268 }, { "clip_ratio/high_max": 0.0020261454592400696, "clip_ratio/high_mean": 0.0007925728923510178, "clip_ratio/low_mean": 0.0008793359920673538, "clip_ratio/low_min": 4.802137482329272e-05, "clip_ratio/region_mean": 0.0016719088998797815, "epoch": 0.11843970390074025, "grad_norm": 0.14299002289772034, "learning_rate": 2e-07, "loss": -0.0056, "step": 1269 }, { "clip_ratio/high_max": 0.0020423365858732723, "clip_ratio/high_mean": 0.0008801974145171698, "clip_ratio/low_mean": 0.0009305765324825188, "clip_ratio/low_min": 4.416650790517451e-05, "clip_ratio/region_mean": 0.0018107739160768688, "epoch": 0.11853303700074083, "grad_norm": 0.11933523416519165, "learning_rate": 2e-07, "loss": 0.0502, "step": 1270 }, { "clip_ratio/high_max": 0.0019059473415836692, "clip_ratio/high_mean": 0.0008221294901886722, "clip_ratio/low_mean": 0.0008911958757380489, "clip_ratio/low_min": 2.9392213946266565e-05, "clip_ratio/region_mean": 0.0017133253568317741, "epoch": 0.11862637010074141, "grad_norm": 0.1225162222981453, "learning_rate": 2e-07, "loss": 0.0507, "step": 1271 }, { "clip_ratio/high_max": 0.0021927156267338432, "clip_ratio/high_mean": 0.0008499666091665858, "clip_ratio/low_mean": 0.0007836035438231193, "clip_ratio/low_min": 3.091482631134568e-05, "clip_ratio/region_mean": 0.0016335701511707157, "epoch": 0.118719703200742, "grad_norm": 0.11760083585977554, "learning_rate": 2e-07, "loss": -0.0029, "step": 1272 }, { "clip_ratio/high_max": 0.0018140102129109437, "clip_ratio/high_mean": 0.0006895255910421838, "clip_ratio/low_mean": 0.0009769509288162226, "clip_ratio/low_min": 0.00019755776975216577, "clip_ratio/region_mean": 0.0016664765134919435, "epoch": 0.11881303630074258, "grad_norm": 0.11006279289722443, "learning_rate": 2e-07, "loss": 0.0761, "step": 1273 }, { "clip_ratio/high_max": 0.002206230114097707, "clip_ratio/high_mean": 0.0007905423099145992, "clip_ratio/low_mean": 0.000774677097069798, "clip_ratio/low_min": 2.1493623535207007e-05, "clip_ratio/region_mean": 0.001565219456097111, "epoch": 0.11890636940074316, "grad_norm": 0.12093015015125275, "learning_rate": 2e-07, "loss": 0.0173, "step": 1274 }, { "clip_ratio/high_max": 0.0019278471809229814, "clip_ratio/high_mean": 0.0008056201113504358, "clip_ratio/low_mean": 0.0008403868887398858, "clip_ratio/low_min": 8.407686891587218e-05, "clip_ratio/region_mean": 0.0016460070328321308, "epoch": 0.11899970250074375, "grad_norm": 0.11792382597923279, "learning_rate": 2e-07, "loss": 0.0571, "step": 1275 }, { "clip_ratio/high_max": 0.0018337529145355802, "clip_ratio/high_mean": 0.0007815584731361014, "clip_ratio/low_mean": 0.0010024495277320966, "clip_ratio/low_min": 0.00013555973191614612, "clip_ratio/region_mean": 0.0017840079890447669, "epoch": 0.11909303560074433, "grad_norm": 0.13313107192516327, "learning_rate": 2e-07, "loss": 0.0423, "step": 1276 }, { "clip_ratio/high_max": 0.0024227298599726055, "clip_ratio/high_mean": 0.000993618656139006, "clip_ratio/low_mean": 0.0007206804602901684, "clip_ratio/low_min": 4.507718858803855e-05, "clip_ratio/region_mean": 0.00171429916008492, "epoch": 0.11918636870074492, "grad_norm": 0.12411339581012726, "learning_rate": 2e-07, "loss": -0.0153, "step": 1277 }, { "clip_ratio/high_max": 0.0019752088373934384, "clip_ratio/high_mean": 0.0007882494192017475, "clip_ratio/low_mean": 0.0009225240064552054, "clip_ratio/low_min": 5.028835585108027e-05, "clip_ratio/region_mean": 0.0017107734020100906, "epoch": 0.1192797018007455, "grad_norm": 0.10785482078790665, "learning_rate": 2e-07, "loss": 0.0096, "step": 1278 }, { "clip_ratio/high_max": 0.0022215704739210196, "clip_ratio/high_mean": 0.0009048702522704843, "clip_ratio/low_mean": 0.0008989415910036769, "clip_ratio/low_min": 1.5114873349375557e-05, "clip_ratio/region_mean": 0.0018038118505501188, "epoch": 0.11937303490074608, "grad_norm": 0.12280572950839996, "learning_rate": 2e-07, "loss": 0.0198, "step": 1279 }, { "clip_ratio/high_max": 0.0022226244400371797, "clip_ratio/high_mean": 0.0008412776733166538, "clip_ratio/low_mean": 0.0008919942738430109, "clip_ratio/low_min": 4.465624260774348e-05, "clip_ratio/region_mean": 0.0017332719362457283, "epoch": 0.11946636800074667, "grad_norm": 0.11854033172130585, "learning_rate": 2e-07, "loss": 0.0565, "step": 1280 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.015781947544642905, "completions/max_length": 4096.0, "completions/max_terminated_length": 4091.0, "completions/mean_length": 619.0377197265625, "completions/mean_terminated_length": 563.2845458984375, "completions/min_length": 3.0, "completions/min_terminated_length": 3.0, "epoch": 0.11955970110074725, "grad_norm": 0.12688198685646057, "learning_rate": 2e-07, "loss": 0.0509, "num_tokens": 899221623.0, "reward": 0.5822056531906128, "reward_std": 0.1952030062675476, "rewards/simpleverify_reward/mean": 0.5822056531906128, "rewards/simpleverify_reward/std": 0.49319806694984436, "step": 1281 }, { "clip_ratio/high_max": 0.002237274995422922, "clip_ratio/high_mean": 0.0009497948485659435, "clip_ratio/low_mean": 0.00045672380474570673, "clip_ratio/low_min": 3.3642649214016274e-05, "clip_ratio/region_mean": 0.0014065186369407456, "epoch": 0.11965303420074783, "grad_norm": 0.12993404269218445, "learning_rate": 2e-07, "loss": -0.019, "step": 1282 }, { "clip_ratio/high_max": 0.0018448435730533674, "clip_ratio/high_mean": 0.0007705260904913303, "clip_ratio/low_mean": 0.0005753373970946996, "clip_ratio/low_min": 3.372757146280492e-05, "clip_ratio/region_mean": 0.0013458634966809768, "epoch": 0.11974636730074842, "grad_norm": 0.12392816692590714, "learning_rate": 2e-07, "loss": 0.0266, "step": 1283 }, { "clip_ratio/high_max": 0.0021304773472365923, "clip_ratio/high_mean": 0.0009025477957038675, "clip_ratio/low_mean": 0.00053511579244514, "clip_ratio/low_min": 3.971419391746167e-05, "clip_ratio/region_mean": 0.001437663540855283, "epoch": 0.119839700400749, "grad_norm": 0.11513909697532654, "learning_rate": 2e-07, "loss": -0.0241, "step": 1284 }, { "clip_ratio/high_max": 0.001829718858061824, "clip_ratio/high_mean": 0.0008170826949935872, "clip_ratio/low_mean": 0.0006137321761343628, "clip_ratio/low_min": 1.5703517419751734e-05, "clip_ratio/region_mean": 0.0014308148493000772, "epoch": 0.11993303350074958, "grad_norm": 0.11753255128860474, "learning_rate": 2e-07, "loss": 0.0241, "step": 1285 }, { "clip_ratio/high_max": 0.0020469412629608996, "clip_ratio/high_mean": 0.0008231695210270118, "clip_ratio/low_mean": 0.0006000685425533447, "clip_ratio/low_min": 2.509833575459197e-05, "clip_ratio/region_mean": 0.0014232380453904625, "epoch": 0.12002636660075017, "grad_norm": 0.11521323025226593, "learning_rate": 2e-07, "loss": 0.0218, "step": 1286 }, { "clip_ratio/high_max": 0.001616724875930231, "clip_ratio/high_mean": 0.0006818897909397492, "clip_ratio/low_mean": 0.0007092160594766028, "clip_ratio/low_min": 6.42336990495096e-05, "clip_ratio/region_mean": 0.001391105841321405, "epoch": 0.12011969970075075, "grad_norm": 0.12416064739227295, "learning_rate": 2e-07, "loss": 0.0841, "step": 1287 }, { "clip_ratio/high_max": 0.0023209856371977367, "clip_ratio/high_mean": 0.0008622707955510123, "clip_ratio/low_mean": 0.0006456378250732087, "clip_ratio/low_min": 3.2998945243889466e-05, "clip_ratio/region_mean": 0.001507908611529274, "epoch": 0.12021303280075134, "grad_norm": 0.12193427979946136, "learning_rate": 2e-07, "loss": 0.011, "step": 1288 }, { "clip_ratio/high_max": 0.001958115717570763, "clip_ratio/high_mean": 0.0007254978600030881, "clip_ratio/low_mean": 0.0006155058817967074, "clip_ratio/low_min": 2.332426083739847e-05, "clip_ratio/region_mean": 0.001341003746347269, "epoch": 0.12030636590075192, "grad_norm": 0.12509892880916595, "learning_rate": 2e-07, "loss": 0.0632, "step": 1289 }, { "clip_ratio/high_max": 0.0018624325784912799, "clip_ratio/high_mean": 0.00074036071964656, "clip_ratio/low_mean": 0.0005930324659857433, "clip_ratio/low_min": 2.6523425731284078e-05, "clip_ratio/region_mean": 0.0013333931783563457, "epoch": 0.1203996990007525, "grad_norm": 0.1452750712633133, "learning_rate": 2e-07, "loss": 0.0686, "step": 1290 }, { "clip_ratio/high_max": 0.0017573742479726207, "clip_ratio/high_mean": 0.0007294003844435792, "clip_ratio/low_mean": 0.0006194503430378973, "clip_ratio/low_min": 4.2847221266129054e-05, "clip_ratio/region_mean": 0.0013488507247529924, "epoch": 0.12049303210075309, "grad_norm": 0.11402731388807297, "learning_rate": 2e-07, "loss": 0.0728, "step": 1291 }, { "clip_ratio/high_max": 0.0018332460822421126, "clip_ratio/high_mean": 0.0007175283953984035, "clip_ratio/low_mean": 0.0005725871251343051, "clip_ratio/low_min": 3.2476525120728184e-05, "clip_ratio/region_mean": 0.0012901155205327086, "epoch": 0.12058636520075366, "grad_norm": 0.11244647949934006, "learning_rate": 2e-07, "loss": 0.0156, "step": 1292 }, { "clip_ratio/high_max": 0.0019175177767465357, "clip_ratio/high_mean": 0.0007106208777258871, "clip_ratio/low_mean": 0.0006810693266743328, "clip_ratio/low_min": 7.588348125864286e-05, "clip_ratio/region_mean": 0.0013916902171331458, "epoch": 0.12067969830075424, "grad_norm": 0.10773490369319916, "learning_rate": 2e-07, "loss": 0.0405, "step": 1293 }, { "clip_ratio/high_max": 0.002088671848468948, "clip_ratio/high_mean": 0.00087170261394931, "clip_ratio/low_mean": 0.0006050293650332605, "clip_ratio/low_min": 4.853846530750161e-05, "clip_ratio/region_mean": 0.0014767319662496448, "epoch": 0.12077303140075484, "grad_norm": 0.1277056336402893, "learning_rate": 2e-07, "loss": 0.0117, "step": 1294 }, { "clip_ratio/high_max": 0.0016398517218476627, "clip_ratio/high_mean": 0.0006783624103263719, "clip_ratio/low_mean": 0.0006956428778721602, "clip_ratio/low_min": 2.8436493266781326e-05, "clip_ratio/region_mean": 0.0013740053072979208, "epoch": 0.12086636450075541, "grad_norm": 0.11704213172197342, "learning_rate": 2e-07, "loss": 0.0599, "step": 1295 }, { "clip_ratio/high_max": 0.002175861653086031, "clip_ratio/high_mean": 0.0008985730146378046, "clip_ratio/low_mean": 0.0006175336911837803, "clip_ratio/low_min": 4.370401438791305e-05, "clip_ratio/region_mean": 0.0015161067130975425, "epoch": 0.12095969760075599, "grad_norm": 0.12253289669752121, "learning_rate": 2e-07, "loss": -0.0297, "step": 1296 }, { "clip_ratio/high_max": 0.0018491959672246594, "clip_ratio/high_mean": 0.0007620924207003554, "clip_ratio/low_mean": 0.0005179382551432354, "clip_ratio/low_min": 1.4124293556960765e-05, "clip_ratio/region_mean": 0.001280030672205612, "epoch": 0.12105303070075658, "grad_norm": 0.11305180937051773, "learning_rate": 2e-07, "loss": 0.0194, "step": 1297 }, { "clip_ratio/high_max": 0.0021752618777099997, "clip_ratio/high_mean": 0.0008719950565136969, "clip_ratio/low_mean": 0.0005499561575561529, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.001421951219526818, "epoch": 0.12114636380075716, "grad_norm": 0.12070444226264954, "learning_rate": 2e-07, "loss": -0.0185, "step": 1298 }, { "clip_ratio/high_max": 0.0017141780554084107, "clip_ratio/high_mean": 0.0007650631814613007, "clip_ratio/low_mean": 0.0006180219888847205, "clip_ratio/low_min": 6.00194343860494e-05, "clip_ratio/region_mean": 0.0013830851930833887, "epoch": 0.12123969690075775, "grad_norm": 0.12539488077163696, "learning_rate": 2e-07, "loss": 0.0286, "step": 1299 }, { "clip_ratio/high_max": 0.0018528481814428233, "clip_ratio/high_mean": 0.0007961042465467472, "clip_ratio/low_mean": 0.000547546791494824, "clip_ratio/low_min": 1.6923910152399912e-05, "clip_ratio/region_mean": 0.0013436510853352956, "epoch": 0.12133303000075833, "grad_norm": 0.12457545101642609, "learning_rate": 2e-07, "loss": 0.0152, "step": 1300 }, { "clip_ratio/high_max": 0.001839087221014779, "clip_ratio/high_mean": 0.0007433371229126351, "clip_ratio/low_mean": 0.0006297287545748986, "clip_ratio/low_min": 3.695238865475403e-05, "clip_ratio/region_mean": 0.0013730659156863112, "epoch": 0.12142636310075891, "grad_norm": 0.11740198731422424, "learning_rate": 2e-07, "loss": 0.0215, "step": 1301 }, { "clip_ratio/high_max": 0.0018031347062787972, "clip_ratio/high_mean": 0.0007138295222830493, "clip_ratio/low_mean": 0.000810269966677879, "clip_ratio/low_min": 5.719525506719947e-05, "clip_ratio/region_mean": 0.0015240995271597058, "epoch": 0.1215196962007595, "grad_norm": 0.11833522468805313, "learning_rate": 2e-07, "loss": 0.0543, "step": 1302 }, { "clip_ratio/high_max": 0.0023794261760485824, "clip_ratio/high_mean": 0.0009604798960936023, "clip_ratio/low_mean": 0.0006661318457190646, "clip_ratio/low_min": 1.5508685464737937e-05, "clip_ratio/region_mean": 0.0016266117454506457, "epoch": 0.12161302930076008, "grad_norm": 0.11131729185581207, "learning_rate": 2e-07, "loss": -0.0044, "step": 1303 }, { "clip_ratio/high_max": 0.0017867329625005368, "clip_ratio/high_mean": 0.0007614299229317112, "clip_ratio/low_mean": 0.0007110604146873811, "clip_ratio/low_min": 2.931691415142268e-05, "clip_ratio/region_mean": 0.0014724903521710075, "epoch": 0.12170636240076066, "grad_norm": 0.1142159253358841, "learning_rate": 2e-07, "loss": 0.0464, "step": 1304 }, { "clip_ratio/high_max": 0.0018880033640016336, "clip_ratio/high_mean": 0.0008275798954855418, "clip_ratio/low_mean": 0.0005981316789984703, "clip_ratio/low_min": 2.725570902839536e-05, "clip_ratio/region_mean": 0.0014257116017688531, "epoch": 0.12179969550076125, "grad_norm": 0.12431085109710693, "learning_rate": 2e-07, "loss": -0.0124, "step": 1305 }, { "clip_ratio/high_max": 0.00199195952154696, "clip_ratio/high_mean": 0.0008900863995222608, "clip_ratio/low_mean": 0.0006659560604020953, "clip_ratio/low_min": 4.803826504939934e-05, "clip_ratio/region_mean": 0.001556042472657282, "epoch": 0.12189302860076183, "grad_norm": 0.11198938637971878, "learning_rate": 2e-07, "loss": 0.0202, "step": 1306 }, { "clip_ratio/high_max": 0.001976894898689352, "clip_ratio/high_mean": 0.000800876285211416, "clip_ratio/low_mean": 0.000678934427924105, "clip_ratio/low_min": 3.11717931253952e-05, "clip_ratio/region_mean": 0.0014798107549722772, "epoch": 0.12198636170076241, "grad_norm": 0.11416193842887878, "learning_rate": 2e-07, "loss": 0.0107, "step": 1307 }, { "clip_ratio/high_max": 0.0017797157597669866, "clip_ratio/high_mean": 0.0008009411285456736, "clip_ratio/low_mean": 0.0006502323967652046, "clip_ratio/low_min": 6.77673851896543e-05, "clip_ratio/region_mean": 0.001451173553505214, "epoch": 0.122079694800763, "grad_norm": 0.12489336729049683, "learning_rate": 2e-07, "loss": 0.0061, "step": 1308 }, { "clip_ratio/high_max": 0.002262069618154783, "clip_ratio/high_mean": 0.0009238261827704264, "clip_ratio/low_mean": 0.0006869185526738875, "clip_ratio/low_min": 4.555833584163338e-05, "clip_ratio/region_mean": 0.0016107447518152185, "epoch": 0.12217302790076358, "grad_norm": 0.10739597678184509, "learning_rate": 2e-07, "loss": -0.0024, "step": 1309 }, { "clip_ratio/high_max": 0.0019352532690390944, "clip_ratio/high_mean": 0.0007492706718039699, "clip_ratio/low_mean": 0.0007993404014996486, "clip_ratio/low_min": 1.4479323908744846e-05, "clip_ratio/region_mean": 0.0015486111005884595, "epoch": 0.12226636100076417, "grad_norm": 0.10822403430938721, "learning_rate": 2e-07, "loss": 0.06, "step": 1310 }, { "clip_ratio/high_max": 0.0020146769820712507, "clip_ratio/high_mean": 0.0008131334361678455, "clip_ratio/low_mean": 0.0007048316383588826, "clip_ratio/low_min": 0.000101008989076945, "clip_ratio/region_mean": 0.0015179650727077387, "epoch": 0.12235969410076475, "grad_norm": 0.11638078093528748, "learning_rate": 2e-07, "loss": 0.0394, "step": 1311 }, { "clip_ratio/high_max": 0.0019140009899274446, "clip_ratio/high_mean": 0.0007973179544933373, "clip_ratio/low_mean": 0.0007648816044820705, "clip_ratio/low_min": 1.7715419744490646e-05, "clip_ratio/region_mean": 0.0015621995626133867, "epoch": 0.12245302720076533, "grad_norm": 0.11824315786361694, "learning_rate": 2e-07, "loss": 0.0554, "step": 1312 }, { "clip_ratio/high_max": 0.0019488194666337222, "clip_ratio/high_mean": 0.0008056914521148428, "clip_ratio/low_mean": 0.0007476858609152259, "clip_ratio/low_min": 0.00011086229596912744, "clip_ratio/region_mean": 0.0015533772930211853, "epoch": 0.12254636030076592, "grad_norm": 0.13050085306167603, "learning_rate": 2e-07, "loss": 0.0291, "step": 1313 }, { "clip_ratio/high_max": 0.0017312336349277757, "clip_ratio/high_mean": 0.0007407043121929746, "clip_ratio/low_mean": 0.0006735342049069004, "clip_ratio/low_min": 3.3115506084868684e-05, "clip_ratio/region_mean": 0.0014142385043669492, "epoch": 0.1226396934007665, "grad_norm": 0.09814959019422531, "learning_rate": 2e-07, "loss": 0.0196, "step": 1314 }, { "clip_ratio/high_max": 0.0018504586405470036, "clip_ratio/high_mean": 0.000805423449492082, "clip_ratio/low_mean": 0.0008105913548206445, "clip_ratio/low_min": 0.00011086061749665532, "clip_ratio/region_mean": 0.0016160148261405993, "epoch": 0.12273302650076708, "grad_norm": 0.13023895025253296, "learning_rate": 2e-07, "loss": 0.0167, "step": 1315 }, { "clip_ratio/high_max": 0.0018706200280576013, "clip_ratio/high_mean": 0.000772117589804111, "clip_ratio/low_mean": 0.0006118500023148954, "clip_ratio/low_min": 1.3598781151813455e-05, "clip_ratio/region_mean": 0.001383967599394964, "epoch": 0.12282635960076767, "grad_norm": 0.10273943841457367, "learning_rate": 2e-07, "loss": 0.0051, "step": 1316 }, { "clip_ratio/high_max": 0.0019135317161271814, "clip_ratio/high_mean": 0.0008217557387979468, "clip_ratio/low_mean": 0.0008032238802115899, "clip_ratio/low_min": 1.8677554180612788e-05, "clip_ratio/region_mean": 0.0016249796317424625, "epoch": 0.12291969270076825, "grad_norm": 0.121872678399086, "learning_rate": 2e-07, "loss": 0.0373, "step": 1317 }, { "clip_ratio/high_max": 0.0019634568234323524, "clip_ratio/high_mean": 0.000739400262318668, "clip_ratio/low_mean": 0.0008409292750002351, "clip_ratio/low_min": 2.7838242203870323e-05, "clip_ratio/region_mean": 0.0015803295536898077, "epoch": 0.12301302580076884, "grad_norm": 0.12631100416183472, "learning_rate": 2e-07, "loss": 0.0486, "step": 1318 }, { "clip_ratio/high_max": 0.0017509164827060886, "clip_ratio/high_mean": 0.0006088771024224116, "clip_ratio/low_mean": 0.0008602916441304842, "clip_ratio/low_min": 5.470852192956954e-05, "clip_ratio/region_mean": 0.0014691687465528958, "epoch": 0.12310635890076942, "grad_norm": 0.11109542846679688, "learning_rate": 2e-07, "loss": 0.0654, "step": 1319 }, { "clip_ratio/high_max": 0.0018388596108707134, "clip_ratio/high_mean": 0.0008008454296941636, "clip_ratio/low_mean": 0.0009000296031445032, "clip_ratio/low_min": 3.5915950775233796e-05, "clip_ratio/region_mean": 0.0017008750000968575, "epoch": 0.12319969200077, "grad_norm": 0.10932740569114685, "learning_rate": 2e-07, "loss": 0.0778, "step": 1320 }, { "clip_ratio/high_max": 0.0020189276692690328, "clip_ratio/high_mean": 0.0007975131939019775, "clip_ratio/low_mean": 0.000674091701512225, "clip_ratio/low_min": 5.92733940720791e-05, "clip_ratio/region_mean": 0.0014716048535774462, "epoch": 0.12329302510077059, "grad_norm": 0.11329285055398941, "learning_rate": 2e-07, "loss": 0.0373, "step": 1321 }, { "clip_ratio/high_max": 0.001719163792586187, "clip_ratio/high_mean": 0.0007870773515605833, "clip_ratio/low_mean": 0.0007668163343623746, "clip_ratio/low_min": 3.931189257855294e-05, "clip_ratio/region_mean": 0.0015538936931989156, "epoch": 0.12338635820077117, "grad_norm": 0.10936406999826431, "learning_rate": 2e-07, "loss": 0.0477, "step": 1322 }, { "clip_ratio/high_max": 0.0020099618450331036, "clip_ratio/high_mean": 0.0008026376217458164, "clip_ratio/low_mean": 0.000672098563882173, "clip_ratio/low_min": 8.032417463255115e-05, "clip_ratio/region_mean": 0.0014747361601621378, "epoch": 0.12347969130077174, "grad_norm": 0.11646878719329834, "learning_rate": 2e-07, "loss": -0.0352, "step": 1323 }, { "clip_ratio/high_max": 0.0018599412142066285, "clip_ratio/high_mean": 0.0007940567884361371, "clip_ratio/low_mean": 0.0007120338723325403, "clip_ratio/low_min": 1.1993859516223893e-05, "clip_ratio/region_mean": 0.0015060906735016033, "epoch": 0.12357302440077234, "grad_norm": 0.11073994636535645, "learning_rate": 2e-07, "loss": 0.0121, "step": 1324 }, { "clip_ratio/high_max": 0.002135036622348707, "clip_ratio/high_mean": 0.000890463566975086, "clip_ratio/low_mean": 0.0007381301566056209, "clip_ratio/low_min": 2.404101542197168e-05, "clip_ratio/region_mean": 0.0016285937235807069, "epoch": 0.12366635750077291, "grad_norm": 0.11253755539655685, "learning_rate": 2e-07, "loss": -0.0309, "step": 1325 }, { "clip_ratio/high_max": 0.0018998489176738076, "clip_ratio/high_mean": 0.0007989315809027175, "clip_ratio/low_mean": 0.0008088099602900911, "clip_ratio/low_min": 5.2774474170291796e-05, "clip_ratio/region_mean": 0.0016077415457402822, "epoch": 0.12375969060077349, "grad_norm": 0.11740503460168839, "learning_rate": 2e-07, "loss": 0.0169, "step": 1326 }, { "clip_ratio/high_max": 0.0022139619977679104, "clip_ratio/high_mean": 0.0008775857431828626, "clip_ratio/low_mean": 0.0008328584171977127, "clip_ratio/low_min": 5.653375592373777e-05, "clip_ratio/region_mean": 0.0017104441576520912, "epoch": 0.12385302370077408, "grad_norm": 0.12344039231538773, "learning_rate": 2e-07, "loss": 0.0062, "step": 1327 }, { "clip_ratio/high_max": 0.0023019051222945563, "clip_ratio/high_mean": 0.0008459249256702606, "clip_ratio/low_mean": 0.0008911171516956529, "clip_ratio/low_min": 4.2282475988031365e-05, "clip_ratio/region_mean": 0.0017370420682709664, "epoch": 0.12394635680077466, "grad_norm": 0.10999125242233276, "learning_rate": 2e-07, "loss": 0.0505, "step": 1328 }, { "clip_ratio/high_max": 0.0018589935534691904, "clip_ratio/high_mean": 0.0007180971915659029, "clip_ratio/low_mean": 0.0008852310488691728, "clip_ratio/low_min": 0.00010674968598323176, "clip_ratio/region_mean": 0.001603328259079717, "epoch": 0.12403968990077525, "grad_norm": 0.11771617084741592, "learning_rate": 2e-07, "loss": 0.0446, "step": 1329 }, { "clip_ratio/high_max": 0.0020248024666216224, "clip_ratio/high_mean": 0.0007161255507526221, "clip_ratio/low_mean": 0.0007925977224658709, "clip_ratio/low_min": 2.605602639960125e-05, "clip_ratio/region_mean": 0.0015087232895893976, "epoch": 0.12413302300077583, "grad_norm": 0.09847821295261383, "learning_rate": 2e-07, "loss": 0.058, "step": 1330 }, { "clip_ratio/high_max": 0.002107880820403807, "clip_ratio/high_mean": 0.0008424481393376482, "clip_ratio/low_mean": 0.000729685691112536, "clip_ratio/low_min": 6.482567459897837e-05, "clip_ratio/region_mean": 0.0015721338277217, "epoch": 0.12422635610077641, "grad_norm": 0.11891872435808182, "learning_rate": 2e-07, "loss": 0.0286, "step": 1331 }, { "clip_ratio/high_max": 0.0021182078344281763, "clip_ratio/high_mean": 0.0008850360663927859, "clip_ratio/low_mean": 0.0007166761060943827, "clip_ratio/low_min": 2.9308323064469732e-05, "clip_ratio/region_mean": 0.0016017121670302004, "epoch": 0.124319689200777, "grad_norm": 0.11174578964710236, "learning_rate": 2e-07, "loss": -0.0569, "step": 1332 }, { "clip_ratio/high_max": 0.0019496309469104744, "clip_ratio/high_mean": 0.0008736768668313744, "clip_ratio/low_mean": 0.0008197153219953179, "clip_ratio/low_min": 3.104044299107045e-05, "clip_ratio/region_mean": 0.0016933921724557877, "epoch": 0.12441302230077758, "grad_norm": 0.1273231953382492, "learning_rate": 2e-07, "loss": 0.022, "step": 1333 }, { "clip_ratio/high_max": 0.001964032941032201, "clip_ratio/high_mean": 0.0007847272299841279, "clip_ratio/low_mean": 0.0007582127218483947, "clip_ratio/low_min": 2.7267023142485414e-05, "clip_ratio/region_mean": 0.0015429399645654485, "epoch": 0.12450635540077816, "grad_norm": 0.11268296837806702, "learning_rate": 2e-07, "loss": 0.0208, "step": 1334 }, { "clip_ratio/high_max": 0.0016437351805507205, "clip_ratio/high_mean": 0.0007942922802612884, "clip_ratio/low_mean": 0.0007324452544708038, "clip_ratio/low_min": 5.3376370487967506e-05, "clip_ratio/region_mean": 0.0015267375056282617, "epoch": 0.12459968850077875, "grad_norm": 0.11572766304016113, "learning_rate": 2e-07, "loss": 0.0419, "step": 1335 }, { "clip_ratio/high_max": 0.0022419536762754433, "clip_ratio/high_mean": 0.0008681780818733387, "clip_ratio/low_mean": 0.0007631867629243061, "clip_ratio/low_min": 4.932762931275647e-05, "clip_ratio/region_mean": 0.001631364822969772, "epoch": 0.12469302160077933, "grad_norm": 0.1116037517786026, "learning_rate": 2e-07, "loss": 0.0454, "step": 1336 }, { "clip_ratio/high_max": 0.0019251447592978366, "clip_ratio/high_mean": 0.0008934832221711986, "clip_ratio/low_mean": 0.0009079969877348049, "clip_ratio/low_min": 6.7823759309249e-05, "clip_ratio/region_mean": 0.0018014802008110564, "epoch": 0.12478635470077991, "grad_norm": 0.13691624999046326, "learning_rate": 2e-07, "loss": -0.0006, "step": 1337 }, { "clip_ratio/high_max": 0.0019187659563613124, "clip_ratio/high_mean": 0.0007910221565907705, "clip_ratio/low_mean": 0.0008070780895650387, "clip_ratio/low_min": 8.765063557802932e-05, "clip_ratio/region_mean": 0.0015981002579792403, "epoch": 0.1248796878007805, "grad_norm": 0.11461508274078369, "learning_rate": 2e-07, "loss": 0.0064, "step": 1338 }, { "clip_ratio/high_max": 0.002006720857025357, "clip_ratio/high_mean": 0.0007753497811791021, "clip_ratio/low_mean": 0.0007955997098179068, "clip_ratio/low_min": 4.210306087770732e-05, "clip_ratio/region_mean": 0.001570949490997009, "epoch": 0.12497302090078108, "grad_norm": 0.10362855345010757, "learning_rate": 2e-07, "loss": 0.0203, "step": 1339 }, { "clip_ratio/high_max": 0.0019034137912967708, "clip_ratio/high_mean": 0.0007742341531411512, "clip_ratio/low_mean": 0.0008003267230378697, "clip_ratio/low_min": 4.327625174482819e-05, "clip_ratio/region_mean": 0.0015745608652650844, "epoch": 0.12506635400078167, "grad_norm": 0.10168452560901642, "learning_rate": 2e-07, "loss": 0.0207, "step": 1340 }, { "clip_ratio/high_max": 0.0018485786349629052, "clip_ratio/high_mean": 0.0008419820387643995, "clip_ratio/low_mean": 0.0007919491963548353, "clip_ratio/low_min": 2.632371979416348e-05, "clip_ratio/region_mean": 0.0016339312605850864, "epoch": 0.12515968710078224, "grad_norm": 0.104018434882164, "learning_rate": 2e-07, "loss": 0.0221, "step": 1341 }, { "clip_ratio/high_max": 0.001992455541767413, "clip_ratio/high_mean": 0.0007964157630340196, "clip_ratio/low_mean": 0.0008396405755775049, "clip_ratio/low_min": 8.004526171134785e-05, "clip_ratio/region_mean": 0.0016360563604393974, "epoch": 0.12525302020078283, "grad_norm": 0.11589255183935165, "learning_rate": 2e-07, "loss": 0.004, "step": 1342 }, { "clip_ratio/high_max": 0.0022969185301917605, "clip_ratio/high_mean": 0.0008733358845347539, "clip_ratio/low_mean": 0.0007875369974499336, "clip_ratio/low_min": 9.361048705613939e-05, "clip_ratio/region_mean": 0.0016608728474238887, "epoch": 0.12534635330078342, "grad_norm": 0.12406916171312332, "learning_rate": 2e-07, "loss": 0.0453, "step": 1343 }, { "clip_ratio/high_max": 0.0019710665292222984, "clip_ratio/high_mean": 0.0008206484562833793, "clip_ratio/low_mean": 0.0007231691124616191, "clip_ratio/low_min": 5.45953344044392e-05, "clip_ratio/region_mean": 0.001543817539641168, "epoch": 0.125439686400784, "grad_norm": 0.10222864151000977, "learning_rate": 2e-07, "loss": 0.0209, "step": 1344 }, { "clip_ratio/high_max": 0.001744320023135515, "clip_ratio/high_mean": 0.0007084503531586961, "clip_ratio/low_mean": 0.0008621361521363724, "clip_ratio/low_min": 1.6756031982367858e-05, "clip_ratio/region_mean": 0.0015705865116615314, "epoch": 0.12553301950078458, "grad_norm": 0.12423655390739441, "learning_rate": 2e-07, "loss": 0.0253, "step": 1345 }, { "clip_ratio/high_max": 0.0019296712926006876, "clip_ratio/high_mean": 0.0007393226733256597, "clip_ratio/low_mean": 0.0008750409142521676, "clip_ratio/low_min": 6.293658589129336e-05, "clip_ratio/region_mean": 0.0016143635803018697, "epoch": 0.12562635260078517, "grad_norm": 0.11862718313932419, "learning_rate": 2e-07, "loss": 0.0521, "step": 1346 }, { "clip_ratio/high_max": 0.0019521245012583677, "clip_ratio/high_mean": 0.0007952720461616991, "clip_ratio/low_mean": 0.0008362513908650726, "clip_ratio/low_min": 5.358497946872376e-05, "clip_ratio/region_mean": 0.0016315234461217187, "epoch": 0.12571968570078576, "grad_norm": 0.11597266793251038, "learning_rate": 2e-07, "loss": 0.0573, "step": 1347 }, { "clip_ratio/high_max": 0.0021935147378826514, "clip_ratio/high_mean": 0.0008777333023317624, "clip_ratio/low_mean": 0.0008727461772650713, "clip_ratio/low_min": 7.596710293000797e-05, "clip_ratio/region_mean": 0.001750479481415823, "epoch": 0.12581301880078632, "grad_norm": 0.11926323920488358, "learning_rate": 2e-07, "loss": 0.0155, "step": 1348 }, { "clip_ratio/high_max": 0.001696984596492257, "clip_ratio/high_mean": 0.0007343245006268262, "clip_ratio/low_mean": 0.0007927610204205848, "clip_ratio/low_min": 2.4996666979859583e-05, "clip_ratio/region_mean": 0.0015270855474227574, "epoch": 0.12590635190078692, "grad_norm": 0.11394165456295013, "learning_rate": 2e-07, "loss": 0.0257, "step": 1349 }, { "clip_ratio/high_max": 0.0017198930472659413, "clip_ratio/high_mean": 0.0006548472865688382, "clip_ratio/low_mean": 0.0009312796737503959, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.001586126978509128, "epoch": 0.1259996850007875, "grad_norm": 0.13544532656669617, "learning_rate": 2e-07, "loss": 0.0522, "step": 1350 }, { "clip_ratio/high_max": 0.0017238400887436, "clip_ratio/high_mean": 0.0006778573388146469, "clip_ratio/low_mean": 0.0008407142959185876, "clip_ratio/low_min": 3.163672408845741e-05, "clip_ratio/region_mean": 0.0015185716474661604, "epoch": 0.12609301810078807, "grad_norm": 0.12109499424695969, "learning_rate": 2e-07, "loss": 0.0754, "step": 1351 }, { "clip_ratio/high_max": 0.001900982271763496, "clip_ratio/high_mean": 0.000703891417288105, "clip_ratio/low_mean": 0.0009812156240514014, "clip_ratio/low_min": 9.24032451621315e-05, "clip_ratio/region_mean": 0.0016851070176926441, "epoch": 0.12618635120078867, "grad_norm": 0.1227816715836525, "learning_rate": 2e-07, "loss": 0.0688, "step": 1352 }, { "clip_ratio/high_max": 0.0018113867517968174, "clip_ratio/high_mean": 0.0007505493467760971, "clip_ratio/low_mean": 0.0008484310710628051, "clip_ratio/low_min": 0.00015394354522868525, "clip_ratio/region_mean": 0.0015989804596756585, "epoch": 0.12627968430078926, "grad_norm": 0.12363375723361969, "learning_rate": 2e-07, "loss": 0.0145, "step": 1353 }, { "clip_ratio/high_max": 0.001879474839370232, "clip_ratio/high_mean": 0.0008216540009016171, "clip_ratio/low_mean": 0.0007710950485488866, "clip_ratio/low_min": 4.2583806134643964e-05, "clip_ratio/region_mean": 0.0015927489948808216, "epoch": 0.12637301740078982, "grad_norm": 0.11476366221904755, "learning_rate": 2e-07, "loss": -0.0056, "step": 1354 }, { "clip_ratio/high_max": 0.001902898682601517, "clip_ratio/high_mean": 0.0008166079587681452, "clip_ratio/low_mean": 0.0008785147801972926, "clip_ratio/low_min": 0.00012305654672672972, "clip_ratio/region_mean": 0.001695122744422406, "epoch": 0.12646635050079041, "grad_norm": 0.12615498900413513, "learning_rate": 2e-07, "loss": 0.0218, "step": 1355 }, { "clip_ratio/high_max": 0.0016254130714514758, "clip_ratio/high_mean": 0.0006449857155530481, "clip_ratio/low_mean": 0.0008349606105184648, "clip_ratio/low_min": 3.813054718193598e-05, "clip_ratio/region_mean": 0.0014799463460803963, "epoch": 0.126559683600791, "grad_norm": 0.10438607633113861, "learning_rate": 2e-07, "loss": 0.0566, "step": 1356 }, { "clip_ratio/high_max": 0.0018869786981667858, "clip_ratio/high_mean": 0.0008093931273833732, "clip_ratio/low_mean": 0.0008076961639744695, "clip_ratio/low_min": 6.509423110401258e-05, "clip_ratio/region_mean": 0.0016170892595255282, "epoch": 0.12665301670079157, "grad_norm": 0.17984412610530853, "learning_rate": 2e-07, "loss": 0.0551, "step": 1357 }, { "clip_ratio/high_max": 0.002043806714937091, "clip_ratio/high_mean": 0.0008907688243198209, "clip_ratio/low_mean": 0.0008046686853049323, "clip_ratio/low_min": 5.99684462940786e-05, "clip_ratio/region_mean": 0.0016954375169007108, "epoch": 0.12674634980079216, "grad_norm": 0.11563490331172943, "learning_rate": 2e-07, "loss": 0.0395, "step": 1358 }, { "clip_ratio/high_max": 0.001947351367562078, "clip_ratio/high_mean": 0.0009166836898657493, "clip_ratio/low_mean": 0.0006928579477971653, "clip_ratio/low_min": 2.8569049391080625e-05, "clip_ratio/region_mean": 0.00160954162129201, "epoch": 0.12683968290079276, "grad_norm": 0.12137407809495926, "learning_rate": 2e-07, "loss": -0.0323, "step": 1359 }, { "clip_ratio/high_max": 0.001947672171809245, "clip_ratio/high_mean": 0.0006809177375544095, "clip_ratio/low_mean": 0.0007939507759147091, "clip_ratio/low_min": 1.3607664186565671e-05, "clip_ratio/region_mean": 0.0014748685280210339, "epoch": 0.12693301600079332, "grad_norm": 0.11899052560329437, "learning_rate": 2e-07, "loss": 0.0546, "step": 1360 }, { "clip_ratio/high_max": 0.001995060742046917, "clip_ratio/high_mean": 0.000850983424243168, "clip_ratio/low_mean": 0.0008002845079317922, "clip_ratio/low_min": 0.00010585146992525551, "clip_ratio/region_mean": 0.0016512679467268754, "epoch": 0.1270263491007939, "grad_norm": 0.11994443833827972, "learning_rate": 2e-07, "loss": 0.0214, "step": 1361 }, { "clip_ratio/high_max": 0.0017821453511714935, "clip_ratio/high_mean": 0.0006969243186176755, "clip_ratio/low_mean": 0.0007804116576153319, "clip_ratio/low_min": 6.842797938588774e-05, "clip_ratio/region_mean": 0.0014773359689570498, "epoch": 0.1271196822007945, "grad_norm": 0.11319860816001892, "learning_rate": 2e-07, "loss": 0.0042, "step": 1362 }, { "clip_ratio/high_max": 0.001954909967025742, "clip_ratio/high_mean": 0.0008259686655947007, "clip_ratio/low_mean": 0.0008877356685843552, "clip_ratio/low_min": 3.052798729186179e-05, "clip_ratio/region_mean": 0.0017137042887043208, "epoch": 0.12721301530079507, "grad_norm": 0.11658068001270294, "learning_rate": 2e-07, "loss": 0.0795, "step": 1363 }, { "clip_ratio/high_max": 0.0020592361252056435, "clip_ratio/high_mean": 0.00086695232312195, "clip_ratio/low_mean": 0.0008231270458054496, "clip_ratio/low_min": 0.00015492898910451913, "clip_ratio/region_mean": 0.0016900793671084102, "epoch": 0.12730634840079566, "grad_norm": 0.10606466978788376, "learning_rate": 2e-07, "loss": 0.0131, "step": 1364 }, { "clip_ratio/high_max": 0.0016039220645325258, "clip_ratio/high_mean": 0.0007197350259957602, "clip_ratio/low_mean": 0.0008865467389114201, "clip_ratio/low_min": 4.5338552808971144e-05, "clip_ratio/region_mean": 0.0016062817703641485, "epoch": 0.12739968150079625, "grad_norm": 0.843982994556427, "learning_rate": 2e-07, "loss": 0.0623, "step": 1365 }, { "clip_ratio/high_max": 0.0018291545566171408, "clip_ratio/high_mean": 0.0008289910383609822, "clip_ratio/low_mean": 0.0008150193898472935, "clip_ratio/low_min": 8.07268443168141e-05, "clip_ratio/region_mean": 0.001644010451855138, "epoch": 0.12749301460079684, "grad_norm": 0.12914171814918518, "learning_rate": 2e-07, "loss": -0.0083, "step": 1366 }, { "clip_ratio/high_max": 0.00210142316063866, "clip_ratio/high_mean": 0.0007961212158988928, "clip_ratio/low_mean": 0.0009216088046741788, "clip_ratio/low_min": 8.545851960661821e-05, "clip_ratio/region_mean": 0.0017177300251205452, "epoch": 0.1275863477007974, "grad_norm": 0.121550552546978, "learning_rate": 2e-07, "loss": 0.0294, "step": 1367 }, { "clip_ratio/high_max": 0.0019436086186033208, "clip_ratio/high_mean": 0.0008264223379228497, "clip_ratio/low_mean": 0.000956607133957732, "clip_ratio/low_min": 8.771960983722238e-05, "clip_ratio/region_mean": 0.0017830295037128963, "epoch": 0.127679680800798, "grad_norm": 0.12034498155117035, "learning_rate": 2e-07, "loss": 0.0405, "step": 1368 }, { "clip_ratio/high_max": 0.002366542070376454, "clip_ratio/high_mean": 0.0009092929813050432, "clip_ratio/low_mean": 0.0008590921406721463, "clip_ratio/low_min": 6.484520417870954e-05, "clip_ratio/region_mean": 0.001768385096511338, "epoch": 0.1277730139007986, "grad_norm": 0.11182699352502823, "learning_rate": 2e-07, "loss": 0.0324, "step": 1369 }, { "clip_ratio/high_max": 0.0019343640633451287, "clip_ratio/high_mean": 0.0007515680572396377, "clip_ratio/low_mean": 0.0008977384550235001, "clip_ratio/low_min": 6.996171214268543e-05, "clip_ratio/region_mean": 0.0016493065122631378, "epoch": 0.12786634700079916, "grad_norm": 0.1282419115304947, "learning_rate": 2e-07, "loss": 0.0456, "step": 1370 }, { "clip_ratio/high_max": 0.0018687982446863316, "clip_ratio/high_mean": 0.0007957882071423228, "clip_ratio/low_mean": 0.0010032841782958712, "clip_ratio/low_min": 0.0001506550015619723, "clip_ratio/region_mean": 0.0017990724081755616, "epoch": 0.12795968010079975, "grad_norm": 0.13035976886749268, "learning_rate": 2e-07, "loss": 0.0422, "step": 1371 }, { "clip_ratio/high_max": 0.0017985887097893283, "clip_ratio/high_mean": 0.0007372637192020193, "clip_ratio/low_mean": 0.0008413499817834236, "clip_ratio/low_min": 7.533705684181768e-05, "clip_ratio/region_mean": 0.0015786137009854428, "epoch": 0.12805301320080034, "grad_norm": 0.1623329371213913, "learning_rate": 2e-07, "loss": 0.0464, "step": 1372 }, { "clip_ratio/high_max": 0.002135154551069718, "clip_ratio/high_mean": 0.0008657198250148213, "clip_ratio/low_mean": 0.0008392841700697318, "clip_ratio/low_min": 1.162358148576459e-05, "clip_ratio/region_mean": 0.0017050039969035424, "epoch": 0.1281463463008009, "grad_norm": 0.11920281499624252, "learning_rate": 2e-07, "loss": 0.0249, "step": 1373 }, { "clip_ratio/high_max": 0.00228666751718265, "clip_ratio/high_mean": 0.0008101774064925849, "clip_ratio/low_mean": 0.0010114672950294334, "clip_ratio/low_min": 0.00019415795395616442, "clip_ratio/region_mean": 0.001821644720621407, "epoch": 0.1282396794008015, "grad_norm": 0.12889491021633148, "learning_rate": 2e-07, "loss": 0.0287, "step": 1374 }, { "clip_ratio/high_max": 0.001978518113901373, "clip_ratio/high_mean": 0.0008065135370998178, "clip_ratio/low_mean": 0.0008249698521467508, "clip_ratio/low_min": 5.6722374210949056e-05, "clip_ratio/region_mean": 0.0016314834574586712, "epoch": 0.1283330125008021, "grad_norm": 0.119633749127388, "learning_rate": 2e-07, "loss": 0.0136, "step": 1375 }, { "clip_ratio/high_max": 0.0017309194481640588, "clip_ratio/high_mean": 0.0006493311093436205, "clip_ratio/low_mean": 0.0008063004042924149, "clip_ratio/low_min": 2.8154799110780004e-05, "clip_ratio/region_mean": 0.00145563151454553, "epoch": 0.12842634560080265, "grad_norm": 0.10172529518604279, "learning_rate": 2e-07, "loss": 0.0196, "step": 1376 }, { "clip_ratio/high_max": 0.001866466864157701, "clip_ratio/high_mean": 0.0007752442215860356, "clip_ratio/low_mean": 0.0007749105807306478, "clip_ratio/low_min": 5.425374365586322e-05, "clip_ratio/region_mean": 0.0015501547823078, "epoch": 0.12851967870080325, "grad_norm": 0.11901126056909561, "learning_rate": 2e-07, "loss": 0.0471, "step": 1377 }, { "clip_ratio/high_max": 0.0020305791331338696, "clip_ratio/high_mean": 0.0007855076837586239, "clip_ratio/low_mean": 0.0008952132502599852, "clip_ratio/low_min": 5.849377612321405e-05, "clip_ratio/region_mean": 0.0016807209613034502, "epoch": 0.12861301180080384, "grad_norm": 0.1198928952217102, "learning_rate": 2e-07, "loss": 0.0374, "step": 1378 }, { "clip_ratio/high_max": 0.0015008701157057658, "clip_ratio/high_mean": 0.0006661140505457297, "clip_ratio/low_mean": 0.0010226668146060547, "clip_ratio/low_min": 6.821769329690142e-05, "clip_ratio/region_mean": 0.001688780845142901, "epoch": 0.1287063449008044, "grad_norm": 0.11290942877531052, "learning_rate": 2e-07, "loss": 0.0739, "step": 1379 }, { "clip_ratio/high_max": 0.001983251506317174, "clip_ratio/high_mean": 0.0008443498263659421, "clip_ratio/low_mean": 0.0008328299700224306, "clip_ratio/low_min": 7.496846774301957e-05, "clip_ratio/region_mean": 0.0016771797818364576, "epoch": 0.128799678000805, "grad_norm": 0.11423109471797943, "learning_rate": 2e-07, "loss": 0.0138, "step": 1380 }, { "clip_ratio/high_max": 0.0020995248523831833, "clip_ratio/high_mean": 0.00087003310181899, "clip_ratio/low_mean": 0.000675805797072826, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0015458388916158583, "epoch": 0.1288930111008056, "grad_norm": 0.11436010897159576, "learning_rate": 2e-07, "loss": -0.0446, "step": 1381 }, { "clip_ratio/high_max": 0.0019688259053509682, "clip_ratio/high_mean": 0.0008213131477532443, "clip_ratio/low_mean": 0.000590219769946998, "clip_ratio/low_min": 4.0555058149038814e-05, "clip_ratio/region_mean": 0.001411532939528115, "epoch": 0.12898634420080615, "grad_norm": 0.108339823782444, "learning_rate": 2e-07, "loss": 0.0006, "step": 1382 }, { "clip_ratio/high_max": 0.001881070558738429, "clip_ratio/high_mean": 0.0007644221295777243, "clip_ratio/low_mean": 0.0009268050416721962, "clip_ratio/low_min": 5.833477189298719e-05, "clip_ratio/region_mean": 0.0016912271385081112, "epoch": 0.12907967730080674, "grad_norm": 0.10900482535362244, "learning_rate": 2e-07, "loss": 0.0326, "step": 1383 }, { "clip_ratio/high_max": 0.0017810699355322868, "clip_ratio/high_mean": 0.0007846378794056363, "clip_ratio/low_mean": 0.0009189346419589128, "clip_ratio/low_min": 0.00021171450862311758, "clip_ratio/region_mean": 0.0017035725031746551, "epoch": 0.12917301040080734, "grad_norm": 0.129139244556427, "learning_rate": 2e-07, "loss": 0.0308, "step": 1384 }, { "clip_ratio/high_max": 0.0021921206134720705, "clip_ratio/high_mean": 0.0007737524829281028, "clip_ratio/low_mean": 0.0008307507887366228, "clip_ratio/low_min": 5.058836268290179e-05, "clip_ratio/region_mean": 0.0016045032389229164, "epoch": 0.1292663435008079, "grad_norm": 0.10910157859325409, "learning_rate": 2e-07, "loss": 0.0675, "step": 1385 }, { "clip_ratio/high_max": 0.002048816837486811, "clip_ratio/high_mean": 0.0008342174132849323, "clip_ratio/low_mean": 0.000801860758656403, "clip_ratio/low_min": 4.7279774662456475e-05, "clip_ratio/region_mean": 0.0016360781737603247, "epoch": 0.1293596766008085, "grad_norm": 0.12120600044727325, "learning_rate": 2e-07, "loss": -0.0048, "step": 1386 }, { "clip_ratio/high_max": 0.0019853022786264773, "clip_ratio/high_mean": 0.000771567541960394, "clip_ratio/low_mean": 0.00091455184519873, "clip_ratio/low_min": 0.00011517951406858629, "clip_ratio/region_mean": 0.0016861193580552936, "epoch": 0.12945300970080909, "grad_norm": 0.12327404320240021, "learning_rate": 2e-07, "loss": 0.0508, "step": 1387 }, { "clip_ratio/high_max": 0.0023137271200539544, "clip_ratio/high_mean": 0.0009077252252609469, "clip_ratio/low_mean": 0.0009236120058631059, "clip_ratio/low_min": 0.00010793218189064646, "clip_ratio/region_mean": 0.0018313371983822435, "epoch": 0.12954634280080968, "grad_norm": 0.12423425167798996, "learning_rate": 2e-07, "loss": 0.0205, "step": 1388 }, { "clip_ratio/high_max": 0.002105442494212184, "clip_ratio/high_mean": 0.0008330524597113254, "clip_ratio/low_mean": 0.0007312409579753876, "clip_ratio/low_min": 2.134198439307511e-05, "clip_ratio/region_mean": 0.0015642934231436811, "epoch": 0.12963967590081024, "grad_norm": 0.10687970370054245, "learning_rate": 2e-07, "loss": -0.006, "step": 1389 }, { "clip_ratio/high_max": 0.0019074811098107602, "clip_ratio/high_mean": 0.0007050114563753596, "clip_ratio/low_mean": 0.0007939244715089444, "clip_ratio/low_min": 0.00012383759440126596, "clip_ratio/region_mean": 0.0014989359478931874, "epoch": 0.12973300900081083, "grad_norm": 0.12760306894779205, "learning_rate": 2e-07, "loss": 0.0357, "step": 1390 }, { "clip_ratio/high_max": 0.001898354254080914, "clip_ratio/high_mean": 0.0007583394872199278, "clip_ratio/low_mean": 0.0010159825378650567, "clip_ratio/low_min": 1.27577059174655e-05, "clip_ratio/region_mean": 0.0017743220014381222, "epoch": 0.12982634210081143, "grad_norm": 0.12471260875463486, "learning_rate": 2e-07, "loss": 0.0444, "step": 1391 }, { "clip_ratio/high_max": 0.001985157337912824, "clip_ratio/high_mean": 0.0008023914833756862, "clip_ratio/low_mean": 0.0009106786037591519, "clip_ratio/low_min": 0.00015100621112651424, "clip_ratio/region_mean": 0.0017130701162386686, "epoch": 0.129919675200812, "grad_norm": 0.1151493489742279, "learning_rate": 2e-07, "loss": 0.0235, "step": 1392 }, { "clip_ratio/high_max": 0.0020410348879522644, "clip_ratio/high_mean": 0.0008071577321970835, "clip_ratio/low_mean": 0.0008693257223058026, "clip_ratio/low_min": 0.0001162223297797027, "clip_ratio/region_mean": 0.0016764834799687378, "epoch": 0.13001300830081258, "grad_norm": 0.127003476023674, "learning_rate": 2e-07, "loss": 0.0031, "step": 1393 }, { "clip_ratio/high_max": 0.0019196809516870417, "clip_ratio/high_mean": 0.0007679477985220728, "clip_ratio/low_mean": 0.000835339909826871, "clip_ratio/low_min": 0.000127444752251904, "clip_ratio/region_mean": 0.0016032877101679333, "epoch": 0.13010634140081317, "grad_norm": 0.11123500764369965, "learning_rate": 2e-07, "loss": 0.0331, "step": 1394 }, { "clip_ratio/high_max": 0.0019755180801439565, "clip_ratio/high_mean": 0.0007841616388759576, "clip_ratio/low_mean": 0.0008942230724642286, "clip_ratio/low_min": 0.00011670821277220966, "clip_ratio/region_mean": 0.0016783847022452392, "epoch": 0.13019967450081374, "grad_norm": 0.10742918401956558, "learning_rate": 2e-07, "loss": 0.0361, "step": 1395 }, { "clip_ratio/high_max": 0.0020528695749817416, "clip_ratio/high_mean": 0.0008011451764105004, "clip_ratio/low_mean": 0.000984573649475351, "clip_ratio/low_min": 7.484278648917098e-05, "clip_ratio/region_mean": 0.0017857188067864627, "epoch": 0.13029300760081433, "grad_norm": 0.11655457317829132, "learning_rate": 2e-07, "loss": 0.0446, "step": 1396 }, { "clip_ratio/high_max": 0.0019212019797123503, "clip_ratio/high_mean": 0.0007598771298944484, "clip_ratio/low_mean": 0.0008176048850145889, "clip_ratio/low_min": 3.232134440622758e-05, "clip_ratio/region_mean": 0.0015774820203660056, "epoch": 0.13038634070081492, "grad_norm": 0.11722779273986816, "learning_rate": 2e-07, "loss": 0.0622, "step": 1397 }, { "clip_ratio/high_max": 0.0020545092411339283, "clip_ratio/high_mean": 0.000918252051633317, "clip_ratio/low_mean": 0.0009099662202061154, "clip_ratio/low_min": 5.779476623501978e-05, "clip_ratio/region_mean": 0.00182821827911539, "epoch": 0.1304796738008155, "grad_norm": 0.11346706748008728, "learning_rate": 2e-07, "loss": 0.0074, "step": 1398 }, { "clip_ratio/high_max": 0.0020436286940821446, "clip_ratio/high_mean": 0.0008327026807819493, "clip_ratio/low_mean": 0.000968271149758948, "clip_ratio/low_min": 8.875710500433343e-05, "clip_ratio/region_mean": 0.001800973815988982, "epoch": 0.13057300690081608, "grad_norm": 0.12064658850431442, "learning_rate": 2e-07, "loss": 0.0107, "step": 1399 }, { "clip_ratio/high_max": 0.002070170554361539, "clip_ratio/high_mean": 0.0008184742546291091, "clip_ratio/low_mean": 0.000858435745612951, "clip_ratio/low_min": 1.3950892935099546e-05, "clip_ratio/region_mean": 0.001676909982052166, "epoch": 0.13066634000081667, "grad_norm": 0.11773994565010071, "learning_rate": 2e-07, "loss": 0.0998, "step": 1400 }, { "clip_ratio/high_max": 0.0016582413954893127, "clip_ratio/high_mean": 0.0007318408061109949, "clip_ratio/low_mean": 0.0008042468034545891, "clip_ratio/low_min": 2.5402031496923883e-05, "clip_ratio/region_mean": 0.0015360876132035628, "epoch": 0.13075967310081724, "grad_norm": 0.10315852612257004, "learning_rate": 2e-07, "loss": 0.0338, "step": 1401 }, { "clip_ratio/high_max": 0.002121425641234964, "clip_ratio/high_mean": 0.0008209840634663124, "clip_ratio/low_mean": 0.0007946453042677604, "clip_ratio/low_min": 0.00012355416583886836, "clip_ratio/region_mean": 0.0016156293568201363, "epoch": 0.13085300620081783, "grad_norm": 0.11440485715866089, "learning_rate": 2e-07, "loss": -0.0199, "step": 1402 }, { "clip_ratio/high_max": 0.0021531325692194514, "clip_ratio/high_mean": 0.0008210143150790827, "clip_ratio/low_mean": 0.000890845254616579, "clip_ratio/low_min": 3.161348377034301e-05, "clip_ratio/region_mean": 0.0017118595424108207, "epoch": 0.13094633930081842, "grad_norm": 0.12360069155693054, "learning_rate": 2e-07, "loss": 0.0381, "step": 1403 }, { "clip_ratio/high_max": 0.001991602333873743, "clip_ratio/high_mean": 0.000876546868312289, "clip_ratio/low_mean": 0.0008671397508805967, "clip_ratio/low_min": 5.895727372262627e-05, "clip_ratio/region_mean": 0.001743686581903603, "epoch": 0.13103967240081899, "grad_norm": 0.12088468670845032, "learning_rate": 2e-07, "loss": 0.0196, "step": 1404 }, { "clip_ratio/high_max": 0.0019330487120896578, "clip_ratio/high_mean": 0.0006968895268073538, "clip_ratio/low_mean": 0.000759258883590519, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.001456148413126357, "epoch": 0.13113300550081958, "grad_norm": 0.1030145063996315, "learning_rate": 2e-07, "loss": 0.0093, "step": 1405 }, { "clip_ratio/high_max": 0.00222775642760098, "clip_ratio/high_mean": 0.0008343548470293172, "clip_ratio/low_mean": 0.0008974049960670527, "clip_ratio/low_min": 8.95316552487202e-05, "clip_ratio/region_mean": 0.0017317598831141368, "epoch": 0.13122633860082017, "grad_norm": 0.114702969789505, "learning_rate": 2e-07, "loss": 0.0501, "step": 1406 }, { "clip_ratio/high_max": 0.00177004542274517, "clip_ratio/high_mean": 0.0007043215719022555, "clip_ratio/low_mean": 0.0008895602441043593, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0015938818069116678, "epoch": 0.13131967170082076, "grad_norm": 0.11877228319644928, "learning_rate": 2e-07, "loss": 0.0563, "step": 1407 }, { "clip_ratio/high_max": 0.0019409472224651836, "clip_ratio/high_mean": 0.0008373026012122864, "clip_ratio/low_mean": 0.0008248523463407764, "clip_ratio/low_min": 6.86320781824179e-05, "clip_ratio/region_mean": 0.0016621549548290204, "epoch": 0.13141300480082133, "grad_norm": 0.12597309052944183, "learning_rate": 2e-07, "loss": 0.0315, "step": 1408 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.015651157924107095, "completions/max_length": 4096.0, "completions/max_terminated_length": 4096.0, "completions/mean_length": 619.1614990234375, "completions/mean_terminated_length": 563.8796997070312, "completions/min_length": 3.0, "completions/min_terminated_length": 3.0, "epoch": 0.13150633790082192, "grad_norm": 0.11607356369495392, "learning_rate": 2e-07, "loss": 0.011, "num_tokens": 981604834.0, "reward": 0.5808890461921692, "reward_std": 0.19411884248256683, "rewards/simpleverify_reward/mean": 0.5808890461921692, "rewards/simpleverify_reward/std": 0.4934157431125641, "step": 1409 }, { "clip_ratio/high_max": 0.0020238581200828776, "clip_ratio/high_mean": 0.0007730272864137078, "clip_ratio/low_mean": 0.0005922187438045512, "clip_ratio/low_min": 1.444752615498146e-05, "clip_ratio/region_mean": 0.001365246054774616, "epoch": 0.1315996710008225, "grad_norm": 0.11262534558773041, "learning_rate": 2e-07, "loss": 0.0253, "step": 1410 }, { "clip_ratio/high_max": 0.0021391870104707778, "clip_ratio/high_mean": 0.00081176625462831, "clip_ratio/low_mean": 0.0005476342303154524, "clip_ratio/low_min": 2.5403228391951416e-05, "clip_ratio/region_mean": 0.0013594004849437624, "epoch": 0.13169300410082307, "grad_norm": 0.1096932664513588, "learning_rate": 2e-07, "loss": 0.0097, "step": 1411 }, { "clip_ratio/high_max": 0.002004061512707267, "clip_ratio/high_mean": 0.0007933758606668562, "clip_ratio/low_mean": 0.0005940421901868831, "clip_ratio/low_min": 3.173394361510873e-05, "clip_ratio/region_mean": 0.0013874180949642323, "epoch": 0.13178633720082367, "grad_norm": 0.11943253874778748, "learning_rate": 2e-07, "loss": 0.0278, "step": 1412 }, { "clip_ratio/high_max": 0.0018894285458372906, "clip_ratio/high_mean": 0.0007234920358314412, "clip_ratio/low_mean": 0.0005762428090747562, "clip_ratio/low_min": 5.5969412642298266e-05, "clip_ratio/region_mean": 0.0012997348530916497, "epoch": 0.13187967030082426, "grad_norm": 0.10913825035095215, "learning_rate": 2e-07, "loss": 0.0561, "step": 1413 }, { "clip_ratio/high_max": 0.0017913886040332727, "clip_ratio/high_mean": 0.0007872335845604539, "clip_ratio/low_mean": 0.0005389732605181052, "clip_ratio/low_min": 2.2572666239284445e-05, "clip_ratio/region_mean": 0.001326206860539969, "epoch": 0.13197300340082482, "grad_norm": 0.11583413928747177, "learning_rate": 2e-07, "loss": 0.032, "step": 1414 }, { "clip_ratio/high_max": 0.0018558311203378253, "clip_ratio/high_mean": 0.0007339506046264432, "clip_ratio/low_mean": 0.0006354933366310433, "clip_ratio/low_min": 9.521632819087245e-06, "clip_ratio/region_mean": 0.0013694439076061826, "epoch": 0.13206633650082542, "grad_norm": 0.11540807783603668, "learning_rate": 2e-07, "loss": 0.0231, "step": 1415 }, { "clip_ratio/high_max": 0.0017646006162976846, "clip_ratio/high_mean": 0.0006957149198569823, "clip_ratio/low_mean": 0.0006115770938777132, "clip_ratio/low_min": 7.063610792101827e-05, "clip_ratio/region_mean": 0.0013072920446575154, "epoch": 0.132159669600826, "grad_norm": 0.11199679970741272, "learning_rate": 2e-07, "loss": -0.0072, "step": 1416 }, { "clip_ratio/high_max": 0.001956811833224492, "clip_ratio/high_mean": 0.0008024005364859477, "clip_ratio/low_mean": 0.0004979553104931256, "clip_ratio/low_min": 1.4602804185415152e-05, "clip_ratio/region_mean": 0.0013003558742639143, "epoch": 0.13225300270082657, "grad_norm": 0.12055734544992447, "learning_rate": 2e-07, "loss": -0.0357, "step": 1417 }, { "clip_ratio/high_max": 0.0018860762393160257, "clip_ratio/high_mean": 0.0007725949599262094, "clip_ratio/low_mean": 0.0005332180953701027, "clip_ratio/low_min": 1.5056612937769387e-05, "clip_ratio/region_mean": 0.0013058130207355134, "epoch": 0.13234633580082716, "grad_norm": 0.11625038087368011, "learning_rate": 2e-07, "loss": 0.0028, "step": 1418 }, { "clip_ratio/high_max": 0.0016960201646725181, "clip_ratio/high_mean": 0.0006671453647868475, "clip_ratio/low_mean": 0.0006675170534435892, "clip_ratio/low_min": 5.092612536827801e-05, "clip_ratio/region_mean": 0.0013346624000405427, "epoch": 0.13243966890082776, "grad_norm": 0.11156806349754333, "learning_rate": 2e-07, "loss": 0.0633, "step": 1419 }, { "clip_ratio/high_max": 0.0020214892174408305, "clip_ratio/high_mean": 0.0007565125088149216, "clip_ratio/low_mean": 0.000651777761959238, "clip_ratio/low_min": 3.872359957313165e-05, "clip_ratio/region_mean": 0.001408290281688096, "epoch": 0.13253300200082832, "grad_norm": 0.11487922072410583, "learning_rate": 2e-07, "loss": 0.0449, "step": 1420 }, { "clip_ratio/high_max": 0.0018075659518217435, "clip_ratio/high_mean": 0.0007784570561852888, "clip_ratio/low_mean": 0.0006550850612256909, "clip_ratio/low_min": 4.3345678932382725e-05, "clip_ratio/region_mean": 0.001433542125596432, "epoch": 0.1326263351008289, "grad_norm": 0.11866822838783264, "learning_rate": 2e-07, "loss": 0.012, "step": 1421 }, { "clip_ratio/high_max": 0.0019527479562384542, "clip_ratio/high_mean": 0.0007215898713184288, "clip_ratio/low_mean": 0.0005829317215102492, "clip_ratio/low_min": 3.928259957319824e-05, "clip_ratio/region_mean": 0.0013045215673628263, "epoch": 0.1327196682008295, "grad_norm": 0.11857002973556519, "learning_rate": 2e-07, "loss": 0.0568, "step": 1422 }, { "clip_ratio/high_max": 0.0019850226381095126, "clip_ratio/high_mean": 0.0007415770869556582, "clip_ratio/low_mean": 0.0006260837362788152, "clip_ratio/low_min": 1.1730480764526874e-05, "clip_ratio/region_mean": 0.0013676608359673992, "epoch": 0.13281300130083007, "grad_norm": 0.12022221088409424, "learning_rate": 2e-07, "loss": 0.0511, "step": 1423 }, { "clip_ratio/high_max": 0.0016174246848095208, "clip_ratio/high_mean": 0.0007002751881373115, "clip_ratio/low_mean": 0.0006261249695853621, "clip_ratio/low_min": 3.4016984500340186e-05, "clip_ratio/region_mean": 0.001326400182733778, "epoch": 0.13290633440083066, "grad_norm": 0.12217580527067184, "learning_rate": 2e-07, "loss": 0.0571, "step": 1424 }, { "clip_ratio/high_max": 0.0019720216223504394, "clip_ratio/high_mean": 0.0008390181174036115, "clip_ratio/low_mean": 0.000581809006689582, "clip_ratio/low_min": 1.8269511201651767e-05, "clip_ratio/region_mean": 0.0014208271459210664, "epoch": 0.13299966750083125, "grad_norm": 0.12014545500278473, "learning_rate": 2e-07, "loss": 0.0326, "step": 1425 }, { "clip_ratio/high_max": 0.0018012042673944961, "clip_ratio/high_mean": 0.0008219068076869007, "clip_ratio/low_mean": 0.0006239979666133877, "clip_ratio/low_min": 3.668366298370529e-05, "clip_ratio/region_mean": 0.0014459047524724156, "epoch": 0.13309300060083182, "grad_norm": 0.11980492621660233, "learning_rate": 2e-07, "loss": 0.048, "step": 1426 }, { "clip_ratio/high_max": 0.0014298383248387836, "clip_ratio/high_mean": 0.0006193339158926392, "clip_ratio/low_mean": 0.0005814515616293647, "clip_ratio/low_min": 3.1079078780749114e-05, "clip_ratio/region_mean": 0.0012007854566036258, "epoch": 0.1331863337008324, "grad_norm": 0.11604022234678268, "learning_rate": 2e-07, "loss": 0.0136, "step": 1427 }, { "clip_ratio/high_max": 0.0018856697497540154, "clip_ratio/high_mean": 0.0006844491090305382, "clip_ratio/low_mean": 0.0006869271219329676, "clip_ratio/low_min": 2.636389217514079e-05, "clip_ratio/region_mean": 0.0013713762309635058, "epoch": 0.133279666800833, "grad_norm": 0.11561208218336105, "learning_rate": 2e-07, "loss": 0.0425, "step": 1428 }, { "clip_ratio/high_max": 0.0019381532365514431, "clip_ratio/high_mean": 0.000840874783534673, "clip_ratio/low_mean": 0.000715435337042436, "clip_ratio/low_min": 6.21290796516405e-05, "clip_ratio/region_mean": 0.0015563101151201408, "epoch": 0.1333729999008336, "grad_norm": 0.12583154439926147, "learning_rate": 2e-07, "loss": 0.0172, "step": 1429 }, { "clip_ratio/high_max": 0.0017242007415916305, "clip_ratio/high_mean": 0.0007250793896673713, "clip_ratio/low_mean": 0.0007621540353284217, "clip_ratio/low_min": 0.00011216901111765765, "clip_ratio/region_mean": 0.001487233424995793, "epoch": 0.13346633300083416, "grad_norm": 0.11240265518426895, "learning_rate": 2e-07, "loss": 0.062, "step": 1430 }, { "clip_ratio/high_max": 0.0019297096077934839, "clip_ratio/high_mean": 0.0007666026449442143, "clip_ratio/low_mean": 0.0006348452116071712, "clip_ratio/low_min": 9.507809681963408e-05, "clip_ratio/region_mean": 0.0014014478838362265, "epoch": 0.13355966610083475, "grad_norm": 0.11741531640291214, "learning_rate": 2e-07, "loss": 0.0198, "step": 1431 }, { "clip_ratio/high_max": 0.0023844494062359445, "clip_ratio/high_mean": 0.0009254289434466045, "clip_ratio/low_mean": 0.0007149942921387265, "clip_ratio/low_min": 4.6471323003061116e-05, "clip_ratio/region_mean": 0.0016404232155764475, "epoch": 0.13365299920083534, "grad_norm": 0.11778531223535538, "learning_rate": 2e-07, "loss": 0.0315, "step": 1432 }, { "clip_ratio/high_max": 0.001983109876164235, "clip_ratio/high_mean": 0.0008302333571919007, "clip_ratio/low_mean": 0.0006479879975813674, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.001478221354773268, "epoch": 0.1337463323008359, "grad_norm": 0.10910238325595856, "learning_rate": 2e-07, "loss": 0.0219, "step": 1433 }, { "clip_ratio/high_max": 0.0018589608516776934, "clip_ratio/high_mean": 0.000803500966867432, "clip_ratio/low_mean": 0.0007304258197109448, "clip_ratio/low_min": 4.548735341813881e-05, "clip_ratio/region_mean": 0.0015339267629315145, "epoch": 0.1338396654008365, "grad_norm": 0.12177577614784241, "learning_rate": 2e-07, "loss": -0.001, "step": 1434 }, { "clip_ratio/high_max": 0.0019800846639554948, "clip_ratio/high_mean": 0.0007399069795610558, "clip_ratio/low_mean": 0.0006880286109662848, "clip_ratio/low_min": 2.5069343791983556e-05, "clip_ratio/region_mean": 0.0014279355818871409, "epoch": 0.1339329985008371, "grad_norm": 0.116060271859169, "learning_rate": 2e-07, "loss": 0.0076, "step": 1435 }, { "clip_ratio/high_max": 0.002340161252504913, "clip_ratio/high_mean": 0.0008662767413625261, "clip_ratio/low_mean": 0.000652257731417194, "clip_ratio/low_min": 4.318677929404657e-05, "clip_ratio/region_mean": 0.0015185344418569002, "epoch": 0.13402633160083766, "grad_norm": 0.11506643146276474, "learning_rate": 2e-07, "loss": 0.0057, "step": 1436 }, { "clip_ratio/high_max": 0.0019396092102397233, "clip_ratio/high_mean": 0.0007745549664832652, "clip_ratio/low_mean": 0.0008569749024900375, "clip_ratio/low_min": 5.923406752117444e-05, "clip_ratio/region_mean": 0.0016315299217239954, "epoch": 0.13411966470083825, "grad_norm": 0.13506953418254852, "learning_rate": 2e-07, "loss": 0.0589, "step": 1437 }, { "clip_ratio/high_max": 0.0022617389331571758, "clip_ratio/high_mean": 0.0008626760518382071, "clip_ratio/low_mean": 0.0006205956933627021, "clip_ratio/low_min": 6.942697109479923e-05, "clip_ratio/region_mean": 0.0014832717279205099, "epoch": 0.13421299780083884, "grad_norm": 0.11301650106906891, "learning_rate": 2e-07, "loss": 0.0281, "step": 1438 }, { "clip_ratio/high_max": 0.0017473006446380168, "clip_ratio/high_mean": 0.0007116386314010015, "clip_ratio/low_mean": 0.0008098490106931422, "clip_ratio/low_min": 0.00011563079578991164, "clip_ratio/region_mean": 0.0015214876584650483, "epoch": 0.1343063309008394, "grad_norm": 0.11921726912260056, "learning_rate": 2e-07, "loss": 0.0675, "step": 1439 }, { "clip_ratio/high_max": 0.001566146642289823, "clip_ratio/high_mean": 0.0006612081679122639, "clip_ratio/low_mean": 0.000811291518402868, "clip_ratio/low_min": 8.125036129058572e-05, "clip_ratio/region_mean": 0.0014724996617587749, "epoch": 0.13439966400084, "grad_norm": 0.10796200484037399, "learning_rate": 2e-07, "loss": 0.0521, "step": 1440 }, { "clip_ratio/high_max": 0.001980977802304551, "clip_ratio/high_mean": 0.0007881141264078906, "clip_ratio/low_mean": 0.0007253321600728668, "clip_ratio/low_min": 0.00010377618082202389, "clip_ratio/region_mean": 0.0015134462591959164, "epoch": 0.1344929971008406, "grad_norm": 0.12186485528945923, "learning_rate": 2e-07, "loss": -0.0067, "step": 1441 }, { "clip_ratio/high_max": 0.0016775948643044103, "clip_ratio/high_mean": 0.0006587004627363058, "clip_ratio/low_mean": 0.000784893467425718, "clip_ratio/low_min": 7.820361679478083e-05, "clip_ratio/region_mean": 0.001443593944713939, "epoch": 0.13458633020084115, "grad_norm": 0.11215104162693024, "learning_rate": 2e-07, "loss": 0.0697, "step": 1442 }, { "clip_ratio/high_max": 0.002010987729590852, "clip_ratio/high_mean": 0.0007932093885756331, "clip_ratio/low_mean": 0.0007166429650169448, "clip_ratio/low_min": 2.7240886083745863e-05, "clip_ratio/region_mean": 0.0015098523363121785, "epoch": 0.13467966330084175, "grad_norm": 0.12853403389453888, "learning_rate": 2e-07, "loss": 0.0009, "step": 1443 }, { "clip_ratio/high_max": 0.0020383388218760956, "clip_ratio/high_mean": 0.0008834676664264407, "clip_ratio/low_mean": 0.0007674682019569445, "clip_ratio/low_min": 4.2398195546411444e-05, "clip_ratio/region_mean": 0.0016509358465555124, "epoch": 0.13477299640084234, "grad_norm": 0.11752558499574661, "learning_rate": 2e-07, "loss": 0.0028, "step": 1444 }, { "clip_ratio/high_max": 0.0017493718933110358, "clip_ratio/high_mean": 0.0007452690761056147, "clip_ratio/low_mean": 0.0008068344413914019, "clip_ratio/low_min": 8.516884918208234e-05, "clip_ratio/region_mean": 0.0015521035566052888, "epoch": 0.1348663295008429, "grad_norm": 0.11876316368579865, "learning_rate": 2e-07, "loss": 0.0542, "step": 1445 }, { "clip_ratio/high_max": 0.0021564784547081217, "clip_ratio/high_mean": 0.0009385626563016558, "clip_ratio/low_mean": 0.0006697322232867009, "clip_ratio/low_min": 3.9578520045324694e-05, "clip_ratio/region_mean": 0.0016082948714029044, "epoch": 0.1349596626008435, "grad_norm": 0.10920839756727219, "learning_rate": 2e-07, "loss": -0.0275, "step": 1446 }, { "clip_ratio/high_max": 0.0023614708698005415, "clip_ratio/high_mean": 0.0009068939507415053, "clip_ratio/low_mean": 0.0007766047037875978, "clip_ratio/low_min": 5.3554644182440825e-05, "clip_ratio/region_mean": 0.0016834986745379865, "epoch": 0.1350529957008441, "grad_norm": 0.1340794414281845, "learning_rate": 2e-07, "loss": 0.0413, "step": 1447 }, { "clip_ratio/high_max": 0.0018064972609863617, "clip_ratio/high_mean": 0.0007527923644374823, "clip_ratio/low_mean": 0.0007681156857870519, "clip_ratio/low_min": 6.867258571219281e-05, "clip_ratio/region_mean": 0.0015209080302156508, "epoch": 0.13514632880084468, "grad_norm": 0.11589518189430237, "learning_rate": 2e-07, "loss": 0.0254, "step": 1448 }, { "clip_ratio/high_max": 0.0020689888624474406, "clip_ratio/high_mean": 0.0008515621393598849, "clip_ratio/low_mean": 0.0007656283087271731, "clip_ratio/low_min": 3.123438364127651e-05, "clip_ratio/region_mean": 0.0016171904790098779, "epoch": 0.13523966190084524, "grad_norm": 0.11082395911216736, "learning_rate": 2e-07, "loss": 0.0013, "step": 1449 }, { "clip_ratio/high_max": 0.0020023477700306103, "clip_ratio/high_mean": 0.0007983002287801355, "clip_ratio/low_mean": 0.0007735772232990712, "clip_ratio/low_min": 4.3283996092213783e-05, "clip_ratio/region_mean": 0.0015718774411652703, "epoch": 0.13533299500084583, "grad_norm": 0.11476428806781769, "learning_rate": 2e-07, "loss": -0.0145, "step": 1450 }, { "clip_ratio/high_max": 0.0018441542852087878, "clip_ratio/high_mean": 0.0007500748261008994, "clip_ratio/low_mean": 0.0008122992021526443, "clip_ratio/low_min": 4.516948047239566e-05, "clip_ratio/region_mean": 0.001562374018249102, "epoch": 0.13542632810084643, "grad_norm": 0.11719583719968796, "learning_rate": 2e-07, "loss": 0.0274, "step": 1451 }, { "clip_ratio/high_max": 0.0018311503990844358, "clip_ratio/high_mean": 0.0007566690055682557, "clip_ratio/low_mean": 0.0007725996802037116, "clip_ratio/low_min": 3.669734360300936e-05, "clip_ratio/region_mean": 0.0015292686730390415, "epoch": 0.135519661200847, "grad_norm": 0.1133178323507309, "learning_rate": 2e-07, "loss": 0.0163, "step": 1452 }, { "clip_ratio/high_max": 0.0019924047664972022, "clip_ratio/high_mean": 0.0008320809265569551, "clip_ratio/low_mean": 0.0008117877787299221, "clip_ratio/low_min": 3.994688631792087e-05, "clip_ratio/region_mean": 0.0016438686943729408, "epoch": 0.13561299430084758, "grad_norm": 0.12285424023866653, "learning_rate": 2e-07, "loss": 0.0068, "step": 1453 }, { "clip_ratio/high_max": 0.0019165333433193155, "clip_ratio/high_mean": 0.0007696291977481451, "clip_ratio/low_mean": 0.000779368587245699, "clip_ratio/low_min": 3.477190421108389e-05, "clip_ratio/region_mean": 0.0015489977813558653, "epoch": 0.13570632740084818, "grad_norm": 0.12307151407003403, "learning_rate": 2e-07, "loss": 0.0398, "step": 1454 }, { "clip_ratio/high_max": 0.0016114241370814852, "clip_ratio/high_mean": 0.0006909146832185797, "clip_ratio/low_mean": 0.0006994193599894061, "clip_ratio/low_min": 7.640586773050018e-06, "clip_ratio/region_mean": 0.0013903340950491838, "epoch": 0.13579966050084874, "grad_norm": 0.11408301442861557, "learning_rate": 2e-07, "loss": 0.0215, "step": 1455 }, { "clip_ratio/high_max": 0.00224641843669815, "clip_ratio/high_mean": 0.0008519945749867475, "clip_ratio/low_mean": 0.0008661876254336676, "clip_ratio/low_min": 5.94716120758676e-05, "clip_ratio/region_mean": 0.0017181821676786058, "epoch": 0.13589299360084933, "grad_norm": 0.11069908738136292, "learning_rate": 2e-07, "loss": 0.0262, "step": 1456 }, { "clip_ratio/high_max": 0.0020650003134505823, "clip_ratio/high_mean": 0.0007927407787065022, "clip_ratio/low_mean": 0.0008316412349813618, "clip_ratio/low_min": 4.111545786145143e-05, "clip_ratio/region_mean": 0.0016243820209638216, "epoch": 0.13598632670084992, "grad_norm": 0.11312870681285858, "learning_rate": 2e-07, "loss": 0.0196, "step": 1457 }, { "clip_ratio/high_max": 0.0018805214422172867, "clip_ratio/high_mean": 0.000752954394556582, "clip_ratio/low_mean": 0.0007235482444230001, "clip_ratio/low_min": 6.011170353303896e-05, "clip_ratio/region_mean": 0.0014765026062377729, "epoch": 0.1360796598008505, "grad_norm": 0.11401940137147903, "learning_rate": 2e-07, "loss": 0.0506, "step": 1458 }, { "clip_ratio/high_max": 0.002258387343317736, "clip_ratio/high_mean": 0.0009132294235314475, "clip_ratio/low_mean": 0.000683300218952354, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0015965296115609817, "epoch": 0.13617299290085108, "grad_norm": 0.11211583018302917, "learning_rate": 2e-07, "loss": -0.0088, "step": 1459 }, { "clip_ratio/high_max": 0.0018928261488326825, "clip_ratio/high_mean": 0.0008067896560532972, "clip_ratio/low_mean": 0.0008455054321530042, "clip_ratio/low_min": 6.838709396106424e-05, "clip_ratio/region_mean": 0.0016522951336810365, "epoch": 0.13626632600085167, "grad_norm": 0.11112020164728165, "learning_rate": 2e-07, "loss": 0.01, "step": 1460 }, { "clip_ratio/high_max": 0.002103511036693817, "clip_ratio/high_mean": 0.0008376006244361633, "clip_ratio/low_mean": 0.0008418587331107119, "clip_ratio/low_min": 5.109750054543838e-05, "clip_ratio/region_mean": 0.0016794593539088964, "epoch": 0.13635965910085224, "grad_norm": 0.11802016943693161, "learning_rate": 2e-07, "loss": 0.0605, "step": 1461 }, { "clip_ratio/high_max": 0.0018220002675661817, "clip_ratio/high_mean": 0.0007320384866034146, "clip_ratio/low_mean": 0.0008749408170842798, "clip_ratio/low_min": 2.412511639704462e-05, "clip_ratio/region_mean": 0.0016069793346105143, "epoch": 0.13645299220085283, "grad_norm": 0.11744838953018188, "learning_rate": 2e-07, "loss": 0.0442, "step": 1462 }, { "clip_ratio/high_max": 0.002082470338791609, "clip_ratio/high_mean": 0.0007684449046791997, "clip_ratio/low_mean": 0.0008109148457151605, "clip_ratio/low_min": 2.950435100501636e-05, "clip_ratio/region_mean": 0.0015793597412994131, "epoch": 0.13654632530085342, "grad_norm": 0.12579548358917236, "learning_rate": 2e-07, "loss": 0.0355, "step": 1463 }, { "clip_ratio/high_max": 0.002054590091574937, "clip_ratio/high_mean": 0.0008626723811175907, "clip_ratio/low_mean": 0.0008043238740356173, "clip_ratio/low_min": 4.3937156078754924e-05, "clip_ratio/region_mean": 0.0016669962133164518, "epoch": 0.13663965840085399, "grad_norm": 0.11771884560585022, "learning_rate": 2e-07, "loss": -0.0236, "step": 1464 }, { "clip_ratio/high_max": 0.0019102517653664108, "clip_ratio/high_mean": 0.0007395319062197814, "clip_ratio/low_mean": 0.0008694875104993116, "clip_ratio/low_min": 6.605442104046233e-05, "clip_ratio/region_mean": 0.0016090193930722307, "epoch": 0.13673299150085458, "grad_norm": 0.12299696356058121, "learning_rate": 2e-07, "loss": 0.0398, "step": 1465 }, { "clip_ratio/high_max": 0.002050490329565946, "clip_ratio/high_mean": 0.0009202422206726624, "clip_ratio/low_mean": 0.0007017295683908742, "clip_ratio/low_min": 1.2079628504579887e-05, "clip_ratio/region_mean": 0.0016219718127103988, "epoch": 0.13682632460085517, "grad_norm": 0.11959147453308105, "learning_rate": 2e-07, "loss": 0.0095, "step": 1466 }, { "clip_ratio/high_max": 0.0018018000628217123, "clip_ratio/high_mean": 0.0006763321161997737, "clip_ratio/low_mean": 0.000987244140560506, "clip_ratio/low_min": 0.00016499254343216307, "clip_ratio/region_mean": 0.0016635762622172479, "epoch": 0.13691965770085573, "grad_norm": 0.11646529287099838, "learning_rate": 2e-07, "loss": 0.0945, "step": 1467 }, { "clip_ratio/high_max": 0.0018284965844941325, "clip_ratio/high_mean": 0.0007346723032242153, "clip_ratio/low_mean": 0.0008415589109063148, "clip_ratio/low_min": 5.68041668884689e-05, "clip_ratio/region_mean": 0.0015762312104925513, "epoch": 0.13701299080085633, "grad_norm": 0.12849688529968262, "learning_rate": 2e-07, "loss": 0.0478, "step": 1468 }, { "clip_ratio/high_max": 0.002003147947107209, "clip_ratio/high_mean": 0.0007086854839144507, "clip_ratio/low_mean": 0.0008341411667061038, "clip_ratio/low_min": 5.424440951173892e-05, "clip_ratio/region_mean": 0.0015428266378876287, "epoch": 0.13710632390085692, "grad_norm": 0.125239759683609, "learning_rate": 2e-07, "loss": 0.0483, "step": 1469 }, { "clip_ratio/high_max": 0.0018837411989807151, "clip_ratio/high_mean": 0.0007635022939211922, "clip_ratio/low_mean": 0.0007748775205982383, "clip_ratio/low_min": 7.755357546557207e-05, "clip_ratio/region_mean": 0.0015383798308903351, "epoch": 0.1371996570008575, "grad_norm": 0.12247708439826965, "learning_rate": 2e-07, "loss": 0.0549, "step": 1470 }, { "clip_ratio/high_max": 0.0018130841417587362, "clip_ratio/high_mean": 0.0007645061232324224, "clip_ratio/low_mean": 0.0008059449246502481, "clip_ratio/low_min": 5.703983151761349e-05, "clip_ratio/region_mean": 0.0015704510478826705, "epoch": 0.13729299010085808, "grad_norm": 0.12352964282035828, "learning_rate": 2e-07, "loss": -0.0011, "step": 1471 }, { "clip_ratio/high_max": 0.0022817215794930235, "clip_ratio/high_mean": 0.0009228906492353417, "clip_ratio/low_mean": 0.0008102824958768906, "clip_ratio/low_min": 4.450981487025274e-05, "clip_ratio/region_mean": 0.0017331731360172853, "epoch": 0.13738632320085867, "grad_norm": 0.11435064673423767, "learning_rate": 2e-07, "loss": -0.009, "step": 1472 }, { "clip_ratio/high_max": 0.0018429293704684824, "clip_ratio/high_mean": 0.0007932840198918711, "clip_ratio/low_mean": 0.0007716078071098309, "clip_ratio/low_min": 2.946257245639572e-05, "clip_ratio/region_mean": 0.0015648918015358504, "epoch": 0.13747965630085926, "grad_norm": 0.1262778490781784, "learning_rate": 2e-07, "loss": 0.0346, "step": 1473 }, { "clip_ratio/high_max": 0.002138561067113187, "clip_ratio/high_mean": 0.0008668529299029615, "clip_ratio/low_mean": 0.000854341988087981, "clip_ratio/low_min": 6.820854468969628e-05, "clip_ratio/region_mean": 0.0017211949234479107, "epoch": 0.13757298940085982, "grad_norm": 0.1192367747426033, "learning_rate": 2e-07, "loss": 0.0054, "step": 1474 }, { "clip_ratio/high_max": 0.0019341401202837005, "clip_ratio/high_mean": 0.0008405105472775176, "clip_ratio/low_mean": 0.0007131917627702933, "clip_ratio/low_min": 1.6622339899186045e-05, "clip_ratio/region_mean": 0.0015537023209617473, "epoch": 0.13766632250086042, "grad_norm": 0.1120966449379921, "learning_rate": 2e-07, "loss": -0.0001, "step": 1475 }, { "clip_ratio/high_max": 0.0016519250930286944, "clip_ratio/high_mean": 0.000703207113474491, "clip_ratio/low_mean": 0.0008263814670499414, "clip_ratio/low_min": 0.00013420890627457993, "clip_ratio/region_mean": 0.0015295885823434219, "epoch": 0.137759655600861, "grad_norm": 0.1162533089518547, "learning_rate": 2e-07, "loss": 0.058, "step": 1476 }, { "clip_ratio/high_max": 0.0019603210093919188, "clip_ratio/high_mean": 0.0008785676800471265, "clip_ratio/low_mean": 0.0007607883599121124, "clip_ratio/low_min": 2.8045769795426168e-05, "clip_ratio/region_mean": 0.0016393560290453024, "epoch": 0.13785298870086157, "grad_norm": 0.11489348858594894, "learning_rate": 2e-07, "loss": -0.0106, "step": 1477 }, { "clip_ratio/high_max": 0.0019518959525157697, "clip_ratio/high_mean": 0.0008070275125646731, "clip_ratio/low_mean": 0.0007439487071678741, "clip_ratio/low_min": 3.9592852772329934e-05, "clip_ratio/region_mean": 0.001550976205180632, "epoch": 0.13794632180086216, "grad_norm": 0.1130918487906456, "learning_rate": 2e-07, "loss": -0.0078, "step": 1478 }, { "clip_ratio/high_max": 0.0019165510639140848, "clip_ratio/high_mean": 0.0007913698809716152, "clip_ratio/low_mean": 0.0006961471517570317, "clip_ratio/low_min": 7.071393338264897e-05, "clip_ratio/region_mean": 0.0014875170309096575, "epoch": 0.13803965490086276, "grad_norm": 0.11394207924604416, "learning_rate": 2e-07, "loss": 0.0149, "step": 1479 }, { "clip_ratio/high_max": 0.002071254115435295, "clip_ratio/high_mean": 0.0007932908310976927, "clip_ratio/low_mean": 0.0006818989613748272, "clip_ratio/low_min": 4.8872245315578766e-05, "clip_ratio/region_mean": 0.0014751897906535305, "epoch": 0.13813298800086332, "grad_norm": 0.11755910515785217, "learning_rate": 2e-07, "loss": 0.0145, "step": 1480 }, { "clip_ratio/high_max": 0.001856110346125206, "clip_ratio/high_mean": 0.0007748300213279435, "clip_ratio/low_mean": 0.0007231926574604586, "clip_ratio/low_min": 6.420639783755178e-05, "clip_ratio/region_mean": 0.0014980226842453703, "epoch": 0.1382263211008639, "grad_norm": 0.10258106887340546, "learning_rate": 2e-07, "loss": 0.0155, "step": 1481 }, { "clip_ratio/high_max": 0.0017803746995923575, "clip_ratio/high_mean": 0.0007592463007313199, "clip_ratio/low_mean": 0.0008070137046161108, "clip_ratio/low_min": 5.841034453624161e-05, "clip_ratio/region_mean": 0.001566259998071473, "epoch": 0.1383196542008645, "grad_norm": 0.12491416186094284, "learning_rate": 2e-07, "loss": 0.0379, "step": 1482 }, { "clip_ratio/high_max": 0.001963299233466387, "clip_ratio/high_mean": 0.0007639478099008556, "clip_ratio/low_mean": 0.0009196346545650158, "clip_ratio/low_min": 3.0202295420167502e-05, "clip_ratio/region_mean": 0.0016835824790177867, "epoch": 0.13841298730086507, "grad_norm": 0.12312162667512894, "learning_rate": 2e-07, "loss": 0.0522, "step": 1483 }, { "clip_ratio/high_max": 0.0018340091810387094, "clip_ratio/high_mean": 0.0007375262139248662, "clip_ratio/low_mean": 0.000871125899720937, "clip_ratio/low_min": 3.0543676984962076e-05, "clip_ratio/region_mean": 0.0016086520772660151, "epoch": 0.13850632040086566, "grad_norm": 0.10878380388021469, "learning_rate": 2e-07, "loss": 0.0168, "step": 1484 }, { "clip_ratio/high_max": 0.002034580676991027, "clip_ratio/high_mean": 0.0007892910252849106, "clip_ratio/low_mean": 0.000789464404078899, "clip_ratio/low_min": 6.355701043503359e-05, "clip_ratio/region_mean": 0.0015787554621056188, "epoch": 0.13859965350086625, "grad_norm": 0.10368139296770096, "learning_rate": 2e-07, "loss": 0.0307, "step": 1485 }, { "clip_ratio/high_max": 0.0016998040555336047, "clip_ratio/high_mean": 0.0007035853623165167, "clip_ratio/low_mean": 0.0008077201691776281, "clip_ratio/low_min": 0.00013301407580001978, "clip_ratio/region_mean": 0.001511305534222629, "epoch": 0.13869298660086682, "grad_norm": 0.12030323594808578, "learning_rate": 2e-07, "loss": 0.0462, "step": 1486 }, { "clip_ratio/high_max": 0.0018656953070603777, "clip_ratio/high_mean": 0.0007198357525339816, "clip_ratio/low_mean": 0.0007467694049410056, "clip_ratio/low_min": 4.0534579966333695e-05, "clip_ratio/region_mean": 0.0014666051501990296, "epoch": 0.1387863197008674, "grad_norm": 0.118343286216259, "learning_rate": 2e-07, "loss": 0.0115, "step": 1487 }, { "clip_ratio/high_max": 0.0016743192863941658, "clip_ratio/high_mean": 0.0007550469199486542, "clip_ratio/low_mean": 0.0008532493375241756, "clip_ratio/low_min": 8.071745196502889e-05, "clip_ratio/region_mean": 0.001608296217455063, "epoch": 0.138879652800868, "grad_norm": 0.11635386943817139, "learning_rate": 2e-07, "loss": 0.0803, "step": 1488 }, { "clip_ratio/high_max": 0.002184636556194164, "clip_ratio/high_mean": 0.000846075983645278, "clip_ratio/low_mean": 0.0007427035452565178, "clip_ratio/low_min": 1.4149875823932234e-05, "clip_ratio/region_mean": 0.0015887794761511032, "epoch": 0.13897298590086857, "grad_norm": 0.13983197510242462, "learning_rate": 2e-07, "loss": 0.0167, "step": 1489 }, { "clip_ratio/high_max": 0.002190988845541142, "clip_ratio/high_mean": 0.0008227619036915712, "clip_ratio/low_mean": 0.0007513558302889578, "clip_ratio/low_min": 4.125445502722869e-05, "clip_ratio/region_mean": 0.0015741177121526562, "epoch": 0.13906631900086916, "grad_norm": 0.11038467288017273, "learning_rate": 2e-07, "loss": 0.0161, "step": 1490 }, { "clip_ratio/high_max": 0.002054443488304969, "clip_ratio/high_mean": 0.000799819275016489, "clip_ratio/low_mean": 0.0008269161080534104, "clip_ratio/low_min": 2.1234925952740014e-05, "clip_ratio/region_mean": 0.0016267354076262563, "epoch": 0.13915965210086975, "grad_norm": 0.12629100680351257, "learning_rate": 2e-07, "loss": 0.0539, "step": 1491 }, { "clip_ratio/high_max": 0.0020502476254478097, "clip_ratio/high_mean": 0.000831092342195916, "clip_ratio/low_mean": 0.0008358926952496404, "clip_ratio/low_min": 4.8535353471379494e-05, "clip_ratio/region_mean": 0.0016669850010657683, "epoch": 0.13925298520087034, "grad_norm": 0.10950468480587006, "learning_rate": 2e-07, "loss": 0.0496, "step": 1492 }, { "clip_ratio/high_max": 0.002082509803585708, "clip_ratio/high_mean": 0.0008552373365091626, "clip_ratio/low_mean": 0.0007759485870337812, "clip_ratio/low_min": 0.00010175279294344364, "clip_ratio/region_mean": 0.0016311859217239544, "epoch": 0.1393463183008709, "grad_norm": 0.1217878982424736, "learning_rate": 2e-07, "loss": -0.0008, "step": 1493 }, { "clip_ratio/high_max": 0.0021484994285856374, "clip_ratio/high_mean": 0.0008096314832073404, "clip_ratio/low_mean": 0.0008232501531892922, "clip_ratio/low_min": 0.00011953696684940951, "clip_ratio/region_mean": 0.0016328816782333888, "epoch": 0.1394396514008715, "grad_norm": 0.1365000605583191, "learning_rate": 2e-07, "loss": 0.0181, "step": 1494 }, { "clip_ratio/high_max": 0.0020136953207838815, "clip_ratio/high_mean": 0.0007932530734251486, "clip_ratio/low_mean": 0.0007502967473556055, "clip_ratio/low_min": 0.00010108898277394474, "clip_ratio/region_mean": 0.0015435498498845845, "epoch": 0.1395329845008721, "grad_norm": 0.1172717958688736, "learning_rate": 2e-07, "loss": -0.0258, "step": 1495 }, { "clip_ratio/high_max": 0.001955519095645286, "clip_ratio/high_mean": 0.0009036614683282096, "clip_ratio/low_mean": 0.0008562518378312234, "clip_ratio/low_min": 0.00017809019846026786, "clip_ratio/region_mean": 0.0017599132988834754, "epoch": 0.13962631760087266, "grad_norm": 0.1257271021604538, "learning_rate": 2e-07, "loss": 0.0161, "step": 1496 }, { "clip_ratio/high_max": 0.0023994001021492295, "clip_ratio/high_mean": 0.0007825980010238709, "clip_ratio/low_mean": 0.0009202493456541561, "clip_ratio/low_min": 5.6976257837959565e-05, "clip_ratio/region_mean": 0.0017028473230311647, "epoch": 0.13971965070087325, "grad_norm": 0.12196046113967896, "learning_rate": 2e-07, "loss": 0.0352, "step": 1497 }, { "clip_ratio/high_max": 0.002077218177873874, "clip_ratio/high_mean": 0.0008178950574802002, "clip_ratio/low_mean": 0.0008100532559183193, "clip_ratio/low_min": 3.3784030165406875e-05, "clip_ratio/region_mean": 0.0016279483170364983, "epoch": 0.13981298380087384, "grad_norm": 19.748563766479492, "learning_rate": 2e-07, "loss": 0.0466, "step": 1498 }, { "clip_ratio/high_max": 0.002036976278759539, "clip_ratio/high_mean": 0.0007161404264479643, "clip_ratio/low_mean": 0.0008646048572700238, "clip_ratio/low_min": 9.533472075418103e-05, "clip_ratio/region_mean": 0.0015807452946319245, "epoch": 0.1399063169008744, "grad_norm": 0.1121644601225853, "learning_rate": 2e-07, "loss": 0.035, "step": 1499 }, { "clip_ratio/high_max": 0.0018814212671713904, "clip_ratio/high_mean": 0.0007949936752993381, "clip_ratio/low_mean": 0.0008786795187916141, "clip_ratio/low_min": 3.8852563193358947e-05, "clip_ratio/region_mean": 0.0016736731777200475, "epoch": 0.139999650000875, "grad_norm": 0.12166900187730789, "learning_rate": 2e-07, "loss": 0.0321, "step": 1500 }, { "clip_ratio/high_max": 0.0019891385818482377, "clip_ratio/high_mean": 0.0007780337018630235, "clip_ratio/low_mean": 0.0007578488039143849, "clip_ratio/low_min": 3.9413117519870866e-05, "clip_ratio/region_mean": 0.0015358825257862918, "epoch": 0.1400929831008756, "grad_norm": 0.11292281746864319, "learning_rate": 2e-07, "loss": 0.0117, "step": 1501 }, { "clip_ratio/high_max": 0.002147349252481945, "clip_ratio/high_mean": 0.0008360655428987229, "clip_ratio/low_mean": 0.0009322054920630762, "clip_ratio/low_min": 0.00010167718210141174, "clip_ratio/region_mean": 0.0017682710531516932, "epoch": 0.14018631620087615, "grad_norm": 0.12126880884170532, "learning_rate": 2e-07, "loss": 0.0424, "step": 1502 }, { "clip_ratio/high_max": 0.0020838722921325825, "clip_ratio/high_mean": 0.0008489434549119323, "clip_ratio/low_mean": 0.0007812243984517409, "clip_ratio/low_min": 7.247428857226623e-05, "clip_ratio/region_mean": 0.0016301678551826626, "epoch": 0.14027964930087675, "grad_norm": 0.11141068488359451, "learning_rate": 2e-07, "loss": 0.0035, "step": 1503 }, { "clip_ratio/high_max": 0.0018730681767920032, "clip_ratio/high_mean": 0.0007987346343725221, "clip_ratio/low_mean": 0.0009506357691861922, "clip_ratio/low_min": 6.98070807629847e-05, "clip_ratio/region_mean": 0.0017493704071966931, "epoch": 0.14037298240087734, "grad_norm": 0.10860446095466614, "learning_rate": 2e-07, "loss": 0.0134, "step": 1504 }, { "clip_ratio/high_max": 0.00204423964896705, "clip_ratio/high_mean": 0.0008117208108160412, "clip_ratio/low_mean": 0.0009018660311994608, "clip_ratio/low_min": 8.579812947573373e-05, "clip_ratio/region_mean": 0.0017135868292825762, "epoch": 0.1404663155008779, "grad_norm": 0.12040314078330994, "learning_rate": 2e-07, "loss": 0.0154, "step": 1505 }, { "clip_ratio/high_max": 0.002111365582095459, "clip_ratio/high_mean": 0.0008329499087267322, "clip_ratio/low_mean": 0.0007639014929736732, "clip_ratio/low_min": 7.213773278635927e-05, "clip_ratio/region_mean": 0.001596851354406681, "epoch": 0.1405596486008785, "grad_norm": 0.10473189502954483, "learning_rate": 2e-07, "loss": 0.0127, "step": 1506 }, { "clip_ratio/high_max": 0.0020095140716875903, "clip_ratio/high_mean": 0.0007500226602132898, "clip_ratio/low_mean": 0.0008642314223834546, "clip_ratio/low_min": 6.788511927879881e-05, "clip_ratio/region_mean": 0.0016142540771397762, "epoch": 0.1406529817008791, "grad_norm": 0.11776019632816315, "learning_rate": 2e-07, "loss": 0.0419, "step": 1507 }, { "clip_ratio/high_max": 0.0020106303127249703, "clip_ratio/high_mean": 0.0008470014363410883, "clip_ratio/low_mean": 0.0007102326271706261, "clip_ratio/low_min": 6.373954784066882e-05, "clip_ratio/region_mean": 0.0015572340780636296, "epoch": 0.14074631480087965, "grad_norm": 0.1212378591299057, "learning_rate": 2e-07, "loss": -0.0125, "step": 1508 }, { "clip_ratio/high_max": 0.002043035528913606, "clip_ratio/high_mean": 0.0007536050852650078, "clip_ratio/low_mean": 0.000787485904766072, "clip_ratio/low_min": 7.037601608317345e-05, "clip_ratio/region_mean": 0.0015410909873025957, "epoch": 0.14083964790088024, "grad_norm": 0.11257391422986984, "learning_rate": 2e-07, "loss": 0.0296, "step": 1509 }, { "clip_ratio/high_max": 0.0018142778280889615, "clip_ratio/high_mean": 0.0008058108087425353, "clip_ratio/low_mean": 0.000747894525375159, "clip_ratio/low_min": 6.751533965143608e-05, "clip_ratio/region_mean": 0.0015537053404841572, "epoch": 0.14093298100088084, "grad_norm": 0.11166970431804657, "learning_rate": 2e-07, "loss": 0.0065, "step": 1510 }, { "clip_ratio/high_max": 0.001869442974566482, "clip_ratio/high_mean": 0.0006762733373761876, "clip_ratio/low_mean": 0.0008952445950853871, "clip_ratio/low_min": 0.0001294313569815131, "clip_ratio/region_mean": 0.0015715179360995535, "epoch": 0.14102631410088143, "grad_norm": 0.10648966580629349, "learning_rate": 2e-07, "loss": 0.0348, "step": 1511 }, { "clip_ratio/high_max": 0.0016181381688511465, "clip_ratio/high_mean": 0.0007002374677540502, "clip_ratio/low_mean": 0.0009360471103718737, "clip_ratio/low_min": 0.00014057061162020545, "clip_ratio/region_mean": 0.0016362846181436908, "epoch": 0.141119647200882, "grad_norm": 0.11024022847414017, "learning_rate": 2e-07, "loss": 0.073, "step": 1512 }, { "clip_ratio/high_max": 0.002244188690383453, "clip_ratio/high_mean": 0.0008118854057101998, "clip_ratio/low_mean": 0.0009494754431216279, "clip_ratio/low_min": 8.95027214937727e-05, "clip_ratio/region_mean": 0.00176136087247869, "epoch": 0.14121298030088258, "grad_norm": 0.1143442913889885, "learning_rate": 2e-07, "loss": 0.0335, "step": 1513 }, { "clip_ratio/high_max": 0.0016782991551735904, "clip_ratio/high_mean": 0.0007293934922927292, "clip_ratio/low_mean": 0.0009781317112356192, "clip_ratio/low_min": 5.885858627152629e-05, "clip_ratio/region_mean": 0.001707525210804306, "epoch": 0.14130631340088318, "grad_norm": 0.12796278297901154, "learning_rate": 2e-07, "loss": 0.0521, "step": 1514 }, { "clip_ratio/high_max": 0.001926420911331661, "clip_ratio/high_mean": 0.0008041036744543817, "clip_ratio/low_mean": 0.0007801476940585417, "clip_ratio/low_min": 5.823042465635808e-05, "clip_ratio/region_mean": 0.001584251418535132, "epoch": 0.14139964650088374, "grad_norm": 0.1069251075387001, "learning_rate": 2e-07, "loss": 0.0128, "step": 1515 }, { "clip_ratio/high_max": 0.002123073169059353, "clip_ratio/high_mean": 0.0009536673278489616, "clip_ratio/low_mean": 0.0008516432881151559, "clip_ratio/low_min": 8.277444067061879e-05, "clip_ratio/region_mean": 0.0018053105886792764, "epoch": 0.14149297960088433, "grad_norm": 0.11575865745544434, "learning_rate": 2e-07, "loss": -0.02, "step": 1516 }, { "clip_ratio/high_max": 0.002011477728956379, "clip_ratio/high_mean": 0.0007818517497071298, "clip_ratio/low_mean": 0.0009431977341591846, "clip_ratio/low_min": 7.107400097083882e-05, "clip_ratio/region_mean": 0.001725049500237219, "epoch": 0.14158631270088493, "grad_norm": 0.10971131175756454, "learning_rate": 2e-07, "loss": 0.0512, "step": 1517 }, { "clip_ratio/high_max": 0.0020395308529259637, "clip_ratio/high_mean": 0.0008268411347671645, "clip_ratio/low_mean": 0.0008523019896529149, "clip_ratio/low_min": 8.219391929742415e-05, "clip_ratio/region_mean": 0.0016791430971352383, "epoch": 0.1416796458008855, "grad_norm": 0.11466878652572632, "learning_rate": 2e-07, "loss": 0.0126, "step": 1518 }, { "clip_ratio/high_max": 0.0018154183635488153, "clip_ratio/high_mean": 0.0007742491252429318, "clip_ratio/low_mean": 0.0008142020378727466, "clip_ratio/low_min": 3.547105734469369e-05, "clip_ratio/region_mean": 0.0015884511813055724, "epoch": 0.14177297890088608, "grad_norm": 0.1113245040178299, "learning_rate": 2e-07, "loss": 0.0302, "step": 1519 }, { "clip_ratio/high_max": 0.001867379163741134, "clip_ratio/high_mean": 0.0007851826512705884, "clip_ratio/low_mean": 0.000828938078484498, "clip_ratio/low_min": 1.5078408068802673e-05, "clip_ratio/region_mean": 0.0016141207233886234, "epoch": 0.14186631200088667, "grad_norm": 0.103634312748909, "learning_rate": 2e-07, "loss": 0.047, "step": 1520 }, { "clip_ratio/high_max": 0.0020819746714551, "clip_ratio/high_mean": 0.0008627369279565755, "clip_ratio/low_mean": 0.0008915250909922179, "clip_ratio/low_min": 3.011122407770017e-05, "clip_ratio/region_mean": 0.0017542620335007086, "epoch": 0.14195964510088724, "grad_norm": 0.12072388827800751, "learning_rate": 2e-07, "loss": 0.0069, "step": 1521 }, { "clip_ratio/high_max": 0.002021434840571601, "clip_ratio/high_mean": 0.0007647829770576209, "clip_ratio/low_mean": 0.0009336629082099535, "clip_ratio/low_min": 0.00013893858613300836, "clip_ratio/region_mean": 0.0016984458707156591, "epoch": 0.14205297820088783, "grad_norm": 0.12055246531963348, "learning_rate": 2e-07, "loss": 0.0615, "step": 1522 }, { "clip_ratio/high_max": 0.0019374444818822667, "clip_ratio/high_mean": 0.0008046184120757971, "clip_ratio/low_mean": 0.0007530772363679716, "clip_ratio/low_min": 3.1546022910333704e-05, "clip_ratio/region_mean": 0.0015576956066070125, "epoch": 0.14214631130088842, "grad_norm": 0.11107288300991058, "learning_rate": 2e-07, "loss": 0.0116, "step": 1523 }, { "clip_ratio/high_max": 0.0017896928075060714, "clip_ratio/high_mean": 0.000755719205699279, "clip_ratio/low_mean": 0.0008514986457157647, "clip_ratio/low_min": 6.997356740612304e-05, "clip_ratio/region_mean": 0.0016072178586910013, "epoch": 0.142239644400889, "grad_norm": 0.11630631238222122, "learning_rate": 2e-07, "loss": 0.0047, "step": 1524 }, { "clip_ratio/high_max": 0.0017506766453152522, "clip_ratio/high_mean": 0.0008130429241646198, "clip_ratio/low_mean": 0.0007718485949226306, "clip_ratio/low_min": 5.3715149078925606e-05, "clip_ratio/region_mean": 0.0015848915427341126, "epoch": 0.14233297750088958, "grad_norm": 0.10503137111663818, "learning_rate": 2e-07, "loss": 0.0218, "step": 1525 }, { "clip_ratio/high_max": 0.002142649202141911, "clip_ratio/high_mean": 0.000837158117974468, "clip_ratio/low_mean": 0.0009825169654504862, "clip_ratio/low_min": 0.0001420626213075593, "clip_ratio/region_mean": 0.0018196750606875867, "epoch": 0.14242631060089017, "grad_norm": 0.1174115315079689, "learning_rate": 2e-07, "loss": 0.0797, "step": 1526 }, { "clip_ratio/high_max": 0.0018990368371305522, "clip_ratio/high_mean": 0.0007230203591461759, "clip_ratio/low_mean": 0.0007963449470480555, "clip_ratio/low_min": 4.735834500024794e-05, "clip_ratio/region_mean": 0.0015193653307505883, "epoch": 0.14251964370089074, "grad_norm": 0.10034012794494629, "learning_rate": 2e-07, "loss": 0.063, "step": 1527 }, { "clip_ratio/high_max": 0.002034477085544495, "clip_ratio/high_mean": 0.0008681693652761169, "clip_ratio/low_mean": 0.0008769346377448528, "clip_ratio/low_min": 6.0233365729800425e-05, "clip_ratio/region_mean": 0.0017451039784646127, "epoch": 0.14261297680089133, "grad_norm": 0.11025414615869522, "learning_rate": 2e-07, "loss": 0.0079, "step": 1528 }, { "clip_ratio/high_max": 0.0020003587123937905, "clip_ratio/high_mean": 0.000814242999695125, "clip_ratio/low_mean": 0.0009503914334345609, "clip_ratio/low_min": 0.00011470340723462868, "clip_ratio/region_mean": 0.0017646344349486753, "epoch": 0.14270630990089192, "grad_norm": 0.10999526083469391, "learning_rate": 2e-07, "loss": 0.037, "step": 1529 }, { "clip_ratio/high_max": 0.002087390013912227, "clip_ratio/high_mean": 0.0008566482247260865, "clip_ratio/low_mean": 0.000803464334239834, "clip_ratio/low_min": 0.00010332357487641275, "clip_ratio/region_mean": 0.001660112538957037, "epoch": 0.14279964300089248, "grad_norm": 0.12125776708126068, "learning_rate": 2e-07, "loss": 0.0259, "step": 1530 }, { "clip_ratio/high_max": 0.0023631213225598913, "clip_ratio/high_mean": 0.0008939637173170922, "clip_ratio/low_mean": 0.00078144368762878, "clip_ratio/low_min": 7.081871626724023e-05, "clip_ratio/region_mean": 0.0016754074313212186, "epoch": 0.14289297610089308, "grad_norm": 0.10925637185573578, "learning_rate": 2e-07, "loss": 0.0014, "step": 1531 }, { "clip_ratio/high_max": 0.0018179905127908569, "clip_ratio/high_mean": 0.0007888502750574844, "clip_ratio/low_mean": 0.0008102209812932415, "clip_ratio/low_min": 0.00012884569878224283, "clip_ratio/region_mean": 0.0015990712272468954, "epoch": 0.14298630920089367, "grad_norm": 0.12259503453969955, "learning_rate": 2e-07, "loss": 0.0405, "step": 1532 }, { "clip_ratio/high_max": 0.001834605343901785, "clip_ratio/high_mean": 0.0007581517238577362, "clip_ratio/low_mean": 0.000950851957895793, "clip_ratio/low_min": 5.6370729453192325e-05, "clip_ratio/region_mean": 0.001709003703581402, "epoch": 0.14307964230089426, "grad_norm": 0.11578698456287384, "learning_rate": 2e-07, "loss": 0.0543, "step": 1533 }, { "clip_ratio/high_max": 0.002065629596472718, "clip_ratio/high_mean": 0.0008612626588728745, "clip_ratio/low_mean": 0.0008895626924640965, "clip_ratio/low_min": 5.976615102554206e-05, "clip_ratio/region_mean": 0.001750825351336971, "epoch": 0.14317297540089483, "grad_norm": 0.11130835860967636, "learning_rate": 2e-07, "loss": 0.0154, "step": 1534 }, { "clip_ratio/high_max": 0.0020197745616314933, "clip_ratio/high_mean": 0.0007777186747262022, "clip_ratio/low_mean": 0.0008490165237162728, "clip_ratio/low_min": 8.064355552050984e-05, "clip_ratio/region_mean": 0.0016267351966234855, "epoch": 0.14326630850089542, "grad_norm": 0.10941354930400848, "learning_rate": 2e-07, "loss": 0.0024, "step": 1535 }, { "clip_ratio/high_max": 0.0022591087072214577, "clip_ratio/high_mean": 0.0008735082737985067, "clip_ratio/low_mean": 0.0007928938393888529, "clip_ratio/low_min": 2.6658493879949674e-05, "clip_ratio/region_mean": 0.0016664020804455504, "epoch": 0.143359641600896, "grad_norm": 0.12084412574768066, "learning_rate": 2e-07, "loss": 0.0206, "step": 1536 }, { "clip_ratio/high_max": 0.0, "clip_ratio/high_mean": 0.0, "clip_ratio/low_mean": 0.0, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0, "completions/clipped_ratio": 0.014552525111607095, "completions/max_length": 4096.0, "completions/max_terminated_length": 4095.0, "completions/mean_length": 612.552490234375, "completions/mean_terminated_length": 561.1109619140625, "completions/min_length": 5.0, "completions/min_terminated_length": 5.0, "epoch": 0.14345297470089657, "grad_norm": 0.11977797001600266, "learning_rate": 2e-07, "loss": 0.0323, "num_tokens": 1063213677.0, "reward": 0.5939767360687256, "reward_std": 0.1922587752342224, "rewards/simpleverify_reward/mean": 0.5939766764640808, "rewards/simpleverify_reward/std": 0.49109113216400146, "step": 1537 }, { "clip_ratio/high_max": 0.001969095101230778, "clip_ratio/high_mean": 0.0007721421370661119, "clip_ratio/low_mean": 0.0006108947491156869, "clip_ratio/low_min": 8.397766032430809e-05, "clip_ratio/region_mean": 0.001383036891638767, "epoch": 0.14354630780089717, "grad_norm": 0.11352571099996567, "learning_rate": 2e-07, "loss": 0.01, "step": 1538 }, { "clip_ratio/high_max": 0.0017376322866766714, "clip_ratio/high_mean": 0.0006606369288419955, "clip_ratio/low_mean": 0.0006106126838858472, "clip_ratio/low_min": 3.192048188793706e-05, "clip_ratio/region_mean": 0.0012712495881714858, "epoch": 0.14363964090089776, "grad_norm": 0.12572240829467773, "learning_rate": 2e-07, "loss": 0.078, "step": 1539 }, { "clip_ratio/high_max": 0.0021605878573609516, "clip_ratio/high_mean": 0.0008464278107567225, "clip_ratio/low_mean": 0.0005165131078683771, "clip_ratio/low_min": 1.4114724763203412e-05, "clip_ratio/region_mean": 0.0013629409040731844, "epoch": 0.14373297400089832, "grad_norm": 0.11081253737211227, "learning_rate": 2e-07, "loss": -0.0041, "step": 1540 }, { "clip_ratio/high_max": 0.001996835148020182, "clip_ratio/high_mean": 0.000863813744217623, "clip_ratio/low_mean": 0.0005997594016662333, "clip_ratio/low_min": 7.248619658639655e-05, "clip_ratio/region_mean": 0.0014635731786256656, "epoch": 0.14382630710089891, "grad_norm": 0.12655508518218994, "learning_rate": 2e-07, "loss": 0.0059, "step": 1541 }, { "clip_ratio/high_max": 0.002088934794301167, "clip_ratio/high_mean": 0.0007892701523815049, "clip_ratio/low_mean": 0.000606626305852842, "clip_ratio/low_min": 0.0, "clip_ratio/region_mean": 0.0013958964736957569, "epoch": 0.1439196402008995, "grad_norm": 0.12356770038604736, "learning_rate": 2e-07, "loss": 0.0608, "step": 1542 }, { "clip_ratio/high_max": 0.0018853509391192347, "clip_ratio/high_mean": 0.0008113472831610125, "clip_ratio/low_mean": 0.0005883052981516812, "clip_ratio/low_min": 8.606023584434297e-05, "clip_ratio/region_mean": 0.0013996525849506725, "epoch": 0.14401297330090007, "grad_norm": 0.11853167414665222, "learning_rate": 2e-07, "loss": 0.0475, "step": 1543 }, { "clip_ratio/high_max": 0.0017803561167966109, "clip_ratio/high_mean": 0.0007005601019045571, "clip_ratio/low_mean": 0.0006159584354463732, "clip_ratio/low_min": 5.772756048827432e-05, "clip_ratio/region_mean": 0.0013165185191610362, "epoch": 0.14410630640090066, "grad_norm": 0.11867249757051468, "learning_rate": 2e-07, "loss": -0.0156, "step": 1544 }, { "clip_ratio/high_max": 0.0022019757889211178, "clip_ratio/high_mean": 0.0009056374747160589, "clip_ratio/low_mean": 0.0006331138883979293, "clip_ratio/low_min": 4.4118483856436796e-05, "clip_ratio/region_mean": 0.001538751348562073, "epoch": 0.14419963950090126, "grad_norm": 0.12584801018238068, "learning_rate": 2e-07, "loss": -0.0025, "step": 1545 }, { "clip_ratio/high_max": 0.002090104328090092, "clip_ratio/high_mean": 0.0007946690911921905, "clip_ratio/low_mean": 0.0005864782269782154, "clip_ratio/low_min": 4.910013876724406e-05, "clip_ratio/region_mean": 0.0013811473218083847, "epoch": 0.14429297260090182, "grad_norm": 0.11705493927001953, "learning_rate": 2e-07, "loss": 0.0641, "step": 1546 }, { "clip_ratio/high_max": 0.0019310154239065014, "clip_ratio/high_mean": 0.0008474859168927651, "clip_ratio/low_mean": 0.0005446702907647705, "clip_ratio/low_min": 7.532843028457137e-06, "clip_ratio/region_mean": 0.0013921562058385462, "epoch": 0.1443863057009024, "grad_norm": 0.12216715514659882, "learning_rate": 2e-07, "loss": -0.0139, "step": 1547 }, { "clip_ratio/high_max": 0.0019308718910906464, "clip_ratio/high_mean": 0.0008004292903933674, "clip_ratio/low_mean": 0.000580620976506907, "clip_ratio/low_min": 5.637379308609525e-05, "clip_ratio/region_mean": 0.0013810503005515784, "epoch": 0.144479638800903, "grad_norm": 0.11339802294969559, "learning_rate": 2e-07, "loss": -0.0233, "step": 1548 }, { "clip_ratio/high_max": 0.0020135991617280524, "clip_ratio/high_mean": 0.0007304686905627022, "clip_ratio/low_mean": 0.0006219767819857225, "clip_ratio/low_min": 1.2074960977770388e-05, "clip_ratio/region_mean": 0.0013524454698199406, "epoch": 0.14457297190090357, "grad_norm": 0.1118064597249031, "learning_rate": 2e-07, "loss": 0.0151, "step": 1549 }, { "clip_ratio/high_max": 0.0018665300631255377, "clip_ratio/high_mean": 0.0007987244753167033, "clip_ratio/low_mean": 0.0005590919936366845, "clip_ratio/low_min": 1.8998319319507573e-05, "clip_ratio/region_mean": 0.001357816465315409, "epoch": 0.14466630500090416, "grad_norm": 0.11731677502393723, "learning_rate": 2e-07, "loss": 0.0004, "step": 1550 }, { "clip_ratio/high_max": 0.0017867107126221526, "clip_ratio/high_mean": 0.0008168059903255198, "clip_ratio/low_mean": 0.0005840759858983802, "clip_ratio/low_min": 7.3149675699824e-05, "clip_ratio/region_mean": 0.0014008819744049106, "epoch": 0.14475963810090475, "grad_norm": 0.11835388839244843, "learning_rate": 2e-07, "loss": 0.0149, "step": 1551 }, { "clip_ratio/high_max": 0.0020975028455723077, "clip_ratio/high_mean": 0.0008106478853733279, "clip_ratio/low_mean": 0.0006947967885935213, "clip_ratio/low_min": 5.5110374887590297e-05, "clip_ratio/region_mean": 0.0015054446521389764, "epoch": 0.14485297120090532, "grad_norm": 0.13253165781497955, "learning_rate": 2e-07, "loss": 0.0669, "step": 1552 }, { "clip_ratio/high_max": 0.0018878041264542844, "clip_ratio/high_mean": 0.000813415626907954, "clip_ratio/low_mean": 0.0006846273518021917, "clip_ratio/low_min": 6.534951717185322e-05, "clip_ratio/region_mean": 0.0014980429587012623, "epoch": 0.1449463043009059, "grad_norm": 0.12443888187408447, "learning_rate": 2e-07, "loss": 0.0496, "step": 1553 }, { "clip_ratio/high_max": 0.0021779153939860407, "clip_ratio/high_mean": 0.0008605948969488963, "clip_ratio/low_mean": 0.0005926566991547588, "clip_ratio/low_min": 3.846624713332858e-05, "clip_ratio/region_mean": 0.0014532515924656764, "epoch": 0.1450396374009065, "grad_norm": 0.1230318695306778, "learning_rate": 2e-07, "loss": -0.0208, "step": 1554 }, { "clip_ratio/high_max": 0.0017662104619375896, "clip_ratio/high_mean": 0.000639839488940197, "clip_ratio/low_mean": 0.0006914896657690406, "clip_ratio/low_min": 5.728960513806669e-05, "clip_ratio/region_mean": 0.0013313291055965237, "epoch": 0.1451329705009071, "grad_norm": 0.11071933805942535, "learning_rate": 2e-07, "loss": 0.0492, "step": 1555 }, { "clip_ratio/high_max": 0.0017915999742399435, "clip_ratio/high_mean": 0.0007930038264021277, "clip_ratio/low_mean": 0.0007293668768397765, "clip_ratio/low_min": 8.000021534826374e-05, "clip_ratio/region_mean": 0.0015223707014229149, "epoch": 0.14522630360090766, "grad_norm": 0.11627659946680069, "learning_rate": 2e-07, "loss": 0.0146, "step": 1556 }, { "clip_ratio/high_max": 0.0021358071971917525, "clip_ratio/high_mean": 0.0007584547347505577, "clip_ratio/low_mean": 0.0006738164065609453, "clip_ratio/low_min": 2.1959918740321882e-05, "clip_ratio/region_mean": 0.0014322711394925136, "epoch": 0.14531963670090825, "grad_norm": 0.11754827201366425, "learning_rate": 2e-07, "loss": 0.0529, "step": 1557 }, { "clip_ratio/high_max": 0.001903148164274171, "clip_ratio/high_mean": 0.0007298568070837064, "clip_ratio/low_mean": 0.0006007725178278633, "clip_ratio/low_min": 3.835231109405868e-05, "clip_ratio/region_mean": 0.0013306293003552128, "epoch": 0.14541296980090884, "grad_norm": 0.11277376860380173, "learning_rate": 2e-07, "loss": 0.031, "step": 1558 }, { "clip_ratio/high_max": 0.0017083734055631794, "clip_ratio/high_mean": 0.0007156690280680778, "clip_ratio/low_mean": 0.0006714164001095924, "clip_ratio/low_min": 2.9805961275997106e-05, "clip_ratio/region_mean": 0.0013870854854758363, "epoch": 0.1455063029009094, "grad_norm": 0.11422629654407501, "learning_rate": 2e-07, "loss": 0.0285, "step": 1559 }, { "clip_ratio/high_max": 0.0022567410560441203, "clip_ratio/high_mean": 0.0008304407965624705, "clip_ratio/low_mean": 0.0007039722095214529, "clip_ratio/low_min": 7.493058365071192e-05, "clip_ratio/region_mean": 0.001534413022454828, "epoch": 0.14559963600091, "grad_norm": 0.11293085664510727, "learning_rate": 2e-07, "loss": 0.0372, "step": 1560 }, { "clip_ratio/high_max": 0.0020565335798892193, "clip_ratio/high_mean": 0.0008798873932391871, "clip_ratio/low_mean": 0.0007346973079620511, "clip_ratio/low_min": 3.7973635699017905e-05, "clip_ratio/region_mean": 0.0016145847039297223, "epoch": 0.1456929691009106, "grad_norm": 0.12151321768760681, "learning_rate": 2e-07, "loss": 0.0211, "step": 1561 }, { "clip_ratio/high_max": 0.0016882996933418326, "clip_ratio/high_mean": 0.0006565985495399218, "clip_ratio/low_mean": 0.0006183458826853894, "clip_ratio/low_min": 1.6609088561381213e-05, "clip_ratio/region_mean": 0.0012749444140354171, "epoch": 0.14578630220091116, "grad_norm": 0.11804751306772232, "learning_rate": 2e-07, "loss": 0.0299, "step": 1562 }, { "clip_ratio/high_max": 0.0026345511141698807, "clip_ratio/high_mean": 0.0009750439530762378, "clip_ratio/low_mean": 0.000547631749213906, "clip_ratio/low_min": 1.0261041097692214e-05, "clip_ratio/region_mean": 0.0015226757204800379, "epoch": 0.14587963530091175, "grad_norm": 0.11607442051172256, "learning_rate": 2e-07, "loss": -0.0334, "step": 1563 }, { "clip_ratio/high_max": 0.002052434043434914, "clip_ratio/high_mean": 0.0007492262902815128, "clip_ratio/low_mean": 0.0008021478643058799, "clip_ratio/low_min": 2.683416551008122e-05, "clip_ratio/region_mean": 0.0015513741236645728, "epoch": 0.14597296840091234, "grad_norm": 0.11416371166706085, "learning_rate": 2e-07, "loss": 0.0397, "step": 1564 }, { "clip_ratio/high_max": 0.0018990007010870613, "clip_ratio/high_mean": 0.0008318721957039088, "clip_ratio/low_mean": 0.0006334550607789424, "clip_ratio/low_min": 2.391429188719485e-05, "clip_ratio/region_mean": 0.0014653272592113353, "epoch": 0.1460663015009129, "grad_norm": 0.13010713458061218, "learning_rate": 2e-07, "loss": -0.0099, "step": 1565 }, { "clip_ratio/high_max": 0.0021414379189081956, "clip_ratio/high_mean": 0.0008656622248963686, "clip_ratio/low_mean": 0.0007191951135609997, "clip_ratio/low_min": 3.834687049675267e-05, "clip_ratio/region_mean": 0.0015848573384573683, "epoch": 0.1461596346009135, "grad_norm": 0.11567758768796921, "learning_rate": 2e-07, "loss": 0.0392, "step": 1566 }, { "clip_ratio/high_max": 0.001935828917339677, "clip_ratio/high_mean": 0.0007625206289958442, "clip_ratio/low_mean": 0.0008674328255438013, "clip_ratio/low_min": 0.00011482445461297175, "clip_ratio/region_mean": 0.0016299534399877302, "epoch": 0.1462529677009141, "grad_norm": 0.1291351169347763, "learning_rate": 2e-07, "loss": 0.1015, "step": 1567 }, { "clip_ratio/high_max": 0.0018762724976113532, "clip_ratio/high_mean": 0.0007961198007251369, "clip_ratio/low_mean": 0.0007469664169548196, "clip_ratio/low_min": 1.7043905245373026e-05, "clip_ratio/region_mean": 0.0015430862113134935, "epoch": 0.14634630080091465, "grad_norm": 0.10462664812803268, "learning_rate": 2e-07, "loss": 0.0328, "step": 1568 }, { "clip_ratio/high_max": 0.0021119414741406217, "clip_ratio/high_mean": 0.0008753330021136208, "clip_ratio/low_mean": 0.0007747490853944328, "clip_ratio/low_min": 1.7020696759573184e-05, "clip_ratio/region_mean": 0.0016500820711371489, "epoch": 0.14643963390091524, "grad_norm": 0.12263359874486923, "learning_rate": 2e-07, "loss": 0.0112, "step": 1569 }, { "clip_ratio/high_max": 0.0018372777667536866, "clip_ratio/high_mean": 0.0008107521116471617, "clip_ratio/low_mean": 0.0006573164473593351, "clip_ratio/low_min": 4.589958234646474e-05, "clip_ratio/region_mean": 0.0014680685744679067, "epoch": 0.14653296700091584, "grad_norm": 0.11053671687841415, "learning_rate": 2e-07, "loss": 0.0201, "step": 1570 }, { "clip_ratio/high_max": 0.001631954906770261, "clip_ratio/high_mean": 0.000687703295625397, "clip_ratio/low_mean": 0.0007275756579474546, "clip_ratio/low_min": 0.0001236224125023, "clip_ratio/region_mean": 0.0014152789517538622, "epoch": 0.1466263001009164, "grad_norm": 0.11256250739097595, "learning_rate": 2e-07, "loss": 0.0076, "step": 1571 }, { "clip_ratio/high_max": 0.002314045137609355, "clip_ratio/high_mean": 0.0009373185548611218, "clip_ratio/low_mean": 0.0005701866430172231, "clip_ratio/low_min": 8.774392881605309e-06, "clip_ratio/region_mean": 0.0015075051778694615, "epoch": 0.146719633200917, "grad_norm": 0.11756494641304016, "learning_rate": 2e-07, "loss": -0.047, "step": 1572 }, { "clip_ratio/high_max": 0.0015228014526655897, "clip_ratio/high_mean": 0.0006248222653084667, "clip_ratio/low_mean": 0.0007792311716912081, "clip_ratio/low_min": 3.553479746187804e-05, "clip_ratio/region_mean": 0.0014040534588275477, "epoch": 0.14681296630091759, "grad_norm": 0.10734254121780396, "learning_rate": 2e-07, "loss": 0.0503, "step": 1573 }, { "clip_ratio/high_max": 0.0019816477797576226, "clip_ratio/high_mean": 0.0007934069726616144, "clip_ratio/low_mean": 0.0007646653748452081, "clip_ratio/low_min": 7.578433542221319e-05, "clip_ratio/region_mean": 0.0015580723484163173, "epoch": 0.14690629940091818, "grad_norm": 0.1325664520263672, "learning_rate": 2e-07, "loss": 0.008, "step": 1574 }, { "clip_ratio/high_max": 0.001978918538952712, "clip_ratio/high_mean": 0.0007869852743169758, "clip_ratio/low_mean": 0.0007342981425608741, "clip_ratio/low_min": 8.052799967117608e-05, "clip_ratio/region_mean": 0.0015212834150588606, "epoch": 0.14699963250091874, "grad_norm": 0.10760325938463211, "learning_rate": 2e-07, "loss": 0.0331, "step": 1575 }, { "clip_ratio/high_max": 0.0021623551947413944, "clip_ratio/high_mean": 0.0008246717061410891, "clip_ratio/low_mean": 0.0008150641078827903, "clip_ratio/low_min": 6.586486961168703e-05, "clip_ratio/region_mean": 0.0016397358267568052, "epoch": 0.14709296560091933, "grad_norm": 0.12199617922306061, "learning_rate": 2e-07, "loss": 0.0197, "step": 1576 }, { "clip_ratio/high_max": 0.0019634232958196662, "clip_ratio/high_mean": 0.0007764750262140296, "clip_ratio/low_mean": 0.0007462475041393191, "clip_ratio/low_min": 1.0824384844454471e-05, "clip_ratio/region_mean": 0.0015227225521812215, "epoch": 0.14718629870091993, "grad_norm": 0.11231967061758041, "learning_rate": 2e-07, "loss": -0.0182, "step": 1577 }, { "clip_ratio/high_max": 0.001720855540042976, "clip_ratio/high_mean": 0.0007278201956069097, "clip_ratio/low_mean": 0.0007924207529867999, "clip_ratio/low_min": 5.304842943587573e-05, "clip_ratio/region_mean": 0.0015202409122139215, "epoch": 0.1472796318009205, "grad_norm": 0.11937659978866577, "learning_rate": 2e-07, "loss": 0.039, "step": 1578 }, { "clip_ratio/high_max": 0.001970176846953109, "clip_ratio/high_mean": 0.0008720655368961161, "clip_ratio/low_mean": 0.0008554398427804699, "clip_ratio/low_min": 0.0001231684145750478, "clip_ratio/region_mean": 0.00172750539786648, "epoch": 0.14737296490092108, "grad_norm": 0.12547583878040314, "learning_rate": 2e-07, "loss": -0.006, "step": 1579 }, { "clip_ratio/high_max": 0.0022084797237766907, "clip_ratio/high_mean": 0.0009102516742132138, "clip_ratio/low_mean": 0.0007319341120819445, "clip_ratio/low_min": 9.836914614425041e-05, "clip_ratio/region_mean": 0.0016421858017565683, "epoch": 0.14746629800092168, "grad_norm": 0.12562039494514465, "learning_rate": 2e-07, "loss": 0.0072, "step": 1580 }, { "clip_ratio/high_max": 0.002089322944812011, "clip_ratio/high_mean": 0.0008389055692532565, "clip_ratio/low_mean": 0.0007702347420490696, "clip_ratio/low_min": 4.460462514543906e-05, "clip_ratio/region_mean": 0.0016091403049358632, "epoch": 0.14755963110092224, "grad_norm": 0.11965224891901016, "learning_rate": 2e-07, "loss": 0.0322, "step": 1581 }, { "clip_ratio/high_max": 0.0020219165198795963, "clip_ratio/high_mean": 0.0007996965705387993, "clip_ratio/low_mean": 0.0007333528501476394, "clip_ratio/low_min": 1.7314487195108086e-05, "clip_ratio/region_mean": 0.0015330494097725023, "epoch": 0.14765296420092283, "grad_norm": 0.11467674374580383, "learning_rate": 2e-07, "loss": 0.0456, "step": 1582 }, { "clip_ratio/high_max": 0.002188824913901044, "clip_ratio/high_mean": 0.0008527392456016969, "clip_ratio/low_mean": 0.0007600166973134037, "clip_ratio/low_min": 4.956191241944907e-05, "clip_ratio/region_mean": 0.0016127559283631854, "epoch": 0.14774629730092342, "grad_norm": 0.1122947409749031, "learning_rate": 2e-07, "loss": 0.0192, "step": 1583 }, { "clip_ratio/high_max": 0.0019403612459427677, "clip_ratio/high_mean": 0.0007310775044970796, "clip_ratio/low_mean": 0.0007142092545109335, "clip_ratio/low_min": 8.03355924290372e-05, "clip_ratio/region_mean": 0.0014452867508225609, "epoch": 0.147839630400924, "grad_norm": 0.10535921901464462, "learning_rate": 2e-07, "loss": 0.034, "step": 1584 }, { "clip_ratio/high_max": 0.001952923063072376, "clip_ratio/high_mean": 0.0008673034189996542, "clip_ratio/low_mean": 0.0007378432101177168, "clip_ratio/low_min": 1.5367591913673095e-05, "clip_ratio/region_mean": 0.0016051466009230353, "epoch": 0.14793296350092458, "grad_norm": 0.11429724097251892, "learning_rate": 2e-07, "loss": -0.0141, "step": 1585 }, { "clip_ratio/high_max": 0.0016909778678382281, "clip_ratio/high_mean": 0.0006661737106696819, "clip_ratio/low_mean": 0.0008987397013697773, "clip_ratio/low_min": 4.462033939489629e-05, "clip_ratio/region_mean": 0.001564913400216028, "epoch": 0.14802629660092517, "grad_norm": 0.12109814584255219, "learning_rate": 2e-07, "loss": 0.0651, "step": 1586 }, { "clip_ratio/high_max": 0.002246947664389154, "clip_ratio/high_mean": 0.0008479341140628094, "clip_ratio/low_mean": 0.0008749490771151613, "clip_ratio/low_min": 9.645597674534656e-05, "clip_ratio/region_mean": 0.0017228831857210025, "epoch": 0.14811962970092574, "grad_norm": 0.12280218303203583, "learning_rate": 2e-07, "loss": 0.0337, "step": 1587 }, { "clip_ratio/high_max": 0.002073892257612897, "clip_ratio/high_mean": 0.0007898363128333585, "clip_ratio/low_mean": 0.0008486050373903709, "clip_ratio/low_min": 6.957189543754794e-05, "clip_ratio/region_mean": 0.0016384413647756446, "epoch": 0.14821296280092633, "grad_norm": 0.12390957027673721, "learning_rate": 2e-07, "loss": 0.0352, "step": 1588 }, { "clip_ratio/high_max": 0.002167145808925852, "clip_ratio/high_mean": 0.0009117706758843269, "clip_ratio/low_mean": 0.0007248833189805737, "clip_ratio/low_min": 1.5470297512365505e-05, "clip_ratio/region_mean": 0.00163665399668389, "epoch": 0.14830629590092692, "grad_norm": 0.1179620698094368, "learning_rate": 2e-07, "loss": 0.0183, "step": 1589 }, { "clip_ratio/high_max": 0.0017312454765487928, "clip_ratio/high_mean": 0.0007215636105684098, "clip_ratio/low_mean": 0.0007692145527471439, "clip_ratio/low_min": 1.8939394067274407e-05, "clip_ratio/region_mean": 0.0014907781660440378, "epoch": 0.14839962900092749, "grad_norm": 0.1291106790304184, "learning_rate": 2e-07, "loss": 0.0299, "step": 1590 }, { "clip_ratio/high_max": 0.0020729234456666745, "clip_ratio/high_mean": 0.000813857341199764, "clip_ratio/low_mean": 0.0008116104363580234, "clip_ratio/low_min": 0.00012043855258525582, "clip_ratio/region_mean": 0.0016254677793767769, "epoch": 0.14849296210092808, "grad_norm": 0.1256583333015442, "learning_rate": 2e-07, "loss": 0.0221, "step": 1591 }, { "clip_ratio/high_max": 0.001882519238279201, "clip_ratio/high_mean": 0.000749555330912699, "clip_ratio/low_mean": 0.0008001126170711359, "clip_ratio/low_min": 3.146855442537344e-05, "clip_ratio/region_mean": 0.0015496679188800044, "epoch": 0.14858629520092867, "grad_norm": 0.11073312908411026, "learning_rate": 2e-07, "loss": 0.0086, "step": 1592 }, { "clip_ratio/high_max": 0.0017294862918788567, "clip_ratio/high_mean": 0.000679197632962314, "clip_ratio/low_mean": 0.0009060169295480591, "clip_ratio/low_min": 0.00012911499288748018, "clip_ratio/region_mean": 0.0015852145988901611, "epoch": 0.14867962830092923, "grad_norm": 0.4138675928115845, "learning_rate": 2e-07, "loss": 0.0785, "step": 1593 }, { "clip_ratio/high_max": 0.0018686345720198005, "clip_ratio/high_mean": 0.0008538245274394285, "clip_ratio/low_mean": 0.0006974737843847834, "clip_ratio/low_min": 6.155585742817493e-05, "clip_ratio/region_mean": 0.0015512983445660211, "epoch": 0.14877296140092983, "grad_norm": 0.11856398731470108, "learning_rate": 2e-07, "loss": 0.0183, "step": 1594 }, { "clip_ratio/high_max": 0.0015594684809911996, "clip_ratio/high_mean": 0.0006723962051182752, "clip_ratio/low_mean": 0.0007374149272436625, "clip_ratio/low_min": 2.266978390252916e-05, "clip_ratio/region_mean": 0.0014098111641942523, "epoch": 0.14886629450093042, "grad_norm": 0.11258701235055923, "learning_rate": 2e-07, "loss": 0.0445, "step": 1595 }, { "clip_ratio/high_max": 0.0019473644097161014, "clip_ratio/high_mean": 0.0007636729969817679, "clip_ratio/low_mean": 0.000789721073488181, "clip_ratio/low_min": 6.965963984839618e-05, "clip_ratio/region_mean": 0.0015533941186731681, "epoch": 0.148959627600931, "grad_norm": 0.11592815816402435, "learning_rate": 2e-07, "loss": 0.0745, "step": 1596 }, { "clip_ratio/high_max": 0.0019205576027161442, "clip_ratio/high_mean": 0.0007645352516192361, "clip_ratio/low_mean": 0.0008127012406475842, "clip_ratio/low_min": 5.431197041616542e-05, "clip_ratio/region_mean": 0.0015772364822623786, "epoch": 0.14905296070093157, "grad_norm": 0.12033629417419434, "learning_rate": 2e-07, "loss": 0.0464, "step": 1597 }, { "clip_ratio/high_max": 0.002274166683491785, "clip_ratio/high_mean": 0.0009129213376581902, "clip_ratio/low_mean": 0.0007686048566029058, "clip_ratio/low_min": 4.6083645429462194e-05, "clip_ratio/region_mean": 0.0016815261806186754, "epoch": 0.14914629380093217, "grad_norm": 0.11660020798444748, "learning_rate": 2e-07, "loss": 0.0012, "step": 1598 }, { "clip_ratio/high_max": 0.002078795379929943, "clip_ratio/high_mean": 0.0008251310155173996, "clip_ratio/low_mean": 0.0008992719558591489, "clip_ratio/low_min": 6.815252982050879e-05, "clip_ratio/region_mean": 0.0017244029659195803, "epoch": 0.14923962690093276, "grad_norm": 0.12410469353199005, "learning_rate": 2e-07, "loss": 0.0629, "step": 1599 }, { "clip_ratio/high_max": 0.0017782713985070586, "clip_ratio/high_mean": 0.0006739672189723933, "clip_ratio/low_mean": 0.0009550681552354945, "clip_ratio/low_min": 7.757994717394467e-05, "clip_ratio/region_mean": 0.0016290353814838454, "epoch": 0.14933296000093332, "grad_norm": 0.12016419321298599, "learning_rate": 2e-07, "loss": 0.0516, "step": 1600 }, { "epoch": 0.14933296000093332, "step": 1600, "total_flos": 0.0, "train_loss": 0.024036576095278973, "train_runtime": 114730.7194, "train_samples_per_second": 12.495, "train_steps_per_second": 0.014 } ], "logging_steps": 1, "max_steps": 1600, "num_input_tokens_seen": 1063213677, "num_train_epochs": 1, "save_steps": 160, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 0.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }