{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.41975607329287956, "bleu_stderr": 0.0290900789860069, "rouge1_fmeasure": 0.11806959803903948, "rouge1_fmeasure_stderr": 0.0020779281759781614, "rouge1_precision": 0.07902286487648982, "rouge1_precision_stderr": 0.0017692797192929858, "rouge1_recall": 0.33932196413922855, "rouge1_recall_stderr": 0.005426202467814663, "rouge2_fmeasure": 0.05407292240009696, "rouge2_fmeasure_stderr": 0.0012593686511145933, "rouge2_precision": 0.03645056474058315, "rouge2_precision_stderr": 0.0011698798019417287, "rouge2_recall": 0.1595754862930624, "rouge2_recall_stderr": 0.0033969223420483963, "rougeL_fmeasure": 0.11264814453519295, "rougeL_fmeasure_stderr": 0.0019096220591269593, "rougeL_precision": 0.07521164191664043, "rougeL_precision_stderr": 0.0016373524317681752, "rougeL_recall": 0.3266931469021551, "rougeL_recall_stderr": 0.005207483059054346, "rougeLsum_fmeasure": 0.11109795344198757, "rougeLsum_fmeasure_stderr": 0.0019508680245213894, "rougeLsum_precision": 0.07449989577421517, "rougeLsum_precision_stderr": 0.0016763730170273655, "rougeLsum_recall": 0.317453644006743, "rougeLsum_recall_stderr": 0.004951780039647604}}, "1": {"PALM_prompt": {"bleu": 0.5769814528994545, "bleu_stderr": 0.025193197721755753, "rouge1_fmeasure": 0.1758582381899693, "rouge1_fmeasure_stderr": 0.003983955125647839, "rouge1_precision": 0.14795332919508947, "rouge1_precision_stderr": 0.004555957390491558, "rouge1_recall": 0.34465037640742197, "rouge1_recall_stderr": 0.005138912085240675, "rouge2_fmeasure": 0.08916041446550299, "rouge2_fmeasure_stderr": 0.0027334564814069677, "rouge2_precision": 0.07528809142549421, "rouge2_precision_stderr": 0.003038187204272963, "rouge2_recall": 0.17791285817633576, "rouge2_recall_stderr": 0.003715854466399584, "rougeL_fmeasure": 0.15931010273605145, "rougeL_fmeasure_stderr": 0.003407821554998019, "rougeL_precision": 0.13248575395781848, "rougeL_precision_stderr": 0.003956867634958241, "rougeL_recall": 0.3221858919798644, "rougeL_recall_stderr": 0.004720579998249014, "rougeLsum_fmeasure": 0.16270655720379557, "rougeLsum_fmeasure_stderr": 0.0035051224294684953, "rougeLsum_precision": 0.13588775259570243, "rougeLsum_precision_stderr": 0.004070124124740705, "rougeLsum_recall": 0.32589646142393197, "rougeLsum_recall_stderr": 0.00476225821513649}}, "2": {"PALM_prompt": {"bleu": 0.757273969449508, "bleu_stderr": 0.03769718299942903, "rouge1_fmeasure": 0.1992600593877848, "rouge1_fmeasure_stderr": 0.004442827211921473, "rouge1_precision": 0.17014846386379712, "rouge1_precision_stderr": 0.005016859635763792, "rouge1_recall": 0.3720574802119457, "rouge1_recall_stderr": 0.005087288580346435, "rouge2_fmeasure": 0.10735692192992242, "rouge2_fmeasure_stderr": 0.0031248613937515605, "rouge2_precision": 0.093405478650147, "rouge2_precision_stderr": 0.003429330670409448, "rouge2_recall": 0.20155130751645584, "rouge2_recall_stderr": 0.003877577986701395, "rougeL_fmeasure": 0.17967063536334463, "rougeL_fmeasure_stderr": 0.0037755125066677945, "rougeL_precision": 0.15052700104482344, "rougeL_precision_stderr": 0.004245512272891528, "rougeL_recall": 0.34762630160096625, "rougeL_recall_stderr": 0.004661487852525495, "rougeLsum_fmeasure": 0.18371016924098071, "rougeLsum_fmeasure_stderr": 0.003909872256599441, "rougeLsum_precision": 0.15488064043942504, "rougeLsum_precision_stderr": 0.004417260662615026, "rougeLsum_recall": 0.3519715581663292, "rougeLsum_recall_stderr": 0.004717058539420343}}, "3": {"PALM_prompt": {"bleu": 0.9024397642343164, "bleu_stderr": 0.035266540176724565, "rouge1_fmeasure": 0.20870183213119045, "rouge1_fmeasure_stderr": 0.004631693380652351, "rouge1_precision": 0.18471036125735174, "rouge1_precision_stderr": 0.005489630293374035, "rouge1_recall": 0.3805012755165752, "rouge1_recall_stderr": 0.005005137236981478, "rouge2_fmeasure": 0.113583334725242, "rouge2_fmeasure_stderr": 0.0032948667404603697, "rouge2_precision": 0.10370590806508058, "rouge2_precision_stderr": 0.0038280983454674926, "rouge2_recall": 0.20616429942611994, "rouge2_recall_stderr": 0.0039581668291269155, "rougeL_fmeasure": 0.18586514274351795, "rougeL_fmeasure_stderr": 0.003929923209703445, "rougeL_precision": 0.16176274791316844, "rougeL_precision_stderr": 0.004674192944246113, "rougeL_recall": 0.3520949564821569, "rougeL_recall_stderr": 0.004572988282023115, "rougeLsum_fmeasure": 0.19140446908068304, "rougeLsum_fmeasure_stderr": 0.004100662443643837, "rougeLsum_precision": 0.16816634803526084, "rougeLsum_precision_stderr": 0.00493084866468226, "rougeLsum_recall": 0.357739744231517, "rougeLsum_recall_stderr": 0.00463949061581328}}, "4": {"PALM_prompt": {"bleu": 0.8974227422118427, "bleu_stderr": 0.047376194483330365, "rouge1_fmeasure": 0.2035351419399052, "rouge1_fmeasure_stderr": 0.004399997467418825, "rouge1_precision": 0.17906409643268184, "rouge1_precision_stderr": 0.005321848596589258, "rouge1_recall": 0.3858418753858739, "rouge1_recall_stderr": 0.004976197182937309, "rouge2_fmeasure": 0.11036497737370927, "rouge2_fmeasure_stderr": 0.0030546477915359676, "rouge2_precision": 0.1003122386275391, "rouge2_precision_stderr": 0.003687831966752624, "rouge2_recall": 0.2110778882420644, "rouge2_recall_stderr": 0.003910920096596726, "rougeL_fmeasure": 0.18161837654150934, "rougeL_fmeasure_stderr": 0.003698960847424029, "rougeL_precision": 0.15679117875129847, "rougeL_precision_stderr": 0.004526750041398485, "rougeL_recall": 0.3588874121532017, "rougeL_recall_stderr": 0.004562842692294942, "rougeLsum_fmeasure": 0.18754398782584164, "rougeLsum_fmeasure_stderr": 0.0039024864471833708, "rougeLsum_precision": 0.163680517550013, "rougeLsum_precision_stderr": 0.004816812827870111, "rougeLsum_recall": 0.36491240136204994, "rougeLsum_recall_stderr": 0.00462946723800189}}, "5": {"PALM_prompt": {"bleu": 0.9956165899729509, "bleu_stderr": 0.06673658339337885, "rouge1_fmeasure": 0.21468744079045568, "rouge1_fmeasure_stderr": 0.004643110254140134, "rouge1_precision": 0.19188269401158986, "rouge1_precision_stderr": 0.00561203563916576, "rouge1_recall": 0.39256506990146606, "rouge1_recall_stderr": 0.004988542684482551, "rouge2_fmeasure": 0.1189316600070313, "rouge2_fmeasure_stderr": 0.003337830869868033, "rouge2_precision": 0.11006706143823348, "rouge2_precision_stderr": 0.003975115552752216, "rouge2_recall": 0.215538485673218, "rouge2_recall_stderr": 0.004061715675646945, "rougeL_fmeasure": 0.1912081729138108, "rougeL_fmeasure_stderr": 0.003931938297787203, "rougeL_precision": 0.16804751696447837, "rougeL_precision_stderr": 0.0047820645272711555, "rougeL_recall": 0.36323858744544546, "rougeL_recall_stderr": 0.004545066248882408, "rougeLsum_fmeasure": 0.1976121117931978, "rougeLsum_fmeasure_stderr": 0.004144052510604372, "rougeLsum_precision": 0.17536219403574763, "rougeLsum_precision_stderr": 0.005062470330652636, "rougeLsum_recall": 0.36948279832750863, "rougeLsum_recall_stderr": 0.004621830630866901}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 2.6751795030941934, "bleu_stderr": 0.10893548185214819, "rouge1_fmeasure": 0.17757343542678158, "rouge1_fmeasure_stderr": 0.0023659515786921244, "rouge1_precision": 0.16302596168393382, "rouge1_precision_stderr": 0.0026043532904908915, "rouge1_recall": 0.23884218562608558, "rouge1_recall_stderr": 0.003209368863654021, "rouge2_fmeasure": 0.041694746971811296, "rouge2_fmeasure_stderr": 0.0010552371667732884, "rouge2_precision": 0.03851453154514113, "rouge2_precision_stderr": 0.0011266484541775893, "rouge2_recall": 0.056617587335353374, "rouge2_recall_stderr": 0.001543998959851649, "rougeL_fmeasure": 0.13591143366007433, "rougeL_fmeasure_stderr": 0.0017334271786663014, "rougeL_precision": 0.12429664959917734, "rougeL_precision_stderr": 0.0019956415846682173, "rougeL_recall": 0.18660082124096708, "rougeL_recall_stderr": 0.0025340157320301996, "rougeLsum_fmeasure": 0.1649398191999782, "rougeLsum_fmeasure_stderr": 0.002208373721898539, "rougeLsum_precision": 0.1517977249527908, "rougeLsum_precision_stderr": 0.0024675362929816253, "rougeLsum_recall": 0.22180300829509095, "rougeLsum_recall_stderr": 0.002994157511717411}}, "1": {"tldr_en": {"bleu": 3.1285629126141115, "bleu_stderr": 0.06699880010971354, "rouge1_fmeasure": 0.19523124968611608, "rouge1_fmeasure_stderr": 0.002480253844121557, "rouge1_precision": 0.2406880794108586, "rouge1_precision_stderr": 0.0037351249911156815, "rouge1_recall": 0.21982181393134473, "rouge1_recall_stderr": 0.0031180124535845686, "rouge2_fmeasure": 0.051619315527043796, "rouge2_fmeasure_stderr": 0.0013416387465087093, "rouge2_precision": 0.06928742384394211, "rouge2_precision_stderr": 0.002228375775026415, "rouge2_recall": 0.05748460591087991, "rouge2_recall_stderr": 0.001573745818264863, "rougeL_fmeasure": 0.14740312057857727, "rougeL_fmeasure_stderr": 0.0018928927367065792, "rougeL_precision": 0.18497537477327256, "rougeL_precision_stderr": 0.003068375414420716, "rougeL_recall": 0.16664127935774325, "rougeL_recall_stderr": 0.0024272789346368347, "rougeLsum_fmeasure": 0.18204704442754094, "rougeLsum_fmeasure_stderr": 0.0023120217528265125, "rougeLsum_precision": 0.22528107172837167, "rougeLsum_precision_stderr": 0.00354271806025313, "rougeLsum_recall": 0.20516272489807588, "rougeLsum_recall_stderr": 0.0029191134099530204}}, "2": {"tldr_en": {"bleu": 4.531754082860088, "bleu_stderr": 0.10399125331016994, "rouge1_fmeasure": 0.24644381498812512, "rouge1_fmeasure_stderr": 0.0023884398488959397, "rouge1_precision": 0.3216712594822311, "rouge1_precision_stderr": 0.003935243736119277, "rouge1_recall": 0.261665296778359, "rouge1_recall_stderr": 0.0029845016299826334, "rouge2_fmeasure": 0.07425118282868326, "rouge2_fmeasure_stderr": 0.0015088992630502053, "rouge2_precision": 0.10243345407249466, "rouge2_precision_stderr": 0.0024500886594184678, "rouge2_recall": 0.07778761705483665, "rouge2_recall_stderr": 0.0017154721932877938, "rougeL_fmeasure": 0.18849324888419672, "rougeL_fmeasure_stderr": 0.0019023219568813786, "rougeL_precision": 0.24910289495716958, "rougeL_precision_stderr": 0.0032748777420407017, "rougeL_recall": 0.20046863563167847, "rougeL_recall_stderr": 0.002394928982561243, "rougeLsum_fmeasure": 0.23177807338597264, "rougeLsum_fmeasure_stderr": 0.0022594764590097827, "rougeLsum_precision": 0.30394125045492665, "rougeLsum_precision_stderr": 0.003791358946164842, "rougeLsum_recall": 0.2458194192978099, "rougeLsum_recall_stderr": 0.002811326235952837}}, "3": {"tldr_en": {"bleu": 3.4831406879717304, "bleu_stderr": 0.08241007277658476, "rouge1_fmeasure": 0.21334837350330835, "rouge1_fmeasure_stderr": 0.002748797973981496, "rouge1_precision": 0.287116176382484, "rouge1_precision_stderr": 0.004235323245239033, "rouge1_recall": 0.2216906568387376, "rouge1_recall_stderr": 0.00329958857167838, "rouge2_fmeasure": 0.06412675156601927, "rouge2_fmeasure_stderr": 0.0014982170650911268, "rouge2_precision": 0.08924550212854968, "rouge2_precision_stderr": 0.0023703209930953256, "rouge2_recall": 0.06666258670328788, "rouge2_recall_stderr": 0.001735156074557458, "rougeL_fmeasure": 0.1644719047729543, "rougeL_fmeasure_stderr": 0.0021698660825835584, "rougeL_precision": 0.22414383280690792, "rougeL_precision_stderr": 0.0034753356031202724, "rougeL_recall": 0.17094750999928582, "rougeL_recall_stderr": 0.0026325465762072203, "rougeLsum_fmeasure": 0.20030924486918408, "rougeLsum_fmeasure_stderr": 0.0026045111310754924, "rougeLsum_precision": 0.2704956129845577, "rougeLsum_precision_stderr": 0.004046924536042148, "rougeLsum_recall": 0.2077672697550655, "rougeLsum_recall_stderr": 0.0031107519952077484}}, "4": {"tldr_en": {"bleu": 0.09773178719963505, "bleu_stderr": 0.014031569943916687, "rouge1_fmeasure": 0.06825353401138246, "rouge1_fmeasure_stderr": 0.002377481081988985, "rouge1_precision": 0.09291933511553724, "rouge1_precision_stderr": 0.0034098767152524823, "rouge1_recall": 0.07059094213022822, "rouge1_recall_stderr": 0.002630599874271742, "rouge2_fmeasure": 0.02075705154212734, "rouge2_fmeasure_stderr": 0.0010482697114407534, "rouge2_precision": 0.029453713051828943, "rouge2_precision_stderr": 0.0016387762462872308, "rouge2_recall": 0.02184092382029149, "rouge2_recall_stderr": 0.0012160027688287562, "rougeL_fmeasure": 0.05413179440242159, "rougeL_fmeasure_stderr": 0.001914789784806498, "rougeL_precision": 0.074717142063866, "rougeL_precision_stderr": 0.0028286174265664005, "rougeL_recall": 0.056043239754653675, "rougeL_recall_stderr": 0.002137136457979107, "rougeLsum_fmeasure": 0.06401934188873082, "rougeLsum_fmeasure_stderr": 0.0022379205013876623, "rougeLsum_precision": 0.08767290445104553, "rougeLsum_precision_stderr": 0.003252248886935673, "rougeLsum_recall": 0.06623420496000304, "rougeLsum_recall_stderr": 0.002480797937618585}}, "5": {"tldr_en": {"bleu": 1.3801513209266578e-13, "bleu_stderr": 2.393889428086806e-12, "rouge1_fmeasure": 0.011368084983385242, "rouge1_fmeasure_stderr": 0.0010834664835199614, "rouge1_precision": 0.016567144503697943, "rouge1_precision_stderr": 0.0016628318525338977, "rouge1_recall": 0.01145157830659587, "rouge1_recall_stderr": 0.0011413368815899247, "rouge2_fmeasure": 0.003623121828969715, "rouge2_fmeasure_stderr": 0.000459861976658157, "rouge2_precision": 0.006203627227708661, "rouge2_precision_stderr": 0.0009621763022467949, "rouge2_recall": 0.003527133124727982, "rouge2_recall_stderr": 0.000453501457574406, "rougeL_fmeasure": 0.0090559078219877, "rougeL_fmeasure_stderr": 0.0008783045884688659, "rougeL_precision": 0.013622903443858888, "rougeL_precision_stderr": 0.0014316929410095427, "rougeL_recall": 0.00908972561893824, "rougeL_recall_stderr": 0.0009163365660648137, "rougeLsum_fmeasure": 0.010828476106003168, "rougeLsum_fmeasure_stderr": 0.001037472898446894, "rougeLsum_precision": 0.01588208088477459, "rougeLsum_precision_stderr": 0.001612751389441228, "rougeLsum_recall": 0.010932406997099305, "rougeLsum_recall_stderr": 0.001099163638182611}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 4.937870822395004, "bleu_stderr": 0.10168092321343061, "rouge1_fmeasure": 0.23163264940481687, "rouge1_fmeasure_stderr": 0.00232732297796637, "rouge1_precision": 0.20931092444187419, "rouge1_precision_stderr": 0.002296933384885726, "rouge1_recall": 0.3041303529781163, "rouge1_recall_stderr": 0.00359054708432495, "rouge2_fmeasure": 0.0908781581806501, "rouge2_fmeasure_stderr": 0.0014152397116370878, "rouge2_precision": 0.07841825615094515, "rouge2_precision_stderr": 0.001456123316893818, "rouge2_recall": 0.12678550257947732, "rouge2_recall_stderr": 0.0021999792364059577, "rougeL_fmeasure": 0.19683944920316307, "rougeL_fmeasure_stderr": 0.0018406405928625433, "rougeL_precision": 0.1779176283587332, "rougeL_precision_stderr": 0.0018896632849821813, "rougeL_recall": 0.25918869249939613, "rougeL_recall_stderr": 0.0029674884139845297, "rougeLsum_fmeasure": 0.2077751987566816, "rougeLsum_fmeasure_stderr": 0.002238453785043258, "rougeLsum_precision": 0.1877127969718346, "rougeLsum_precision_stderr": 0.0021922315674800623, "rougeLsum_recall": 0.2734937412585103, "rougeLsum_recall_stderr": 0.0034380553186087663}}, "1": {"generate_text_restaurant": {"bleu": 12.35501585035212, "bleu_stderr": 0.18071372284843687, "rouge1_fmeasure": 0.4904048469507878, "rouge1_fmeasure_stderr": 0.00236029508784366, "rouge1_precision": 0.6159643956249627, "rouge1_precision_stderr": 0.0032510348220640543, "rouge1_recall": 0.44637313252793925, "rouge1_recall_stderr": 0.0030357503260269275, "rouge2_fmeasure": 0.23548323540578064, "rouge2_fmeasure_stderr": 0.002098999906999727, "rouge2_precision": 0.3020822279572484, "rouge2_precision_stderr": 0.002921577416330603, "rouge2_recall": 0.21352904674144402, "rouge2_recall_stderr": 0.0021849373079422542, "rougeL_fmeasure": 0.35771087777438293, "rougeL_fmeasure_stderr": 0.0021223257983437878, "rougeL_precision": 0.4540639031683146, "rougeL_precision_stderr": 0.0031541608471273223, "rougeL_recall": 0.3240708429452446, "rougeL_recall_stderr": 0.0024551718893166866, "rougeLsum_fmeasure": 0.4012496336411595, "rougeLsum_fmeasure_stderr": 0.0023624811787683396, "rougeLsum_precision": 0.506050260076472, "rougeLsum_precision_stderr": 0.00330906118971616, "rougeLsum_recall": 0.36451016514620255, "rougeLsum_recall_stderr": 0.002762896135883007}}, "2": {"generate_text_restaurant": {"bleu": 14.616889340275883, "bleu_stderr": 0.21143357607740182, "rouge1_fmeasure": 0.5168001246025699, "rouge1_fmeasure_stderr": 0.0022398323650930523, "rouge1_precision": 0.6206291956244673, "rouge1_precision_stderr": 0.0030975305933258674, "rouge1_recall": 0.47883869959728276, "rouge1_recall_stderr": 0.0029295710982191942, "rouge2_fmeasure": 0.25956862228055444, "rouge2_fmeasure_stderr": 0.0021439309777063396, "rouge2_precision": 0.31651307777573484, "rouge2_precision_stderr": 0.0028268105311273595, "rouge2_recall": 0.24021271727145022, "rouge2_recall_stderr": 0.002287708719504301, "rougeL_fmeasure": 0.3786193404650426, "rougeL_fmeasure_stderr": 0.002133418892476092, "rougeL_precision": 0.4575987425747188, "rougeL_precision_stderr": 0.003003444774161003, "rougeL_recall": 0.3495714749590036, "rougeL_recall_stderr": 0.002458484856725825, "rougeLsum_fmeasure": 0.43012681307330064, "rougeLsum_fmeasure_stderr": 0.002347788156588727, "rougeLsum_precision": 0.5176479425878214, "rougeLsum_precision_stderr": 0.003175094250090154, "rougeLsum_recall": 0.39788478108529884, "rougeLsum_recall_stderr": 0.0027583423936942022}}, "3": {"generate_text_restaurant": {"bleu": 15.60922413848781, "bleu_stderr": 0.22222075620514087, "rouge1_fmeasure": 0.5243455083909884, "rouge1_fmeasure_stderr": 0.0022677120618699695, "rouge1_precision": 0.6213477308543962, "rouge1_precision_stderr": 0.003127511727417513, "rouge1_recall": 0.48791956313887175, "rouge1_recall_stderr": 0.0028969581884825545, "rouge2_fmeasure": 0.26797191344908083, "rouge2_fmeasure_stderr": 0.0022492971355441097, "rouge2_precision": 0.3211891017766391, "rouge2_precision_stderr": 0.0028592971157519907, "rouge2_recall": 0.24915681113277957, "rouge2_recall_stderr": 0.0023874630155306096, "rougeL_fmeasure": 0.3864420062211574, "rougeL_fmeasure_stderr": 0.0022008161713602944, "rougeL_precision": 0.4595759214605003, "rougeL_precision_stderr": 0.0029916740792618303, "rougeL_recall": 0.3587558615108837, "rougeL_recall_stderr": 0.002498895208664132, "rougeLsum_fmeasure": 0.4383204560402971, "rougeLsum_fmeasure_stderr": 0.002404771234214407, "rougeLsum_precision": 0.5195127110383976, "rougeLsum_precision_stderr": 0.003174890164534984, "rougeLsum_recall": 0.4075244452419279, "rougeLsum_recall_stderr": 0.0027745483399863975}}, "4": {"generate_text_restaurant": {"bleu": 16.011962277678624, "bleu_stderr": 0.22022432943978618, "rouge1_fmeasure": 0.5293198872823365, "rouge1_fmeasure_stderr": 0.0022241855653776944, "rouge1_precision": 0.6211926185877573, "rouge1_precision_stderr": 0.0031252626999772404, "rouge1_recall": 0.4940540671864064, "rouge1_recall_stderr": 0.002811103415975642, "rouge2_fmeasure": 0.27145115399075137, "rouge2_fmeasure_stderr": 0.0022625881987756264, "rouge2_precision": 0.3222299861299632, "rouge2_precision_stderr": 0.002870261163061151, "rouge2_recall": 0.2531196441399145, "rouge2_recall_stderr": 0.002391669204538802, "rougeL_fmeasure": 0.3888843450358488, "rougeL_fmeasure_stderr": 0.0021625481352715572, "rougeL_precision": 0.45749565793505115, "rougeL_precision_stderr": 0.0029239955822613823, "rougeL_recall": 0.3627340059318637, "rougeL_recall_stderr": 0.002475018808839022, "rougeLsum_fmeasure": 0.44303614042086686, "rougeLsum_fmeasure_stderr": 0.002385503362679958, "rougeLsum_precision": 0.5200621000842451, "rougeLsum_precision_stderr": 0.0031757322838288802, "rougeLsum_recall": 0.41347570677906165, "rougeLsum_recall_stderr": 0.0027471428706990248}}, "5": {"generate_text_restaurant": {"bleu": 15.965511431425572, "bleu_stderr": 0.22939254022077785, "rouge1_fmeasure": 0.5304583895558246, "rouge1_fmeasure_stderr": 0.0021896809157722313, "rouge1_precision": 0.620032184682295, "rouge1_precision_stderr": 0.0030854508497314163, "rouge1_recall": 0.494070023316965, "rouge1_recall_stderr": 0.002713528076964048, "rouge2_fmeasure": 0.27194008850636997, "rouge2_fmeasure_stderr": 0.0022394498653639954, "rouge2_precision": 0.3214733690798853, "rouge2_precision_stderr": 0.00283742331030653, "rouge2_recall": 0.2529051360673717, "rouge2_recall_stderr": 0.002334810498609401, "rougeL_fmeasure": 0.39202171201975483, "rougeL_fmeasure_stderr": 0.002176343782453659, "rougeL_precision": 0.4584037931267516, "rougeL_precision_stderr": 0.0028990356337931017, "rougeL_recall": 0.3653287151283581, "rougeL_recall_stderr": 0.0024531687545858334, "rougeLsum_fmeasure": 0.44473199160123383, "rougeLsum_fmeasure_stderr": 0.002391683545192119, "rougeLsum_precision": 0.519612504788164, "rougeLsum_precision_stderr": 0.00315462337627905, "rougeLsum_recall": 0.41429471727641565, "rougeLsum_recall_stderr": 0.0027037586488582216}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.6058786904736198, "bleu_stderr": 0.12459015370719587, "rouge1_fmeasure": 0.15975132761730468, "rouge1_fmeasure_stderr": 0.002826489462693867, "rouge1_precision": 0.12368904495741256, "rouge1_precision_stderr": 0.0023171132221842185, "rouge1_recall": 0.2438396047903194, "rouge1_recall_stderr": 0.004587337646816985, "rouge2_fmeasure": 0.03780530734116865, "rouge2_fmeasure_stderr": 0.0015708073244538232, "rouge2_precision": 0.0293373865185686, "rouge2_precision_stderr": 0.0014387609508787426, "rouge2_recall": 0.059007813076984654, "rouge2_recall_stderr": 0.002488834124286237, "rougeL_fmeasure": 0.1253754650359875, "rougeL_fmeasure_stderr": 0.0022280153555414655, "rougeL_precision": 0.09746637369343818, "rougeL_precision_stderr": 0.0019134317711632482, "rougeL_recall": 0.19151135265895355, "rougeL_recall_stderr": 0.0036632482380794923, "rougeLsum_fmeasure": 0.12959185604651055, "rougeLsum_fmeasure_stderr": 0.0023778146868072415, "rougeLsum_precision": 0.10069499239897962, "rougeLsum_precision_stderr": 0.0020159231592045846, "rougeLsum_recall": 0.1978160998586425, "rougeLsum_recall_stderr": 0.0038698495290395056}}, "1": {"article_DOC_summary": {"bleu": 3.334247171090826, "bleu_stderr": 0.2305716078197547, "rouge1_fmeasure": 0.24541064788227074, "rouge1_fmeasure_stderr": 0.00354063506526513, "rouge1_precision": 0.26085076234423055, "rouge1_precision_stderr": 0.004393846973206814, "rouge1_recall": 0.2588441515496624, "rouge1_recall_stderr": 0.004005532773557462, "rouge2_fmeasure": 0.06173760904490974, "rouge2_fmeasure_stderr": 0.0024871664924425037, "rouge2_precision": 0.06771998895758684, "rouge2_precision_stderr": 0.0029066254436555103, "rouge2_recall": 0.06386750564126997, "rouge2_recall_stderr": 0.0025929413613500775, "rougeL_fmeasure": 0.1858021335070401, "rougeL_fmeasure_stderr": 0.0030629589623779076, "rougeL_precision": 0.19864675058790465, "rougeL_precision_stderr": 0.0038209500782218518, "rougeL_recall": 0.195308999787071, "rougeL_recall_stderr": 0.003336163469767863, "rougeLsum_fmeasure": 0.1886174336524096, "rougeLsum_fmeasure_stderr": 0.0030767918248420633, "rougeLsum_precision": 0.20095708193235132, "rougeLsum_precision_stderr": 0.003807825279077122, "rougeLsum_recall": 0.19950787449175908, "rougeLsum_recall_stderr": 0.003471150084006834}}, "2": {"article_DOC_summary": {"bleu": 4.010733459515201, "bleu_stderr": 0.2220017911148554, "rouge1_fmeasure": 0.2606004147942292, "rouge1_fmeasure_stderr": 0.0036081748480290554, "rouge1_precision": 0.2808527202175755, "rouge1_precision_stderr": 0.004370590224070957, "rouge1_recall": 0.2617722819644407, "rouge1_recall_stderr": 0.0037984638757868477, "rouge2_fmeasure": 0.06820161970089914, "rouge2_fmeasure_stderr": 0.0026142084398696414, "rouge2_precision": 0.07481799220647589, "rouge2_precision_stderr": 0.0029899592615070703, "rouge2_recall": 0.06787325129121033, "rouge2_recall_stderr": 0.002638855585594665, "rougeL_fmeasure": 0.19811259443180443, "rougeL_fmeasure_stderr": 0.0031149589842912988, "rougeL_precision": 0.21454050742109196, "rougeL_precision_stderr": 0.003805704528997883, "rougeL_recall": 0.1984559915116539, "rougeL_recall_stderr": 0.0032005701409087216, "rougeLsum_fmeasure": 0.20052042410087703, "rougeLsum_fmeasure_stderr": 0.0031381403706602514, "rougeLsum_precision": 0.21670491964360883, "rougeLsum_precision_stderr": 0.003811777174543378, "rougeLsum_recall": 0.20151490472824285, "rougeLsum_recall_stderr": 0.003270439631264535}}, "3": {"article_DOC_summary": {"bleu": 3.7017664823306986, "bleu_stderr": 0.1507032164624935, "rouge1_fmeasure": 0.24743596030850362, "rouge1_fmeasure_stderr": 0.004130655017151295, "rouge1_precision": 0.2706443419590105, "rouge1_precision_stderr": 0.0049303309520587315, "rouge1_recall": 0.24624474324774795, "rouge1_recall_stderr": 0.004229600775260044, "rouge2_fmeasure": 0.06650858602975873, "rouge2_fmeasure_stderr": 0.0026299416495125026, "rouge2_precision": 0.07386755593801608, "rouge2_precision_stderr": 0.0030555237045533316, "rouge2_recall": 0.06557314117702792, "rouge2_recall_stderr": 0.0025890340219220658, "rougeL_fmeasure": 0.18796867977199047, "rougeL_fmeasure_stderr": 0.003455324216798634, "rougeL_precision": 0.2064337208871898, "rougeL_precision_stderr": 0.004127041768838929, "rougeL_recall": 0.18681632649605892, "rougeL_recall_stderr": 0.003495395945435518, "rougeLsum_fmeasure": 0.18918373638634367, "rougeLsum_fmeasure_stderr": 0.003460104310580898, "rougeLsum_precision": 0.20758116522144787, "rougeLsum_precision_stderr": 0.004120539971998013, "rougeLsum_recall": 0.1882278840684571, "rougeLsum_recall_stderr": 0.003517686123465377}}, "4": {"article_DOC_summary": {"bleu": 0.07887552808866259, "bleu_stderr": 0.030341131889656193, "rouge1_fmeasure": 0.057815204376418204, "rouge1_fmeasure_stderr": 0.003618997876338674, "rouge1_precision": 0.06554749748154207, "rouge1_precision_stderr": 0.004219087280136839, "rouge1_recall": 0.05641814843809397, "rouge1_recall_stderr": 0.003592807957006194, "rouge2_fmeasure": 0.01551850102381909, "rouge2_fmeasure_stderr": 0.0014448306541374053, "rouge2_precision": 0.01829578378881792, "rouge2_precision_stderr": 0.0017753435247383593, "rouge2_recall": 0.014766188974362899, "rouge2_recall_stderr": 0.0013861010727158796, "rougeL_fmeasure": 0.04356445159603049, "rougeL_fmeasure_stderr": 0.0027962345799032616, "rougeL_precision": 0.049847079919462155, "rougeL_precision_stderr": 0.003313380982244201, "rougeL_recall": 0.04239818149428434, "rougeL_recall_stderr": 0.002766706142036047, "rougeLsum_fmeasure": 0.043963760214834266, "rougeLsum_fmeasure_stderr": 0.002813226760349887, "rougeLsum_precision": 0.05028688975410892, "rougeLsum_precision_stderr": 0.0033308048953447043, "rougeLsum_recall": 0.042898501891038276, "rougeLsum_recall_stderr": 0.0028053186516026145}}, "5": {"article_DOC_summary": {"bleu": 3.850151141374283e-51, "bleu_stderr": 9.847373987416963e-37, "rouge1_fmeasure": 0.0017894336969871943, "rouge1_fmeasure_stderr": 0.0006514343833614674, "rouge1_precision": 0.0017127173298628544, "rouge1_precision_stderr": 0.0006359662396544354, "rouge1_recall": 0.0019529368678346303, "rouge1_recall_stderr": 0.0006970359035754604, "rouge2_fmeasure": 0.00022244323459347703, "rouge2_fmeasure_stderr": 0.00010310824874009924, "rouge2_precision": 0.00021661695663762333, "rouge2_precision_stderr": 0.00010194690557663026, "rouge2_recall": 0.00023546341891455505, "rouge2_recall_stderr": 0.00010683333498514203, "rougeL_fmeasure": 0.0011544890871405323, "rougeL_fmeasure_stderr": 0.0004317370833710289, "rougeL_precision": 0.0011066908441476557, "rougeL_precision_stderr": 0.00042211801917848034, "rougeL_recall": 0.001255464636408485, "rougeL_recall_stderr": 0.0004593501480469735, "rougeLsum_fmeasure": 0.0011764796751688564, "rougeLsum_fmeasure_stderr": 0.00043780922937178545, "rougeLsum_precision": 0.00112287259760246, "rougeLsum_precision_stderr": 0.00042548262790938034, "rougeLsum_recall": 0.0012897699537326702, "rougeLsum_recall_stderr": 0.00047316395112219063}}}}