{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.2871925225988394, "bleu_stderr": 0.02880794237734816, "rouge1_fmeasure": 0.10707093959955763, "rouge1_fmeasure_stderr": 0.0019099253416430774, "rouge1_precision": 0.07031750338322859, "rouge1_precision_stderr": 0.0015362201736309874, "rouge1_recall": 0.3012155634284117, "rouge1_recall_stderr": 0.004546846231718025, "rouge2_fmeasure": 0.049917192299013896, "rouge2_fmeasure_stderr": 0.0012014538250113653, "rouge2_precision": 0.03252619427180376, "rouge2_precision_stderr": 0.0009041180535715348, "rouge2_recall": 0.14439430798437106, "rouge2_recall_stderr": 0.0030595449553106713, "rougeL_fmeasure": 0.10327080072990603, "rougeL_fmeasure_stderr": 0.0017814345648663893, "rougeL_precision": 0.06757287768017098, "rougeL_precision_stderr": 0.001414062975537199, "rougeL_recall": 0.2931917692240097, "rougeL_recall_stderr": 0.0044525581749204875, "rougeLsum_fmeasure": 0.10238598559666155, "rougeLsum_fmeasure_stderr": 0.001793711398293261, "rougeLsum_precision": 0.06720725044881726, "rougeLsum_precision_stderr": 0.0014407633141713585, "rougeLsum_recall": 0.2882066628071488, "rougeLsum_recall_stderr": 0.0042625595600572705}}, "1": {"PALM_prompt": {"bleu": 0.4674006237665374, "bleu_stderr": 0.03675015156688127, "rouge1_fmeasure": 0.11843411039548267, "rouge1_fmeasure_stderr": 0.001895876971489225, "rouge1_precision": 0.07708396436923028, "rouge1_precision_stderr": 0.001529013971135644, "rouge1_recall": 0.36235242098066, "rouge1_recall_stderr": 0.00504305962540817, "rouge2_fmeasure": 0.05553061893758205, "rouge2_fmeasure_stderr": 0.0012200850248834274, "rouge2_precision": 0.035725346847754684, "rouge2_precision_stderr": 0.0008827277116185362, "rouge2_recall": 0.17866943863024684, "rouge2_recall_stderr": 0.003599106083841207, "rougeL_fmeasure": 0.11228525846628372, "rougeL_fmeasure_stderr": 0.0017420331023114827, "rougeL_precision": 0.07294152863590639, "rougeL_precision_stderr": 0.0014064426998360536, "rougeL_recall": 0.3437168036630356, "rougeL_recall_stderr": 0.004711682138202734, "rougeLsum_fmeasure": 0.11267135213673385, "rougeLsum_fmeasure_stderr": 0.0017806522868172628, "rougeLsum_precision": 0.07337404630465882, "rougeLsum_precision_stderr": 0.0014496612765965426, "rougeLsum_recall": 0.3436003452114997, "rougeLsum_recall_stderr": 0.004616609203187745}}, "2": {"PALM_prompt": {"bleu": 0.5250778439407279, "bleu_stderr": 0.025625496064299234, "rouge1_fmeasure": 0.1222441134481138, "rouge1_fmeasure_stderr": 0.0019020155784340502, "rouge1_precision": 0.0786831611862841, "rouge1_precision_stderr": 0.0014969718758498687, "rouge1_recall": 0.3956998500897082, "rouge1_recall_stderr": 0.005131459404981971, "rouge2_fmeasure": 0.057331612844470456, "rouge2_fmeasure_stderr": 0.001226447389142751, "rouge2_precision": 0.03682232020364324, "rouge2_precision_stderr": 0.0009265440871287532, "rouge2_recall": 0.19779728011829195, "rouge2_recall_stderr": 0.0038163400420330356, "rougeL_fmeasure": 0.11353522248821303, "rougeL_fmeasure_stderr": 0.001703018837429438, "rougeL_precision": 0.07302274174131225, "rougeL_precision_stderr": 0.001338647584797816, "rougeL_recall": 0.36618568072469376, "rougeL_recall_stderr": 0.004622159858156629, "rougeLsum_fmeasure": 0.11628410210009521, "rougeLsum_fmeasure_stderr": 0.0017922853862293046, "rougeLsum_precision": 0.07488527729009754, "rougeLsum_precision_stderr": 0.001411146414679001, "rougeLsum_recall": 0.3754608054763451, "rougeLsum_recall_stderr": 0.004798151749531035}}, "3": {"PALM_prompt": {"bleu": 0.6240971401779115, "bleu_stderr": 0.03840020245332954, "rouge1_fmeasure": 0.12413425365513392, "rouge1_fmeasure_stderr": 0.0018801730074252724, "rouge1_precision": 0.07946921950052364, "rouge1_precision_stderr": 0.0015734983149428565, "rouge1_recall": 0.41443709705557313, "rouge1_recall_stderr": 0.0052063482293464285, "rouge2_fmeasure": 0.05836966723015618, "rouge2_fmeasure_stderr": 0.0012404189838209753, "rouge2_precision": 0.03727374629297188, "rouge2_precision_stderr": 0.0010068745541143666, "rouge2_recall": 0.20933728572588564, "rouge2_recall_stderr": 0.0039729036741121115, "rougeL_fmeasure": 0.11463438747216832, "rougeL_fmeasure_stderr": 0.0016925693943895671, "rougeL_precision": 0.07340984582992345, "rougeL_precision_stderr": 0.0014110667213403662, "rougeL_recall": 0.3803567082991153, "rougeL_recall_stderr": 0.004624202286888448, "rougeLsum_fmeasure": 0.11802649327609507, "rougeLsum_fmeasure_stderr": 0.0017907209912884955, "rougeLsum_precision": 0.07570628299965847, "rougeLsum_precision_stderr": 0.0015124490142500056, "rougeLsum_recall": 0.39213432148715394, "rougeLsum_recall_stderr": 0.004828378800565317}}, "4": {"PALM_prompt": {"bleu": 0.6460958847523566, "bleu_stderr": 0.03922360003785139, "rouge1_fmeasure": 0.12269659017119199, "rouge1_fmeasure_stderr": 0.0017597424238451932, "rouge1_precision": 0.07760008602513783, "rouge1_precision_stderr": 0.001320690166501572, "rouge1_recall": 0.4207626130570328, "rouge1_recall_stderr": 0.0051343858175420766, "rouge2_fmeasure": 0.0577700863367864, "rouge2_fmeasure_stderr": 0.001158809400479912, "rouge2_precision": 0.03635274690781486, "rouge2_precision_stderr": 0.0008330185169416092, "rouge2_recall": 0.2129557453468375, "rouge2_recall_stderr": 0.003851289229933982, "rougeL_fmeasure": 0.11231459598044416, "rougeL_fmeasure_stderr": 0.0015694568258752962, "rougeL_precision": 0.07107029230772488, "rougeL_precision_stderr": 0.001171387599016451, "rougeL_recall": 0.38200909854824977, "rougeL_recall_stderr": 0.004464667845112728, "rougeLsum_fmeasure": 0.11625392090888889, "rougeLsum_fmeasure_stderr": 0.0016649015391818642, "rougeLsum_precision": 0.07356474812940257, "rougeLsum_precision_stderr": 0.0012438027129333135, "rougeLsum_recall": 0.39729543398826606, "rougeLsum_recall_stderr": 0.004755911479219925}}, "5": {"PALM_prompt": {"bleu": 0.7283147266727299, "bleu_stderr": 0.03506630990313516, "rouge1_fmeasure": 0.12670702220068714, "rouge1_fmeasure_stderr": 0.0018353031821599214, "rouge1_precision": 0.0800529618846568, "rouge1_precision_stderr": 0.0014030415087213262, "rouge1_recall": 0.4360056147654019, "rouge1_recall_stderr": 0.005237161872126708, "rouge2_fmeasure": 0.05951196634046783, "rouge2_fmeasure_stderr": 0.0011799130523628795, "rouge2_precision": 0.037349148159645094, "rouge2_precision_stderr": 0.000853308549188945, "rouge2_recall": 0.2217598521275178, "rouge2_recall_stderr": 0.003994885901439153, "rougeL_fmeasure": 0.11485528722019342, "rougeL_fmeasure_stderr": 0.001589365738462336, "rougeL_precision": 0.07255538123365188, "rougeL_precision_stderr": 0.0012004887370386942, "rougeL_recall": 0.39357574348180674, "rougeL_recall_stderr": 0.004547413362244599, "rougeLsum_fmeasure": 0.11989099231027077, "rougeLsum_fmeasure_stderr": 0.0017190774588667075, "rougeLsum_precision": 0.07578798351325475, "rougeLsum_precision_stderr": 0.0012955589973183616, "rougeLsum_recall": 0.4104972172441367, "rougeLsum_recall_stderr": 0.0048123434799543785}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.6192080325529026, "bleu_stderr": 0.04050520870343064, "rouge1_fmeasure": 0.17809655126532312, "rouge1_fmeasure_stderr": 0.0018236388559653763, "rouge1_precision": 0.15222794945796614, "rouge1_precision_stderr": 0.001854391491208858, "rouge1_recall": 0.259279440153063, "rouge1_recall_stderr": 0.0027052349535794085, "rouge2_fmeasure": 0.03601951697280678, "rouge2_fmeasure_stderr": 0.0008300101222283796, "rouge2_precision": 0.030497998250497895, "rouge2_precision_stderr": 0.0007413435249853986, "rouge2_recall": 0.05425261740808977, "rouge2_recall_stderr": 0.001399269212332445, "rougeL_fmeasure": 0.1384741786574652, "rougeL_fmeasure_stderr": 0.0012894950527783321, "rougeL_precision": 0.11697977840134756, "rougeL_precision_stderr": 0.0012794261124303204, "rougeL_recall": 0.2062333696623697, "rougeL_recall_stderr": 0.0021597198817625285, "rougeLsum_fmeasure": 0.1628530750095549, "rougeLsum_fmeasure_stderr": 0.0016530415994811475, "rougeLsum_precision": 0.1389877568936686, "rougeLsum_precision_stderr": 0.0016763555392295747, "rougeLsum_recall": 0.23808538118300834, "rougeLsum_recall_stderr": 0.0025032807703488534}}, "1": {"tldr_en": {"bleu": 2.545643626821724, "bleu_stderr": 0.048869510836124584, "rouge1_fmeasure": 0.20484942755932814, "rouge1_fmeasure_stderr": 0.001960405666708866, "rouge1_precision": 0.17909391212556103, "rouge1_precision_stderr": 0.0021684904700656395, "rouge1_recall": 0.2986428547454232, "rouge1_recall_stderr": 0.002901154619840759, "rouge2_fmeasure": 0.04757609861819433, "rouge2_fmeasure_stderr": 0.0009961877982725383, "rouge2_precision": 0.04098672752953724, "rouge2_precision_stderr": 0.0009402949935154375, "rouge2_recall": 0.07250823843480829, "rouge2_recall_stderr": 0.00171407343966866, "rougeL_fmeasure": 0.14525233898326748, "rougeL_fmeasure_stderr": 0.001303267897245817, "rougeL_precision": 0.12586154047693615, "rougeL_precision_stderr": 0.001447455908294373, "rougeL_recall": 0.21783174447787615, "rougeL_recall_stderr": 0.002284390945146576, "rougeLsum_fmeasure": 0.19265194446101522, "rougeLsum_fmeasure_stderr": 0.0018360173432108782, "rougeLsum_precision": 0.16826083836269604, "rougeLsum_precision_stderr": 0.0020324268022024173, "rougeLsum_recall": 0.28157870760475356, "rougeLsum_recall_stderr": 0.002752878166728396}}, "2": {"tldr_en": {"bleu": 3.123719853905042, "bleu_stderr": 0.09435758546693512, "rouge1_fmeasure": 0.21836409386191818, "rouge1_fmeasure_stderr": 0.001989518194370473, "rouge1_precision": 0.2332474242904849, "rouge1_precision_stderr": 0.0031768172038711467, "rouge1_recall": 0.29410268890498986, "rouge1_recall_stderr": 0.002958828414438297, "rouge2_fmeasure": 0.05650249608530642, "rouge2_fmeasure_stderr": 0.0011487340298214372, "rouge2_precision": 0.06566711930000235, "rouge2_precision_stderr": 0.0019413943466877388, "rouge2_recall": 0.07670871046547496, "rouge2_recall_stderr": 0.0016787739182338268, "rougeL_fmeasure": 0.1603606067900483, "rougeL_fmeasure_stderr": 0.0014157142739287894, "rougeL_precision": 0.1752085713341631, "rougeL_precision_stderr": 0.0026584779502129303, "rougeL_recall": 0.21819240455646285, "rougeL_recall_stderr": 0.002276168106614223, "rougeLsum_fmeasure": 0.20617794726883687, "rougeLsum_fmeasure_stderr": 0.0018867289872942854, "rougeLsum_precision": 0.22112816157170134, "rougeLsum_precision_stderr": 0.0030769042746772593, "rougeLsum_recall": 0.2776979400072693, "rougeLsum_recall_stderr": 0.002813335835445409}}, "3": {"tldr_en": {"bleu": 3.5006949715383118, "bleu_stderr": 0.08071997944617754, "rouge1_fmeasure": 0.1819863863181494, "rouge1_fmeasure_stderr": 0.0024282963824572346, "rouge1_precision": 0.22344987630747953, "rouge1_precision_stderr": 0.0038946320752308397, "rouge1_recall": 0.228687908011972, "rouge1_recall_stderr": 0.0033634865916312945, "rouge2_fmeasure": 0.05005886014366939, "rouge2_fmeasure_stderr": 0.0012507484027525577, "rouge2_precision": 0.06821362116644611, "rouge2_precision_stderr": 0.0023091245896002433, "rouge2_recall": 0.06243742554002245, "rouge2_recall_stderr": 0.001665626169617889, "rougeL_fmeasure": 0.13680266609806765, "rougeL_fmeasure_stderr": 0.001821525871477116, "rougeL_precision": 0.17380086539073145, "rougeL_precision_stderr": 0.003294779021368952, "rougeL_recall": 0.1728818390227638, "rougeL_recall_stderr": 0.0026287282834976822, "rougeLsum_fmeasure": 0.17195845477450572, "rougeLsum_fmeasure_stderr": 0.0023005495305984053, "rougeLsum_precision": 0.21200019749157653, "rougeLsum_precision_stderr": 0.003735810714751958, "rougeLsum_recall": 0.21587781354640423, "rougeLsum_recall_stderr": 0.003186682013692883}}, "4": {"tldr_en": {"bleu": 0.4203638205606742, "bleu_stderr": 0.04062156232814086, "rouge1_fmeasure": 0.05800966504497334, "rouge1_fmeasure_stderr": 0.002055695120200674, "rouge1_precision": 0.06907034391802865, "rouge1_precision_stderr": 0.002842925157819051, "rouge1_recall": 0.07641790711530233, "rouge1_recall_stderr": 0.0028071608967584296, "rouge2_fmeasure": 0.015594437236270214, "rouge2_fmeasure_stderr": 0.0008033551932234715, "rouge2_precision": 0.020323118606363738, "rouge2_precision_stderr": 0.0013765538659170954, "rouge2_recall": 0.020689214217856734, "rouge2_recall_stderr": 0.0011098261782535187, "rougeL_fmeasure": 0.04363217232305618, "rougeL_fmeasure_stderr": 0.0015475509311173715, "rougeL_precision": 0.05326819078634553, "rougeL_precision_stderr": 0.002300594360643888, "rougeL_recall": 0.05823666899257084, "rougeL_recall_stderr": 0.0021806250615139192, "rougeLsum_fmeasure": 0.05441077080277394, "rougeLsum_fmeasure_stderr": 0.0019346325978603714, "rougeLsum_precision": 0.06512227133445396, "rougeLsum_precision_stderr": 0.002711627122094951, "rougeLsum_recall": 0.07184593801381658, "rougeLsum_recall_stderr": 0.0026558284841563095}}, "5": {"tldr_en": {"bleu": 1.610620675193976e-08, "bleu_stderr": 6.336079313722214e-08, "rouge1_fmeasure": 0.008814606254748622, "rouge1_fmeasure_stderr": 0.0008820141996097188, "rouge1_precision": 0.011141473368752484, "rouge1_precision_stderr": 0.0012984382630292146, "rouge1_recall": 0.011356368661606248, "rouge1_recall_stderr": 0.001166446625113568, "rouge2_fmeasure": 0.0024833328621297794, "rouge2_fmeasure_stderr": 0.0003381158590391299, "rouge2_precision": 0.0036979579695363266, "rouge2_precision_stderr": 0.00069734856115032, "rouge2_recall": 0.0030116660387216835, "rouge2_recall_stderr": 0.00039145176963269976, "rougeL_fmeasure": 0.0067361341505456805, "rougeL_fmeasure_stderr": 0.0006778741138953477, "rougeL_precision": 0.008749076310088717, "rougeL_precision_stderr": 0.0010822814361618575, "rougeL_recall": 0.008702418570223684, "rougeL_recall_stderr": 0.0008937526565969341, "rougeLsum_fmeasure": 0.008282398875850052, "rougeLsum_fmeasure_stderr": 0.0008304343325046589, "rougeLsum_precision": 0.010561687151292019, "rougeLsum_precision_stderr": 0.0012526496630397305, "rougeLsum_recall": 0.010693942253000091, "rougeLsum_recall_stderr": 0.001098581608402249}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.8175837539659996, "bleu_stderr": 0.06903661804515053, "rouge1_fmeasure": 0.07913875454413057, "rouge1_fmeasure_stderr": 0.0015242869094641899, "rouge1_precision": 0.067410137720777, "rouge1_precision_stderr": 0.0015267778764287776, "rouge1_recall": 0.11905569111444682, "rouge1_recall_stderr": 0.002272837057404917, "rouge2_fmeasure": 0.010022915068112901, "rouge2_fmeasure_stderr": 0.0005999619167956302, "rouge2_precision": 0.00855571479752271, "rouge2_precision_stderr": 0.000610070681102783, "rouge2_recall": 0.01452701665726237, "rouge2_recall_stderr": 0.0008619364610158222, "rougeL_fmeasure": 0.07774011765647057, "rougeL_fmeasure_stderr": 0.0014739968390031794, "rougeL_precision": 0.06588530481318243, "rougeL_precision_stderr": 0.001456682483397516, "rougeL_recall": 0.11730596366118605, "rougeL_recall_stderr": 0.0022143035280371703, "rougeLsum_fmeasure": 0.06060524038626222, "rougeLsum_fmeasure_stderr": 0.0012344605903209444, "rougeLsum_precision": 0.053281568752607505, "rougeLsum_precision_stderr": 0.0013584259494467741, "rougeLsum_recall": 0.0896663423829268, "rougeLsum_recall_stderr": 0.0017758029746831937}}, "1": {"generate_text_restaurant": {"bleu": 11.360023014480657, "bleu_stderr": 0.14523312599938573, "rouge1_fmeasure": 0.4457059970163705, "rouge1_fmeasure_stderr": 0.0023475038584115206, "rouge1_precision": 0.5368002507342822, "rouge1_precision_stderr": 0.003197714150333534, "rouge1_recall": 0.4204347436029918, "rouge1_recall_stderr": 0.0029932330301144583, "rouge2_fmeasure": 0.20489136085595536, "rouge2_fmeasure_stderr": 0.0019458972766888125, "rouge2_precision": 0.25010730577128015, "rouge2_precision_stderr": 0.0025416736419787912, "rouge2_recall": 0.19320140085672308, "rouge2_recall_stderr": 0.0021059841419488645, "rougeL_fmeasure": 0.321161092281206, "rougeL_fmeasure_stderr": 0.001995161634007105, "rougeL_precision": 0.390181985500488, "rougeL_precision_stderr": 0.002842772643373759, "rougeL_recall": 0.30202346410754144, "rougeL_recall_stderr": 0.002382966736707436, "rougeLsum_fmeasure": 0.3629740875330838, "rougeLsum_fmeasure_stderr": 0.00225666081685001, "rougeLsum_precision": 0.4390382418075218, "rougeLsum_precision_stderr": 0.003082038398447118, "rougeLsum_recall": 0.34172069570320107, "rougeLsum_recall_stderr": 0.0026874775375555484}}, "2": {"generate_text_restaurant": {"bleu": 13.284050272128148, "bleu_stderr": 0.1770460818661209, "rouge1_fmeasure": 0.47571760194079554, "rouge1_fmeasure_stderr": 0.002265550724177173, "rouge1_precision": 0.5714641277328295, "rouge1_precision_stderr": 0.0032799480051059426, "rouge1_recall": 0.4468451656698964, "rouge1_recall_stderr": 0.0029010255062063995, "rouge2_fmeasure": 0.2325284196471626, "rouge2_fmeasure_stderr": 0.0020182406639818696, "rouge2_precision": 0.28407643182119585, "rouge2_precision_stderr": 0.002743346128512875, "rouge2_recall": 0.21834852344926514, "rouge2_recall_stderr": 0.0021773726271045162, "rougeL_fmeasure": 0.3475057918065784, "rougeL_fmeasure_stderr": 0.0020325138450125527, "rougeL_precision": 0.4201198181536731, "rougeL_precision_stderr": 0.002974299270315645, "rougeL_recall": 0.32583054256145155, "rougeL_recall_stderr": 0.002409815129643757, "rougeLsum_fmeasure": 0.391612619922272, "rougeLsum_fmeasure_stderr": 0.002268675240750965, "rougeLsum_precision": 0.4715445246123803, "rougeLsum_precision_stderr": 0.0031935178217488633, "rougeLsum_recall": 0.36737757013379746, "rougeLsum_recall_stderr": 0.002675859339354407}}, "3": {"generate_text_restaurant": {"bleu": 14.26351682307982, "bleu_stderr": 0.16518466746497154, "rouge1_fmeasure": 0.4869136869814224, "rouge1_fmeasure_stderr": 0.002252377471622215, "rouge1_precision": 0.5781766953393467, "rouge1_precision_stderr": 0.003232493897043414, "rouge1_recall": 0.45846733751843627, "rouge1_recall_stderr": 0.002862839752183954, "rouge2_fmeasure": 0.24388713793667496, "rouge2_fmeasure_stderr": 0.002081168246828599, "rouge2_precision": 0.2936437583754312, "rouge2_precision_stderr": 0.002766357156065721, "rouge2_recall": 0.2296605325605603, "rouge2_recall_stderr": 0.002239048819483412, "rougeL_fmeasure": 0.35476450327695513, "rougeL_fmeasure_stderr": 0.002131136688683226, "rougeL_precision": 0.42323041568862063, "rougeL_precision_stderr": 0.00299893377825116, "rougeL_recall": 0.3336509571396467, "rougeL_recall_stderr": 0.002463831973937884, "rougeLsum_fmeasure": 0.40259898572566205, "rougeLsum_fmeasure_stderr": 0.0023428037926685654, "rougeLsum_precision": 0.47879240286661645, "rougeLsum_precision_stderr": 0.0032211942725843233, "rougeLsum_recall": 0.3788603945042402, "rougeLsum_recall_stderr": 0.00272506620717064}}, "4": {"generate_text_restaurant": {"bleu": 14.568456206535862, "bleu_stderr": 0.22714934644025087, "rouge1_fmeasure": 0.49248119559722, "rouge1_fmeasure_stderr": 0.002261462995557444, "rouge1_precision": 0.5824109780846385, "rouge1_precision_stderr": 0.0032128656177573896, "rouge1_recall": 0.46303711017335764, "rouge1_recall_stderr": 0.0028550395782162385, "rouge2_fmeasure": 0.24852828649672148, "rouge2_fmeasure_stderr": 0.0020894492308823178, "rouge2_precision": 0.2975497604665679, "rouge2_precision_stderr": 0.002721358209608908, "rouge2_recall": 0.2337393664335435, "rouge2_recall_stderr": 0.0022535476965624083, "rougeL_fmeasure": 0.35908240651080353, "rougeL_fmeasure_stderr": 0.0021535460141111546, "rougeL_precision": 0.4258973373500384, "rougeL_precision_stderr": 0.0029570811260566745, "rougeL_recall": 0.33738654578439453, "rougeL_recall_stderr": 0.002480938975354226, "rougeLsum_fmeasure": 0.4073362598730636, "rougeLsum_fmeasure_stderr": 0.002350552518906019, "rougeLsum_precision": 0.48186572666282207, "rougeLsum_precision_stderr": 0.0031731113183941597, "rougeLsum_recall": 0.3829876385027774, "rougeLsum_recall_stderr": 0.0027332507970680904}}, "5": {"generate_text_restaurant": {"bleu": 14.41705650902542, "bleu_stderr": 0.25051935957566557, "rouge1_fmeasure": 0.4912358527300658, "rouge1_fmeasure_stderr": 0.002175083911938509, "rouge1_precision": 0.5768002584328835, "rouge1_precision_stderr": 0.003210936196026848, "rouge1_recall": 0.4663927464698937, "rouge1_recall_stderr": 0.002827189059265761, "rouge2_fmeasure": 0.24634621400768708, "rouge2_fmeasure_stderr": 0.002025833005255322, "rouge2_precision": 0.2929623409468226, "rouge2_precision_stderr": 0.0026747147184981385, "rouge2_recall": 0.2340255710785021, "rouge2_recall_stderr": 0.002212699322566578, "rougeL_fmeasure": 0.35597711356903294, "rougeL_fmeasure_stderr": 0.002065825901549598, "rougeL_precision": 0.41839619423807317, "rougeL_precision_stderr": 0.0028660522019280242, "rougeL_recall": 0.3383776885015685, "rougeL_recall_stderr": 0.0024683861897523925, "rougeLsum_fmeasure": 0.4066143622258549, "rougeLsum_fmeasure_stderr": 0.002273545252564866, "rougeLsum_precision": 0.47696170422006223, "rougeLsum_precision_stderr": 0.003098280726576402, "rougeLsum_recall": 0.3864090320075692, "rougeLsum_recall_stderr": 0.0027224907209281047}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 2.242352554457821, "bleu_stderr": 0.06303290180001715, "rouge1_fmeasure": 0.22142206258867178, "rouge1_fmeasure_stderr": 0.002657386115409225, "rouge1_precision": 0.17908873736938333, "rouge1_precision_stderr": 0.0025998582918028913, "rouge1_recall": 0.3401581574130041, "rouge1_recall_stderr": 0.00466124187806079, "rouge2_fmeasure": 0.0511787638415587, "rouge2_fmeasure_stderr": 0.0017012685833384458, "rouge2_precision": 0.04001978076164408, "rouge2_precision_stderr": 0.00143853172997629, "rouge2_recall": 0.08351989855551167, "rouge2_recall_stderr": 0.002908378017045409, "rougeL_fmeasure": 0.16457376114227693, "rougeL_fmeasure_stderr": 0.002030624196291875, "rougeL_precision": 0.13280826032727655, "rougeL_precision_stderr": 0.0019720134198053826, "rougeL_recall": 0.2547013277658435, "rougeL_recall_stderr": 0.0036980006484927316, "rougeLsum_fmeasure": 0.1721074292499855, "rougeLsum_fmeasure_stderr": 0.002183282479578269, "rougeLsum_precision": 0.13820058290248866, "rougeLsum_precision_stderr": 0.0020236107693674434, "rougeLsum_recall": 0.267820674383363, "rougeLsum_recall_stderr": 0.00406330233863675}}, "1": {"article_DOC_summary": {"bleu": 1.8494036251126653, "bleu_stderr": 0.06618274112679547, "rouge1_fmeasure": 0.19996151191164502, "rouge1_fmeasure_stderr": 0.0024642136191649943, "rouge1_precision": 0.14242240386934715, "rouge1_precision_stderr": 0.0018474131654211898, "rouge1_recall": 0.34972417416826374, "rouge1_recall_stderr": 0.00425304183688617, "rouge2_fmeasure": 0.04515071736102295, "rouge2_fmeasure_stderr": 0.0014958437813087835, "rouge2_precision": 0.03180784324852304, "rouge2_precision_stderr": 0.0010605401760687887, "rouge2_recall": 0.08122973807701163, "rouge2_recall_stderr": 0.0027530425274732025, "rougeL_fmeasure": 0.15185456372717573, "rougeL_fmeasure_stderr": 0.0018177177985044526, "rougeL_precision": 0.10785508103994479, "rougeL_precision_stderr": 0.001342675196432051, "rougeL_recall": 0.26778299938242467, "rougeL_recall_stderr": 0.0033228224655886393, "rougeLsum_fmeasure": 0.16002746501050483, "rougeLsum_fmeasure_stderr": 0.002040753526176795, "rougeLsum_precision": 0.11366701902108305, "rougeLsum_precision_stderr": 0.0014987342312601044, "rougeLsum_recall": 0.28182954712893066, "rougeLsum_recall_stderr": 0.0036825745017303583}}, "2": {"article_DOC_summary": {"bleu": 1.9553979785993556, "bleu_stderr": 0.08114119801334493, "rouge1_fmeasure": 0.20066139374359412, "rouge1_fmeasure_stderr": 0.002583892537384957, "rouge1_precision": 0.14299555153351842, "rouge1_precision_stderr": 0.0019414837646538163, "rouge1_recall": 0.35054680023331225, "rouge1_recall_stderr": 0.004405959066068025, "rouge2_fmeasure": 0.047730927310845786, "rouge2_fmeasure_stderr": 0.0016012182287873963, "rouge2_precision": 0.03372540037348309, "rouge2_precision_stderr": 0.0011433968826317544, "rouge2_recall": 0.08536452458478411, "rouge2_recall_stderr": 0.002896468085770253, "rougeL_fmeasure": 0.15423466735433622, "rougeL_fmeasure_stderr": 0.0019141237080501433, "rougeL_precision": 0.1096711314096099, "rougeL_precision_stderr": 0.0014240979490601532, "rougeL_recall": 0.2713048964277041, "rougeL_recall_stderr": 0.003435168695225616, "rougeLsum_fmeasure": 0.16073844532804232, "rougeLsum_fmeasure_stderr": 0.0021770573542344426, "rougeLsum_precision": 0.11432354351222646, "rougeLsum_precision_stderr": 0.0016135722781519138, "rougeLsum_recall": 0.282399261929163, "rougeLsum_recall_stderr": 0.0038458320187164767}}, "3": {"article_DOC_summary": {"bleu": 1.9899134724216982, "bleu_stderr": 0.08189694158167818, "rouge1_fmeasure": 0.19424816162568462, "rouge1_fmeasure_stderr": 0.002758326610864678, "rouge1_precision": 0.14095312565957024, "rouge1_precision_stderr": 0.0021252189798371952, "rouge1_recall": 0.3355112558235932, "rouge1_recall_stderr": 0.00482038827448099, "rouge2_fmeasure": 0.04656621187743751, "rouge2_fmeasure_stderr": 0.001620760377451161, "rouge2_precision": 0.03309503575773881, "rouge2_precision_stderr": 0.0011583105646001772, "rouge2_recall": 0.08361606756802129, "rouge2_recall_stderr": 0.0030274265177690917, "rougeL_fmeasure": 0.14844786782549954, "rougeL_fmeasure_stderr": 0.002106590246901777, "rougeL_precision": 0.10750740692234483, "rougeL_precision_stderr": 0.001617470504570499, "rougeL_recall": 0.25822344513710505, "rougeL_recall_stderr": 0.0038342113677037708, "rougeLsum_fmeasure": 0.15564298400864224, "rougeLsum_fmeasure_stderr": 0.002325750760252049, "rougeLsum_precision": 0.11272654966890937, "rougeLsum_precision_stderr": 0.0017739663038892394, "rougeLsum_recall": 0.2704314687293562, "rougeLsum_recall_stderr": 0.0041899251242752955}}, "4": {"article_DOC_summary": {"bleu": 0.851414956048288, "bleu_stderr": 0.10142038717157466, "rouge1_fmeasure": 0.05061277872693584, "rouge1_fmeasure_stderr": 0.0028337392524855837, "rouge1_precision": 0.04182867272383347, "rouge1_precision_stderr": 0.002516912133041032, "rouge1_recall": 0.08068317129523372, "rouge1_recall_stderr": 0.004630110172525636, "rouge2_fmeasure": 0.010817994039374855, "rouge2_fmeasure_stderr": 0.0009898135477985153, "rouge2_precision": 0.00821242826897234, "rouge2_precision_stderr": 0.000780085704496626, "rouge2_recall": 0.018229654639556718, "rouge2_recall_stderr": 0.0016649615737807282, "rougeL_fmeasure": 0.038452182498697945, "rougeL_fmeasure_stderr": 0.002124389719631779, "rougeL_precision": 0.03237406484505732, "rougeL_precision_stderr": 0.0020316037823294927, "rougeL_recall": 0.06169464366711305, "rougeL_recall_stderr": 0.0035477374875163793, "rougeLsum_fmeasure": 0.040956310132902136, "rougeLsum_fmeasure_stderr": 0.0023102690323821627, "rougeLsum_precision": 0.03434532775935572, "rougeLsum_precision_stderr": 0.0021605467450954603, "rougeLsum_recall": 0.06559190633881043, "rougeLsum_recall_stderr": 0.0038270052788935026}}, "5": {"article_DOC_summary": {"bleu": 2.3013943780107486e-40, "bleu_stderr": 6.513754776072693e-35, "rouge1_fmeasure": 0.0019051009413407058, "rouge1_fmeasure_stderr": 0.0005593343846105789, "rouge1_precision": 0.0021529907822185413, "rouge1_precision_stderr": 0.0006324831746531657, "rouge1_recall": 0.001764574432238271, "rouge1_recall_stderr": 0.0005172389485732619, "rouge2_fmeasure": 0.0001299594149643802, "rouge2_fmeasure_stderr": 7.503370260000825e-05, "rouge2_precision": 0.0001457415441877151, "rouge2_precision_stderr": 8.410282821934284e-05, "rouge2_recall": 0.00011802662746058974, "rouge2_recall_stderr": 6.837858900511585e-05, "rougeL_fmeasure": 0.0015504765957310557, "rougeL_fmeasure_stderr": 0.0004402385576724586, "rougeL_precision": 0.0017522974182971845, "rougeL_precision_stderr": 0.000503946684193751, "rougeL_recall": 0.0014399120468157657, "rougeL_recall_stderr": 0.0004056116387189239, "rougeLsum_fmeasure": 0.0015923123485654278, "rougeLsum_fmeasure_stderr": 0.00044995087651658854, "rougeLsum_precision": 0.0018058994766162238, "rougeLsum_precision_stderr": 0.0005178578773672206, "rougeLsum_recall": 0.001474217364139951, "rougeLsum_recall_stderr": 0.0004127036649374616}}}} |