Muennighoff's picture
A
eb2a9c4
{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.31224558314839784, "bleu_stderr": 0.03713618627951878, "rouge1_fmeasure": 0.09597672933276848, "rouge1_fmeasure_stderr": 0.002119566893316448, "rouge1_precision": 0.06416860697398828, "rouge1_precision_stderr": 0.0017145071144190034, "rouge1_recall": 0.27658877051081887, "rouge1_recall_stderr": 0.004689276935825928, "rouge2_fmeasure": 0.04369490354925837, "rouge2_fmeasure_stderr": 0.0012778025959773575, "rouge2_precision": 0.02898895600657147, "rouge2_precision_stderr": 0.0009732573595948091, "rouge2_recall": 0.12474346123394711, "rouge2_recall_stderr": 0.003103993275317445, "rougeL_fmeasure": 0.0916810654796967, "rougeL_fmeasure_stderr": 0.0019730758573202655, "rougeL_precision": 0.061168279447352224, "rougeL_precision_stderr": 0.0016042565824939442, "rougeL_recall": 0.2661016573130979, "rougeL_recall_stderr": 0.004476805597758023, "rougeLsum_fmeasure": 0.09077121152470446, "rougeLsum_fmeasure_stderr": 0.002000842365909719, "rougeLsum_precision": 0.06079097382146833, "rougeLsum_precision_stderr": 0.001638980434900789, "rougeLsum_recall": 0.2611818383395376, "rougeLsum_recall_stderr": 0.004408937318215278}}, "1": {"PALM_prompt": {"bleu": 0.3392027660661122, "bleu_stderr": 0.021974513144963268, "rouge1_fmeasure": 0.10098636709306053, "rouge1_fmeasure_stderr": 0.0018586237655962318, "rouge1_precision": 0.0649237002813453, "rouge1_precision_stderr": 0.0013836117996389116, "rouge1_recall": 0.3252507747834447, "rouge1_recall_stderr": 0.004830093238320235, "rouge2_fmeasure": 0.0456950711509664, "rouge2_fmeasure_stderr": 0.0011687980868032475, "rouge2_precision": 0.029412803554314693, "rouge2_precision_stderr": 0.000840010407149539, "rouge2_recall": 0.1489985792608451, "rouge2_recall_stderr": 0.0033169694716508446, "rougeL_fmeasure": 0.09597600266569703, "rougeL_fmeasure_stderr": 0.0017278112461683963, "rougeL_precision": 0.06161199072970022, "rougeL_precision_stderr": 0.001272442500492367, "rougeL_recall": 0.30851984711534297, "rougeL_recall_stderr": 0.004479724678989707, "rougeLsum_fmeasure": 0.09646257885608286, "rougeLsum_fmeasure_stderr": 0.0017756689280714777, "rougeLsum_precision": 0.062043590899161734, "rougeLsum_precision_stderr": 0.0013176307073547546, "rougeLsum_recall": 0.3089691495669342, "rougeLsum_recall_stderr": 0.004492168762956442}}, "2": {"PALM_prompt": {"bleu": 0.3654954806712323, "bleu_stderr": 0.025040063648794096, "rouge1_fmeasure": 0.10670235122995915, "rouge1_fmeasure_stderr": 0.001806209828663936, "rouge1_precision": 0.06820653358439158, "rouge1_precision_stderr": 0.0013447524023065525, "rouge1_recall": 0.3459044512732088, "rouge1_recall_stderr": 0.004653942809147225, "rouge2_fmeasure": 0.048680867420328906, "rouge2_fmeasure_stderr": 0.001161761999498929, "rouge2_precision": 0.03109751061942729, "rouge2_precision_stderr": 0.0008314173693090511, "rouge2_recall": 0.16361070245426873, "rouge2_recall_stderr": 0.0034348511874994717, "rougeL_fmeasure": 0.10152476531671561, "rougeL_fmeasure_stderr": 0.0016858485831521945, "rougeL_precision": 0.06484016065528389, "rougeL_precision_stderr": 0.0012401376869968777, "rougeL_recall": 0.3269715065567825, "rougeL_recall_stderr": 0.004272067994546378, "rougeLsum_fmeasure": 0.10225161251115494, "rougeLsum_fmeasure_stderr": 0.0017327367584781756, "rougeLsum_precision": 0.06536251718368276, "rougeLsum_precision_stderr": 0.0012825569934637642, "rougeLsum_recall": 0.32966818044940316, "rougeLsum_recall_stderr": 0.004368989276954383}}, "3": {"PALM_prompt": {"bleu": 0.3592609344640833, "bleu_stderr": 0.02304406751100301, "rouge1_fmeasure": 0.10565789241386328, "rouge1_fmeasure_stderr": 0.0017663252684883553, "rouge1_precision": 0.06727272384378305, "rouge1_precision_stderr": 0.0012989075786256402, "rouge1_recall": 0.34514411045024723, "rouge1_recall_stderr": 0.004734096982650293, "rouge2_fmeasure": 0.04863415417606342, "rouge2_fmeasure_stderr": 0.0011329644835331011, "rouge2_precision": 0.030916825454777475, "rouge2_precision_stderr": 0.0008056451738364325, "rouge2_recall": 0.1658153905976806, "rouge2_recall_stderr": 0.003481711090228483, "rougeL_fmeasure": 0.10036601085777433, "rougeL_fmeasure_stderr": 0.0016502859429412418, "rougeL_precision": 0.06386360352562777, "rougeL_precision_stderr": 0.0012027232237294206, "rougeL_recall": 0.32523617484648604, "rougeL_recall_stderr": 0.004324297311903695, "rougeLsum_fmeasure": 0.10090783330802172, "rougeLsum_fmeasure_stderr": 0.0016784875419119682, "rougeLsum_precision": 0.06426144521188693, "rougeLsum_precision_stderr": 0.0012323427980484077, "rougeLsum_recall": 0.32867237062843047, "rougeLsum_recall_stderr": 0.004443576841012128}}, "4": {"PALM_prompt": {"bleu": 0.37835540251359956, "bleu_stderr": 0.028435806983719093, "rouge1_fmeasure": 0.10677394877416337, "rouge1_fmeasure_stderr": 0.0017419426846328717, "rouge1_precision": 0.06785826306020468, "rouge1_precision_stderr": 0.0012639461669679325, "rouge1_recall": 0.3474520077766322, "rouge1_recall_stderr": 0.004635808596091852, "rouge2_fmeasure": 0.04926079317014994, "rouge2_fmeasure_stderr": 0.0011176582047592932, "rouge2_precision": 0.03118629908795949, "rouge2_precision_stderr": 0.0007824248126301933, "rouge2_recall": 0.1686112674466713, "rouge2_recall_stderr": 0.0034686723713827842, "rougeL_fmeasure": 0.1015063853834285, "rougeL_fmeasure_stderr": 0.0016330220290649304, "rougeL_precision": 0.06446018636445104, "rougeL_precision_stderr": 0.0011767040252516788, "rougeL_recall": 0.3290377644596475, "rougeL_recall_stderr": 0.00429945865540488, "rougeLsum_fmeasure": 0.10255214222995561, "rougeLsum_fmeasure_stderr": 0.0016742530012902649, "rougeLsum_precision": 0.06518870615697699, "rougeLsum_precision_stderr": 0.0012152427779437518, "rougeLsum_recall": 0.3330559516297193, "rougeLsum_recall_stderr": 0.004414312796704986}}, "5": {"PALM_prompt": {"bleu": 0.3707957491393801, "bleu_stderr": 0.03149803172288385, "rouge1_fmeasure": 0.10804595534435403, "rouge1_fmeasure_stderr": 0.0016819251634874286, "rouge1_precision": 0.06864134680013424, "rouge1_precision_stderr": 0.0012322679271972023, "rouge1_recall": 0.35035957224055103, "rouge1_recall_stderr": 0.004525153332145143, "rouge2_fmeasure": 0.04953443120550419, "rouge2_fmeasure_stderr": 0.0010974380500823572, "rouge2_precision": 0.03135388148292866, "rouge2_precision_stderr": 0.0007751648761981692, "rouge2_recall": 0.16896861616649583, "rouge2_recall_stderr": 0.003345397272046064, "rougeL_fmeasure": 0.10248439747284772, "rougeL_fmeasure_stderr": 0.0015852907542033721, "rougeL_precision": 0.06510326325941494, "rougeL_precision_stderr": 0.0011560260507405354, "rougeL_recall": 0.33044293852360024, "rougeL_recall_stderr": 0.004153133131273199, "rougeLsum_fmeasure": 0.10323556805167783, "rougeLsum_fmeasure_stderr": 0.0016059700043438213, "rougeLsum_precision": 0.0656014791935983, "rougeLsum_precision_stderr": 0.0011776642200350253, "rougeLsum_recall": 0.3339836287603389, "rougeLsum_recall_stderr": 0.004260131546440473}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.6375281102002284, "bleu_stderr": 0.049083205722565484, "rouge1_fmeasure": 0.1821170022700696, "rouge1_fmeasure_stderr": 0.0018365968765570223, "rouge1_precision": 0.15526703395478428, "rouge1_precision_stderr": 0.0019048385092560274, "rouge1_recall": 0.2657362987772207, "rouge1_recall_stderr": 0.002621491681886565, "rouge2_fmeasure": 0.037881954687990986, "rouge2_fmeasure_stderr": 0.0008453802181656135, "rouge2_precision": 0.03206185435985054, "rouge2_precision_stderr": 0.000759586624489302, "rouge2_recall": 0.057440011896085316, "rouge2_recall_stderr": 0.0014245492222374873, "rougeL_fmeasure": 0.1431674380673611, "rougeL_fmeasure_stderr": 0.0013181357642786014, "rougeL_precision": 0.12048492403451228, "rougeL_precision_stderr": 0.0013325755443150576, "rougeL_recall": 0.21415389684069874, "rougeL_recall_stderr": 0.002145834100436848, "rougeLsum_fmeasure": 0.1673439925521862, "rougeLsum_fmeasure_stderr": 0.0016912749684659687, "rougeLsum_precision": 0.14253479978773045, "rougeLsum_precision_stderr": 0.0017513462587583613, "rougeLsum_recall": 0.24495352588719183, "rougeLsum_recall_stderr": 0.0024490806612200763}}, "1": {"tldr_en": {"bleu": 2.3919433608178244, "bleu_stderr": 0.08548762264678461, "rouge1_fmeasure": 0.20800416624670884, "rouge1_fmeasure_stderr": 0.0019096560966773478, "rouge1_precision": 0.17980706675942354, "rouge1_precision_stderr": 0.002098175664461687, "rouge1_recall": 0.3009360804108007, "rouge1_recall_stderr": 0.002722466712920559, "rouge2_fmeasure": 0.046870008000920206, "rouge2_fmeasure_stderr": 0.0009635114797446192, "rouge2_precision": 0.040412609345037494, "rouge2_precision_stderr": 0.000890482142333157, "rouge2_recall": 0.0707443093699949, "rouge2_recall_stderr": 0.0016525596112716557, "rougeL_fmeasure": 0.1486340507538382, "rougeL_fmeasure_stderr": 0.0012723389369324837, "rougeL_precision": 0.1268309364742902, "rougeL_precision_stderr": 0.0013760396751293185, "rougeL_recall": 0.22173573063373433, "rougeL_recall_stderr": 0.0021719897093334284, "rougeLsum_fmeasure": 0.1951271284074896, "rougeLsum_fmeasure_stderr": 0.0017825943482372452, "rougeLsum_precision": 0.1684402130679538, "rougeLsum_precision_stderr": 0.00195351875600882, "rougeLsum_recall": 0.2830602164220028, "rougeLsum_recall_stderr": 0.0025790890750399965}}, "2": {"tldr_en": {"bleu": 2.5303113987588, "bleu_stderr": 0.06314873438274192, "rouge1_fmeasure": 0.21350784531146766, "rouge1_fmeasure_stderr": 0.0018372008047181686, "rouge1_precision": 0.19024342341910272, "rouge1_precision_stderr": 0.002270091248824654, "rouge1_recall": 0.30688686376798624, "rouge1_recall_stderr": 0.002645904846436756, "rouge2_fmeasure": 0.049493121373645386, "rouge2_fmeasure_stderr": 0.0009770655274603632, "rouge2_precision": 0.04485105522627462, "rouge2_precision_stderr": 0.0011025549402209852, "rouge2_recall": 0.07310002107093573, "rouge2_recall_stderr": 0.0016239815932843845, "rougeL_fmeasure": 0.15386240322179967, "rougeL_fmeasure_stderr": 0.001284009017533657, "rougeL_precision": 0.13675580244350435, "rougeL_precision_stderr": 0.0016853525652057188, "rougeL_recall": 0.22643200780218806, "rougeL_recall_stderr": 0.002155739575675694, "rougeLsum_fmeasure": 0.20135002510431343, "rougeLsum_fmeasure_stderr": 0.0017256845604918154, "rougeLsum_precision": 0.17941688106712367, "rougeLsum_precision_stderr": 0.002150275172122676, "rougeLsum_recall": 0.28991649578115825, "rougeLsum_recall_stderr": 0.0025125824058213043}}, "3": {"tldr_en": {"bleu": 2.5056315812266687, "bleu_stderr": 0.0987654628167384, "rouge1_fmeasure": 0.17905977454735247, "rouge1_fmeasure_stderr": 0.0021682988144671764, "rouge1_precision": 0.1667156419346577, "rouge1_precision_stderr": 0.0025223421653541435, "rouge1_recall": 0.2556133564452001, "rouge1_recall_stderr": 0.003255288422257417, "rouge2_fmeasure": 0.04118261236702404, "rouge2_fmeasure_stderr": 0.0009347304524167121, "rouge2_precision": 0.0388323173701326, "rouge2_precision_stderr": 0.0010940369607383355, "rouge2_recall": 0.06213727178884212, "rouge2_recall_stderr": 0.001669610738631409, "rougeL_fmeasure": 0.12952435483301103, "rougeL_fmeasure_stderr": 0.0015357281079718173, "rougeL_precision": 0.12089310071398937, "rougeL_precision_stderr": 0.0018705319801461653, "rougeL_recall": 0.18919380915956352, "rougeL_recall_stderr": 0.002567644889149163, "rougeLsum_fmeasure": 0.16910312476864786, "rougeLsum_fmeasure_stderr": 0.0020403281058382705, "rougeLsum_precision": 0.1573503817985137, "rougeLsum_precision_stderr": 0.0023805026761902592, "rougeLsum_recall": 0.24220269466463637, "rougeLsum_recall_stderr": 0.003114884743178747}}, "4": {"tldr_en": {"bleu": 0.558593061097989, "bleu_stderr": 0.04095297851543845, "rouge1_fmeasure": 0.05795016970693355, "rouge1_fmeasure_stderr": 0.001916255841264876, "rouge1_precision": 0.05512873037041646, "rouge1_precision_stderr": 0.002053021409006724, "rouge1_recall": 0.08653039568969556, "rouge1_recall_stderr": 0.002932898045655817, "rouge2_fmeasure": 0.013165816959927556, "rouge2_fmeasure_stderr": 0.0006382389780016135, "rouge2_precision": 0.012291396262431102, "rouge2_precision_stderr": 0.0006860904350077833, "rouge2_recall": 0.021084941019315177, "rouge2_recall_stderr": 0.001188230063769281, "rougeL_fmeasure": 0.043071887152266786, "rougeL_fmeasure_stderr": 0.001407113300208392, "rougeL_precision": 0.04126037678616895, "rougeL_precision_stderr": 0.0015664586581985208, "rougeL_recall": 0.06589363408283794, "rougeL_recall_stderr": 0.002292257294557098, "rougeLsum_fmeasure": 0.054561504253622946, "rougeLsum_fmeasure_stderr": 0.00180105400180901, "rougeLsum_precision": 0.0520537723141164, "rougeLsum_precision_stderr": 0.0019443085493386046, "rougeLsum_recall": 0.08158523490668657, "rougeLsum_recall_stderr": 0.0027709770644967647}}, "5": {"tldr_en": {"bleu": 2.49693387658237e-06, "bleu_stderr": 4.9254476844807124e-06, "rouge1_fmeasure": 0.009411385725263191, "rouge1_fmeasure_stderr": 0.0008471619506817471, "rouge1_precision": 0.009598793842482911, "rouge1_precision_stderr": 0.0010135227951615076, "rouge1_recall": 0.014751731366643654, "rouge1_recall_stderr": 0.0013823298706162432, "rouge2_fmeasure": 0.0024221607010753237, "rouge2_fmeasure_stderr": 0.00029561192228850174, "rouge2_precision": 0.0025860727447622914, "rouge2_precision_stderr": 0.00048780227870820193, "rouge2_recall": 0.004211421745829904, "rouge2_recall_stderr": 0.0005814098675929214, "rougeL_fmeasure": 0.007136631099672401, "rougeL_fmeasure_stderr": 0.0006388509886284223, "rougeL_precision": 0.007459585367896189, "rougeL_precision_stderr": 0.000834881509938252, "rougeL_recall": 0.011482514249452291, "rougeL_recall_stderr": 0.0011106961669246301, "rougeLsum_fmeasure": 0.008925101458585369, "rougeLsum_fmeasure_stderr": 0.0008030681343683619, "rougeLsum_precision": 0.009060670979252713, "rougeLsum_precision_stderr": 0.0009579283395946946, "rougeLsum_recall": 0.014087779059365814, "rougeLsum_recall_stderr": 0.0013315634718775852}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 4.780545170170601, "bleu_stderr": 0.07118121769393712, "rouge1_fmeasure": 0.23246731745402952, "rouge1_fmeasure_stderr": 0.0017141203715973089, "rouge1_precision": 0.1774633723287846, "rouge1_precision_stderr": 0.0015636360094331604, "rouge1_recall": 0.364075043069517, "rouge1_recall_stderr": 0.002322444967434633, "rouge2_fmeasure": 0.09329941078416822, "rouge2_fmeasure_stderr": 0.0011794536309790357, "rouge2_precision": 0.06978291968631191, "rouge2_precision_stderr": 0.0009315100071943132, "rouge2_recall": 0.14929846575132927, "rouge2_recall_stderr": 0.0018334497217483083, "rougeL_fmeasure": 0.2052968426221788, "rougeL_fmeasure_stderr": 0.0013740335300801536, "rougeL_precision": 0.1559347512157101, "rougeL_precision_stderr": 0.0012468570328765438, "rougeL_recall": 0.3246942073486663, "rougeL_recall_stderr": 0.002000868521767354, "rougeLsum_fmeasure": 0.20379402537245084, "rougeLsum_fmeasure_stderr": 0.0016105541434803087, "rougeLsum_precision": 0.15543450901475353, "rougeLsum_precision_stderr": 0.0014302666176517367, "rougeLsum_recall": 0.3196428693668727, "rougeLsum_recall_stderr": 0.002242319012699104}}, "1": {"generate_text_restaurant": {"bleu": 6.940570293175053, "bleu_stderr": 0.10104547668423318, "rouge1_fmeasure": 0.3575800722995913, "rouge1_fmeasure_stderr": 0.002127689173825895, "rouge1_precision": 0.3496601719591484, "rouge1_precision_stderr": 0.002849559103688844, "rouge1_recall": 0.42359261277664634, "rouge1_recall_stderr": 0.002763477540076445, "rouge2_fmeasure": 0.142023180586533, "rouge2_fmeasure_stderr": 0.0014957539772810853, "rouge2_precision": 0.1429410376669936, "rouge2_precision_stderr": 0.0020796619782422693, "rouge2_recall": 0.1705613877983603, "rouge2_recall_stderr": 0.0019090729632325418, "rougeL_fmeasure": 0.2540611971473509, "rougeL_fmeasure_stderr": 0.001515044497001407, "rougeL_precision": 0.24812697347482596, "rougeL_precision_stderr": 0.0022073871312320963, "rougeL_recall": 0.30667916863775024, "rougeL_recall_stderr": 0.002283669807725874, "rougeLsum_fmeasure": 0.2953396678867069, "rougeLsum_fmeasure_stderr": 0.0019610430628804647, "rougeLsum_precision": 0.29053903973532214, "rougeLsum_precision_stderr": 0.002642421636933054, "rougeLsum_recall": 0.34937076105340387, "rougeLsum_recall_stderr": 0.002510233957991074}}, "2": {"generate_text_restaurant": {"bleu": 9.578029851318268, "bleu_stderr": 0.201482009124794, "rouge1_fmeasure": 0.38938815590089454, "rouge1_fmeasure_stderr": 0.002015416977580809, "rouge1_precision": 0.39404892212892395, "rouge1_precision_stderr": 0.0028317434398928863, "rouge1_recall": 0.4314560771401939, "rouge1_recall_stderr": 0.002630398723273804, "rouge2_fmeasure": 0.17045725388262045, "rouge2_fmeasure_stderr": 0.0016711304351085842, "rouge2_precision": 0.17484313787847716, "rouge2_precision_stderr": 0.0021450695622140473, "rouge2_recall": 0.19062521235801827, "rouge2_recall_stderr": 0.0020301066688945897, "rougeL_fmeasure": 0.28720479387341713, "rougeL_fmeasure_stderr": 0.00166490138295134, "rougeL_precision": 0.2902089433918642, "rougeL_precision_stderr": 0.002309942464742442, "rougeL_recall": 0.3208704945592194, "rougeL_recall_stderr": 0.0022660826248778083, "rougeLsum_fmeasure": 0.3266334163588423, "rougeLsum_fmeasure_stderr": 0.001973231465683255, "rougeLsum_precision": 0.3310651908517372, "rougeLsum_precision_stderr": 0.002649650064405018, "rougeLsum_recall": 0.36193836102433935, "rougeLsum_recall_stderr": 0.002507014363898419}}, "3": {"generate_text_restaurant": {"bleu": 10.920454433065684, "bleu_stderr": 0.1316943729685155, "rouge1_fmeasure": 0.40421930965797104, "rouge1_fmeasure_stderr": 0.001965580619381596, "rouge1_precision": 0.4192958302681238, "rouge1_precision_stderr": 0.0027833911244728436, "rouge1_recall": 0.43191640398277037, "rouge1_recall_stderr": 0.0025958195715232047, "rouge2_fmeasure": 0.181728403672227, "rouge2_fmeasure_stderr": 0.0017180728141282062, "rouge2_precision": 0.19011172601557672, "rouge2_precision_stderr": 0.002113152497347813, "rouge2_recall": 0.19573521805211624, "rouge2_recall_stderr": 0.002055597667273278, "rougeL_fmeasure": 0.3004132022131482, "rougeL_fmeasure_stderr": 0.001744736531356786, "rougeL_precision": 0.31151155319807905, "rougeL_precision_stderr": 0.002356738120811969, "rougeL_recall": 0.3223236931614774, "rougeL_recall_stderr": 0.0022747777223757824, "rougeLsum_fmeasure": 0.34264109704469076, "rougeLsum_fmeasure_stderr": 0.001982280995883766, "rougeLsum_precision": 0.35498206085286044, "rougeLsum_precision_stderr": 0.002606574588757685, "rougeLsum_recall": 0.3668525311353958, "rougeLsum_recall_stderr": 0.0025367007147142026}}, "4": {"generate_text_restaurant": {"bleu": 11.500897320173257, "bleu_stderr": 0.1956034095087363, "rouge1_fmeasure": 0.41092706000969503, "rouge1_fmeasure_stderr": 0.002013505579199469, "rouge1_precision": 0.42930123866901915, "rouge1_precision_stderr": 0.002802161499400842, "rouge1_recall": 0.4331782904924909, "rouge1_recall_stderr": 0.002577476100131464, "rouge2_fmeasure": 0.18641178852244134, "rouge2_fmeasure_stderr": 0.0017617429227832714, "rouge2_precision": 0.1963741088023231, "rouge2_precision_stderr": 0.002127045475765985, "rouge2_recall": 0.19754483584480773, "rouge2_recall_stderr": 0.002036905880965759, "rougeL_fmeasure": 0.30804933657878797, "rougeL_fmeasure_stderr": 0.0018042408542884843, "rougeL_precision": 0.32184870299119356, "rougeL_precision_stderr": 0.0023948432966585135, "rougeL_recall": 0.32560487667250465, "rougeL_recall_stderr": 0.0022611096432227965, "rougeLsum_fmeasure": 0.35022280659725025, "rougeLsum_fmeasure_stderr": 0.002028073865541317, "rougeLsum_precision": 0.36559763624883224, "rougeLsum_precision_stderr": 0.0026458064257003032, "rougeLsum_recall": 0.3697574496463752, "rougeLsum_recall_stderr": 0.0025156597623565424}}, "5": {"generate_text_restaurant": {"bleu": 11.771270305618712, "bleu_stderr": 0.17412022732055477, "rouge1_fmeasure": 0.41830245139279826, "rouge1_fmeasure_stderr": 0.002021004042601933, "rouge1_precision": 0.43818215510000286, "rouge1_precision_stderr": 0.0028851585855894776, "rouge1_recall": 0.4399123520832634, "rouge1_recall_stderr": 0.0025733621012235895, "rouge2_fmeasure": 0.1917272606223869, "rouge2_fmeasure_stderr": 0.001783066182693068, "rouge2_precision": 0.20257411232135283, "rouge2_precision_stderr": 0.0021820200889344113, "rouge2_recall": 0.20260609597182416, "rouge2_recall_stderr": 0.0020654299321480334, "rougeL_fmeasure": 0.31474259806009264, "rougeL_fmeasure_stderr": 0.0018056447106615293, "rougeL_precision": 0.32996450967513996, "rougeL_precision_stderr": 0.0024791014115638364, "rougeL_recall": 0.331872138433623, "rougeL_recall_stderr": 0.0022597005060796707, "rougeLsum_fmeasure": 0.35845598302759274, "rougeLsum_fmeasure_stderr": 0.002046672331208988, "rougeLsum_precision": 0.37550892623756665, "rougeLsum_precision_stderr": 0.0027651776519762796, "rougeLsum_recall": 0.377168038065161, "rougeLsum_recall_stderr": 0.002496827725922857}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.8174302706970622, "bleu_stderr": 0.11196728320067137, "rouge1_fmeasure": 0.20114774044747769, "rouge1_fmeasure_stderr": 0.0025269409205907075, "rouge1_precision": 0.1545989297987524, "rouge1_precision_stderr": 0.0022684654702864685, "rouge1_recall": 0.3221703515084542, "rouge1_recall_stderr": 0.004289581865346496, "rouge2_fmeasure": 0.04288345569115875, "rouge2_fmeasure_stderr": 0.00150423780993115, "rouge2_precision": 0.0319437568430621, "rouge2_precision_stderr": 0.0011634686267094517, "rouge2_recall": 0.07254495732539187, "rouge2_recall_stderr": 0.0026632962610127395, "rougeL_fmeasure": 0.15252407111150582, "rougeL_fmeasure_stderr": 0.001904423395546802, "rougeL_precision": 0.11668807171332557, "rougeL_precision_stderr": 0.0016652450570352347, "rougeL_recall": 0.24679085078761165, "rougeL_recall_stderr": 0.003463508045372628, "rougeLsum_fmeasure": 0.15637245537010086, "rougeLsum_fmeasure_stderr": 0.0020947672689738675, "rougeLsum_precision": 0.11942635042403643, "rougeLsum_precision_stderr": 0.0017706637778327492, "rougeLsum_recall": 0.25332562732507136, "rougeLsum_recall_stderr": 0.0037831592179613394}}, "1": {"article_DOC_summary": {"bleu": 1.552748129219279, "bleu_stderr": 0.09997239921399444, "rouge1_fmeasure": 0.17114372550513476, "rouge1_fmeasure_stderr": 0.0024604571497117834, "rouge1_precision": 0.12170201682595827, "rouge1_precision_stderr": 0.001826044289177986, "rouge1_recall": 0.30043563707916027, "rouge1_recall_stderr": 0.004233363825654979, "rouge2_fmeasure": 0.035379638697656535, "rouge2_fmeasure_stderr": 0.0014234913861855445, "rouge2_precision": 0.02491068120814432, "rouge2_precision_stderr": 0.0010056223310594503, "rouge2_recall": 0.06366125078253994, "rouge2_recall_stderr": 0.0026092736589792367, "rougeL_fmeasure": 0.13569122371994208, "rougeL_fmeasure_stderr": 0.0018778599571687325, "rougeL_precision": 0.09626651393384027, "rougeL_precision_stderr": 0.0013808637405283324, "rougeL_recall": 0.24005794800544122, "rougeL_recall_stderr": 0.0034002667798535, "rougeLsum_fmeasure": 0.13720484475514233, "rougeLsum_fmeasure_stderr": 0.0020361013127471544, "rougeLsum_precision": 0.09732882949507539, "rougeLsum_precision_stderr": 0.001491003899937052, "rougeLsum_recall": 0.24264339775958071, "rougeLsum_recall_stderr": 0.003652067540550535}}, "2": {"article_DOC_summary": {"bleu": 1.3601465950321643, "bleu_stderr": 0.0861315196923141, "rouge1_fmeasure": 0.17309895172368248, "rouge1_fmeasure_stderr": 0.002407562936005181, "rouge1_precision": 0.12278797123169674, "rouge1_precision_stderr": 0.001785131647152879, "rouge1_recall": 0.30543718274767545, "rouge1_recall_stderr": 0.004162923693892446, "rouge2_fmeasure": 0.03502857896138652, "rouge2_fmeasure_stderr": 0.0013726414538592514, "rouge2_precision": 0.0246072866788354, "rouge2_precision_stderr": 0.0009656088007101129, "rouge2_recall": 0.06340535253720762, "rouge2_recall_stderr": 0.0025614084712425903, "rougeL_fmeasure": 0.13712998116139988, "rougeL_fmeasure_stderr": 0.001853089467865337, "rougeL_precision": 0.09711482251051126, "rougeL_precision_stderr": 0.0013612129408171914, "rougeL_recall": 0.24338254656295813, "rougeL_recall_stderr": 0.0033638392897146316, "rougeLsum_fmeasure": 0.13797316536629922, "rougeLsum_fmeasure_stderr": 0.0020045397719122386, "rougeLsum_precision": 0.09765391570730775, "rougeLsum_precision_stderr": 0.0014675271246877423, "rougeLsum_recall": 0.24504917885902605, "rougeLsum_recall_stderr": 0.003598210298390468}}, "3": {"article_DOC_summary": {"bleu": 1.5289039831037767, "bleu_stderr": 0.08704589796771511, "rouge1_fmeasure": 0.17194468346922234, "rouge1_fmeasure_stderr": 0.0025657618680217883, "rouge1_precision": 0.12456236869961217, "rouge1_precision_stderr": 0.001979303032414647, "rouge1_recall": 0.2969986877323206, "rouge1_recall_stderr": 0.004379156286983872, "rouge2_fmeasure": 0.034720433489397975, "rouge2_fmeasure_stderr": 0.0013709396923174736, "rouge2_precision": 0.024705844817679887, "rouge2_precision_stderr": 0.000982394972116292, "rouge2_recall": 0.06152065262458846, "rouge2_recall_stderr": 0.002489362220975216, "rougeL_fmeasure": 0.13492154229574052, "rougeL_fmeasure_stderr": 0.0019677258292475, "rougeL_precision": 0.09749135882170305, "rougeL_precision_stderr": 0.0014954299008710392, "rougeL_recall": 0.23449083710611318, "rougeL_recall_stderr": 0.003493009897335876, "rougeLsum_fmeasure": 0.13730295741486614, "rougeLsum_fmeasure_stderr": 0.002115839730669299, "rougeLsum_precision": 0.09915225156332898, "rougeLsum_precision_stderr": 0.001597792391607745, "rougeLsum_recall": 0.23891448433195075, "rougeLsum_recall_stderr": 0.0037586328246274584}}, "4": {"article_DOC_summary": {"bleu": 0.7057885792239146, "bleu_stderr": 0.09633059952297361, "rouge1_fmeasure": 0.047178072114941544, "rouge1_fmeasure_stderr": 0.002616626424383668, "rouge1_precision": 0.038885594409457096, "rouge1_precision_stderr": 0.002307145421336748, "rouge1_recall": 0.07533535776380973, "rouge1_recall_stderr": 0.004278569489488177, "rouge2_fmeasure": 0.009740454133203196, "rouge2_fmeasure_stderr": 0.0008810391003143671, "rouge2_precision": 0.00767009703914481, "rouge2_precision_stderr": 0.0007436396195559962, "rouge2_recall": 0.016162073507849355, "rouge2_recall_stderr": 0.0015013180480267284, "rougeL_fmeasure": 0.03687428992461382, "rougeL_fmeasure_stderr": 0.0020423490604046203, "rougeL_precision": 0.030629416984214033, "rougeL_precision_stderr": 0.0018394051263934531, "rougeL_recall": 0.059033336787710354, "rougeL_recall_stderr": 0.0033568504886673342, "rougeLsum_fmeasure": 0.03798026533325551, "rougeLsum_fmeasure_stderr": 0.002122845512935527, "rougeLsum_precision": 0.03156727174883922, "rougeLsum_precision_stderr": 0.0018991973218119777, "rougeLsum_recall": 0.060734850890216574, "rougeLsum_recall_stderr": 0.003501714228117917}}, "5": {"article_DOC_summary": {"bleu": 1.4101701229157404e-16, "bleu_stderr": 7.284988438739496e-14, "rouge1_fmeasure": 0.0024087011729151905, "rouge1_fmeasure_stderr": 0.0006704731920197829, "rouge1_precision": 0.0020524139087283043, "rouge1_precision_stderr": 0.000588767108298375, "rouge1_recall": 0.003713621943684625, "rouge1_recall_stderr": 0.0010695365153013802, "rouge2_fmeasure": 0.0003686455308029473, "rouge2_fmeasure_stderr": 0.0001512143971336204, "rouge2_precision": 0.00028228247573819387, "rouge2_precision_stderr": 0.0001152152143834138, "rouge2_recall": 0.000611287528601624, "rouge2_recall_stderr": 0.0002553224416713872, "rougeL_fmeasure": 0.0017850468058708325, "rougeL_fmeasure_stderr": 0.0004908275382504802, "rougeL_precision": 0.0015369529867172342, "rougeL_precision_stderr": 0.00043863667780986944, "rougeL_recall": 0.0026922203626893403, "rougeL_recall_stderr": 0.0007595049688272029, "rougeLsum_fmeasure": 0.0019251742486571363, "rougeLsum_fmeasure_stderr": 0.0005450647907848718, "rougeLsum_precision": 0.0016840361597954422, "rougeLsum_precision_stderr": 0.0005020554020988375, "rougeLsum_recall": 0.0029125954622099127, "rougeLsum_recall_stderr": 0.0008341811116817512}}}}