Upload results.json
Browse files- results.json +1 -1
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"validation_set": {"ndcg_at_1": 0.828, "ndcg_at_3": 0.87764, "ndcg_at_5": 0.88263, "ndcg_at_10": 0.88981, "ndcg_at_20": 0.89434, "ndcg_at_50": 0.89829, "ndcg_at_100": 0.90018, "map_at_1": 0.828, "map_at_3": 0.86633, "map_at_5": 0.86913, "map_at_10": 0.87213, "map_at_20": 0.87336, "map_at_50": 0.87399, "map_at_100": 0.87413, "recall_at_1": 0.828, "recall_at_3": 0.91, "recall_at_5": 0.922, "recall_at_10": 0.944, "recall_at_20": 0.962, "recall_at_50": 0.982, "recall_at_100": 0.994, "precision_at_1": 0.828, "precision_at_3": 0.30333, "precision_at_5": 0.1844, "precision_at_10": 0.0944, "precision_at_20": 0.0481, "precision_at_50": 0.01964, "precision_at_100": 0.00994, "mrr_at_1": 0.824, "mrr_at_3": 0.8636666666666666, "mrr_at_5": 0.8669666666666667, "mrr_at_10": 0.8702642857142857, "mrr_at_20": 0.871532798573975, "mrr_at_50": 0.8722038761027637, "mrr_at_100": 0.872391544636181, "naucs_at_1_max": 0.21773711896722028, "naucs_at_1_std": 0.2788401902005385, "naucs_at_1_diff1": 0.9399880550387059, "naucs_at_3_max": 0.15050316422865537, "naucs_at_3_std": 0.6578586990351711, "naucs_at_3_diff1": 0.9553376906318075, "naucs_at_5_max": 0.1060954296248405, "naucs_at_5_std": 0.7918073212190876, "naucs_at_5_diff1": 0.9656443774090842, "naucs_at_10_max": -0.018807523009205383, "naucs_at_10_std": 0.86072762438309, "naucs_at_10_diff1": 0.9807422969187695, "naucs_at_20_max": -0.3403607056857979, "naucs_at_20_std": 0.9314708339476163, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": -0.5622471210706596, "naucs_at_50_std": 1.0, "naucs_at_50_diff1": 1.0, "naucs_at_100_max": -0.6288515406162857, "naucs_at_100_std": 1.0, "naucs_at_100_diff1": 1.0}, "syntheticDocQA_energy": {"ndcg_at_1": 0.94, "ndcg_at_3": 0.97155, "ndcg_at_5": 0.97155, "ndcg_at_10": 0.97155, "ndcg_at_20": 0.97155, "ndcg_at_50": 0.9735, "ndcg_at_100": 0.9735, "map_at_1": 0.94, "map_at_3": 0.965, "map_at_5": 0.965, "map_at_10": 0.965, "map_at_20": 0.965, "map_at_50": 0.96529, "map_at_100": 0.96529, "recall_at_1": 0.94, "recall_at_3": 0.99, "recall_at_5": 0.99, "recall_at_10": 0.99, "recall_at_20": 0.99, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.94, "precision_at_3": 0.33, "precision_at_5": 0.198, "precision_at_10": 0.099, "precision_at_20": 0.0495, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.95, "mrr_at_3": 0.97, "mrr_at_5": 0.97, "mrr_at_10": 0.97, "mrr_at_20": 0.97, "mrr_at_50": 0.9702941176470589, "mrr_at_100": 0.9702941176470589, "naucs_at_1_max": 0.5834111422346712, "naucs_at_1_std": -0.3165266106442549, "naucs_at_1_diff1": 0.9782135076252712, "naucs_at_3_max": 0.7222222222222157, "naucs_at_3_std": -0.5634920634921204, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 0.7222222222222276, "naucs_at_5_std": -0.5634920634920767, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 0.7222222222222276, "naucs_at_10_std": -0.5634920634920767, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 0.7222222222222276, "naucs_at_20_std": -0.5634920634920767, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "syntheticDocQA_healthcare_industry": {"ndcg_at_1": 0.98, "ndcg_at_3": 0.99262, "ndcg_at_5": 0.99262, "ndcg_at_10": 0.99262, "ndcg_at_20": 0.99262, "ndcg_at_50": 0.99262, "ndcg_at_100": 0.99262, "map_at_1": 0.98, "map_at_3": 0.99, "map_at_5": 0.99, "map_at_10": 0.99, "map_at_20": 0.99, "map_at_50": 0.99, "map_at_100": 0.99, "recall_at_1": 0.98, "recall_at_3": 1.0, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.98, "precision_at_3": 0.33333, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.98, "mrr_at_3": 0.99, "mrr_at_5": 0.99, "mrr_at_10": 0.99, "mrr_at_20": 0.99, "mrr_at_50": 0.99, "mrr_at_100": 0.99, "naucs_at_1_max": 0.795751633986929, "naucs_at_1_std": -0.8576097105508799, "naucs_at_1_diff1": 0.9346405228758133, "naucs_at_3_max": 1.0, "naucs_at_3_std": 1.0, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "syntheticDocQA_artificial_intelligence_test": {"ndcg_at_1": 0.99, "ndcg_at_3": 0.995, "ndcg_at_5": 0.995, "ndcg_at_10": 0.995, "ndcg_at_20": 0.995, "ndcg_at_50": 0.995, "ndcg_at_100": 0.995, "map_at_1": 0.99, "map_at_3": 0.99333, "map_at_5": 0.99333, "map_at_10": 0.99333, "map_at_20": 0.99333, "map_at_50": 0.99333, "map_at_100": 0.99333, "recall_at_1": 0.99, "recall_at_3": 1.0, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.99, "precision_at_3": 0.33333, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.99, "mrr_at_3": 0.9933333333333333, "mrr_at_5": 0.9933333333333333, "mrr_at_10": 0.9933333333333333, "mrr_at_20": 0.9933333333333333, "mrr_at_50": 0.9933333333333333, "mrr_at_100": 0.9933333333333333, "naucs_at_1_max": 1.0, "naucs_at_1_std": 0.8692810457516276, "naucs_at_1_diff1": 1.0, "naucs_at_3_max": 1.0, "naucs_at_3_std": 1.0, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "syntheticDocQA_government_reports": {"ndcg_at_1": 0.93, "ndcg_at_3": 0.97155, "ndcg_at_5": 0.97155, "ndcg_at_10": 0.97155, "ndcg_at_20": 0.97155, "ndcg_at_50": 0.97155, "ndcg_at_100": 0.97155, "map_at_1": 0.93, "map_at_3": 0.96167, "map_at_5": 0.96167, "map_at_10": 0.96167, "map_at_20": 0.96167, "map_at_50": 0.96167, "map_at_100": 0.96167, "recall_at_1": 0.93, "recall_at_3": 1.0, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.93, "precision_at_3": 0.33333, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.94, "mrr_at_3": 0.9666666666666667, "mrr_at_5": 0.9666666666666667, "mrr_at_10": 0.9666666666666667, "mrr_at_20": 0.9666666666666667, "mrr_at_50": 0.9666666666666667, "mrr_at_100": 0.9666666666666667, "naucs_at_1_max": 0.5822328931572631, "naucs_at_1_std": 0.673536081099108, "naucs_at_1_diff1": 0.8622782446311864, "naucs_at_3_max": 1.0, "naucs_at_3_std": 1.0, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "infovqa_subsampled": {"ndcg_at_1": 0.87, "ndcg_at_3": 0.89567, "ndcg_at_5": 0.9047, "ndcg_at_10": 0.90993, "ndcg_at_20": 0.91299, "ndcg_at_50": 0.91631, "ndcg_at_100": 0.91664, "map_at_1": 0.87, "map_at_3": 0.88933, "map_at_5": 0.89433, "map_at_10": 0.89652, "map_at_20": 0.89737, "map_at_50": 0.89796, "map_at_100": 0.89799, "recall_at_1": 0.87, "recall_at_3": 0.914, "recall_at_5": 0.936, "recall_at_10": 0.952, "recall_at_20": 0.964, "recall_at_50": 0.98, "recall_at_100": 0.982, "precision_at_1": 0.87, "precision_at_3": 0.30467, "precision_at_5": 0.1872, "precision_at_10": 0.0952, "precision_at_20": 0.0482, "precision_at_50": 0.0196, "precision_at_100": 0.00982, "mrr_at_1": 0.872, "mrr_at_3": 0.8903333333333334, "mrr_at_5": 0.8952333333333333, "mrr_at_10": 0.8973857142857142, "mrr_at_20": 0.8981114902641218, "mrr_at_50": 0.8987658806482948, "mrr_at_100": 0.8987961836785979, "naucs_at_1_max": 0.6437088054506402, "naucs_at_1_std": 0.05869806709620076, "naucs_at_1_diff1": 0.9304969266089019, "naucs_at_3_max": 0.6889344885240949, "naucs_at_3_std": 0.1136842333832744, "naucs_at_3_diff1": 0.9251405988752106, "naucs_at_5_max": 0.7031395891690008, "naucs_at_5_std": 0.26028536414565784, "naucs_at_5_diff1": 0.9203431372549006, "naucs_at_10_max": 0.8295012449424186, "naucs_at_10_std": 0.40411998132586524, "naucs_at_10_diff1": 0.9332788671023946, "naucs_at_20_max": 0.8841944185081392, "naucs_at_20_std": 0.49084448594252705, "naucs_at_20_diff1": 0.9337327523601999, "naucs_at_50_max": 0.9292717086834656, "naucs_at_50_std": 0.8650793650793516, "naucs_at_50_diff1": 0.9477124183006472, "naucs_at_100_max": 0.9214130096482952, "naucs_at_100_std": 0.8646125116713362, "naucs_at_100_diff1": 0.9419026870007192}, "docvqa_subsampled": {"ndcg_at_1": 0.478, "ndcg_at_3": 0.53969, "ndcg_at_5": 0.56094, "ndcg_at_10": 0.57779, "ndcg_at_20": 0.59308, "ndcg_at_50": 0.60319, "ndcg_at_100": 0.60994, "map_at_1": 0.478, "map_at_3": 0.525, "map_at_5": 0.5367, "map_at_10": 0.54367, "map_at_20": 0.54794, "map_at_50": 0.54964, "map_at_100": 0.55022, "recall_at_1": 0.478, "recall_at_3": 0.582, "recall_at_5": 0.634, "recall_at_10": 0.686, "recall_at_20": 0.746, "recall_at_50": 0.796, "recall_at_100": 0.838, "precision_at_1": 0.478, "precision_at_3": 0.194, "precision_at_5": 0.1268, "precision_at_10": 0.0686, "precision_at_20": 0.0373, "precision_at_50": 0.01592, "precision_at_100": 0.00838, "mrr_at_1": 0.482, "mrr_at_3": 0.5266666666666666, "mrr_at_5": 0.5375666666666667, "mrr_at_10": 0.5453944444444444, "mrr_at_20": 0.5492540835755232, "mrr_at_50": 0.5511465806213975, "mrr_at_100": 0.5515877171220239, "naucs_at_1_max": 0.17593079866611316, "naucs_at_1_std": 0.6646824085068347, "naucs_at_1_diff1": 0.8815686129321448, "naucs_at_3_max": 0.08521158919497512, "naucs_at_3_std": 0.7560230713519073, "naucs_at_3_diff1": 0.7969302187589984, "naucs_at_5_max": 0.02873191231399215, "naucs_at_5_std": 0.8071899242551022, "naucs_at_5_diff1": 0.7628796322315227, "naucs_at_10_max": -0.07012897967179643, "naucs_at_10_std": 0.874808909287446, "naucs_at_10_diff1": 0.7255395142360395, "naucs_at_20_max": -0.20666283697498458, "naucs_at_20_std": 0.9340741995875509, "naucs_at_20_diff1": 0.6769916807524927, "naucs_at_50_max": -0.25364250789497006, "naucs_at_50_std": 0.913686581994549, "naucs_at_50_diff1": 0.6194624533926231, "naucs_at_100_max": -0.33117544987926306, "naucs_at_100_std": 0.925380107024548, "naucs_at_100_diff1": 0.5889383698778079}, "arxivqa_subsampled": {"ndcg_at_1": 0.774, "ndcg_at_3": 0.82333, "ndcg_at_5": 0.83168, "ndcg_at_10": 0.84763, "ndcg_at_20": 0.85417, "ndcg_at_50": 0.86064, "ndcg_at_100": 0.86196, "map_at_1": 0.774, "map_at_3": 0.81133, "map_at_5": 0.81603, "map_at_10": 0.82249, "map_at_20": 0.82428, "map_at_50": 0.82536, "map_at_100": 0.82548, "recall_at_1": 0.774, "recall_at_3": 0.858, "recall_at_5": 0.878, "recall_at_10": 0.928, "recall_at_20": 0.954, "recall_at_50": 0.986, "recall_at_100": 0.994, "precision_at_1": 0.774, "precision_at_3": 0.286, "precision_at_5": 0.1756, "precision_at_10": 0.0928, "precision_at_20": 0.0477, "precision_at_50": 0.01972, "precision_at_100": 0.00994, "mrr_at_1": 0.774, "mrr_at_3": 0.8103333333333333, "mrr_at_5": 0.8154333333333332, "mrr_at_10": 0.8216412698412698, "mrr_at_20": 0.8235997861185941, "mrr_at_50": 0.8245970376853287, "mrr_at_100": 0.824717741545969, "naucs_at_1_max": 0.6956030338929966, "naucs_at_1_std": 0.034737257785584987, "naucs_at_1_diff1": 0.9216607432220811, "naucs_at_3_max": 0.7191420090012451, "naucs_at_3_std": 0.10592878346397475, "naucs_at_3_diff1": 0.8826691837320956, "naucs_at_5_max": 0.7499255380853105, "naucs_at_5_std": 0.12009531125080068, "naucs_at_5_diff1": 0.8803514602373368, "naucs_at_10_max": 0.8015224608361871, "naucs_at_10_std": 0.08101203444340487, "naucs_at_10_diff1": 0.8493749351592488, "naucs_at_20_max": 0.7641375390735974, "naucs_at_20_std": 0.1359355336337385, "naucs_at_20_diff1": 0.8352819388625017, "naucs_at_50_max": 0.7675736961451084, "naucs_at_50_std": 0.057823129251703305, "naucs_at_50_diff1": 0.8646125116713221, "naucs_at_100_max": 0.7424525365701481, "naucs_at_100_std": 0.49361967009023777, "naucs_at_100_diff1": 0.8638344226579416}, "tabfquad_subsampled": {"ndcg_at_1": 0.73571, "ndcg_at_3": 0.79375, "ndcg_at_5": 0.80251, "ndcg_at_10": 0.81636, "ndcg_at_20": 0.82817, "ndcg_at_50": 0.83832, "ndcg_at_100": 0.83954, "map_at_1": 0.73571, "map_at_3": 0.78036, "map_at_5": 0.78518, "map_at_10": 0.7909, "map_at_20": 0.79416, "map_at_50": 0.79589, "map_at_100": 0.79601, "recall_at_1": 0.73571, "recall_at_3": 0.83214, "recall_at_5": 0.85357, "recall_at_10": 0.89643, "recall_at_20": 0.94286, "recall_at_50": 0.99286, "recall_at_100": 1.0, "precision_at_1": 0.73571, "precision_at_3": 0.27738, "precision_at_5": 0.17071, "precision_at_10": 0.08964, "precision_at_20": 0.04714, "precision_at_50": 0.01986, "precision_at_100": 0.01, "mrr_at_1": 0.7357142857142858, "mrr_at_3": 0.7797619047619048, "mrr_at_5": 0.7838690476190475, "mrr_at_10": 0.7901204648526078, "mrr_at_20": 0.7934665929308786, "mrr_at_50": 0.7952056267189848, "mrr_at_100": 0.7953287794283443, "naucs_at_1_max": 0.3253261692793548, "naucs_at_1_std": 0.06312608068134669, "naucs_at_1_diff1": 0.8084496777604704, "naucs_at_3_max": 0.3105270885332547, "naucs_at_3_std": 0.07538225978983691, "naucs_at_3_diff1": 0.738448308408667, "naucs_at_5_max": 0.31633840963626375, "naucs_at_5_std": 0.09126654154094667, "naucs_at_5_diff1": 0.7328288707799767, "naucs_at_10_max": 0.1824121090591562, "naucs_at_10_std": -0.010980303373330084, "naucs_at_10_diff1": 0.6897377017367963, "naucs_at_20_max": 0.0169234360410811, "naucs_at_20_std": -0.31098272642390185, "naucs_at_20_diff1": 0.6254668534080327, "naucs_at_50_max": -0.3968253968254018, "naucs_at_50_std": -0.690943043884227, "naucs_at_50_diff1": 0.8611111111110865, "naucs_at_100_max": 1.0, "naucs_at_100_std": 1.0, "naucs_at_100_diff1": 1.0}, "tatdqa": {"ndcg_at_1": 0.66987, "ndcg_at_3": 0.77553, "ndcg_at_5": 0.79538, "ndcg_at_10": 0.80853, "ndcg_at_20": 0.81354, "ndcg_at_50": 0.81796, "ndcg_at_100": 0.81903, "map_at_1": 0.66987, "map_at_3": 0.75005, "map_at_5": 0.76108, "map_at_10": 0.76669, "map_at_20": 0.76814, "map_at_50": 0.76886, "map_at_100": 0.76895, "recall_at_1": 0.66987, "recall_at_3": 0.84907, "recall_at_5": 0.89717, "recall_at_10": 0.93686, "recall_at_20": 0.9561, "recall_at_50": 0.97835, "recall_at_100": 0.98497, "precision_at_1": 0.66987, "precision_at_3": 0.28302, "precision_at_5": 0.17943, "precision_at_10": 0.09369, "precision_at_20": 0.04781, "precision_at_50": 0.01957, "precision_at_100": 0.00985, "mrr_at_1": 0.6650631389055923, "mrr_at_3": 0.7486470234515935, "mrr_at_5": 0.7588995790739627, "mrr_at_10": 0.7649008771678646, "mrr_at_20": 0.766294670223957, "mrr_at_50": 0.7669629679577795, "mrr_at_100": 0.7670583172691432, "naucs_at_1_max": 0.2568730737793943, "naucs_at_1_std": -0.12808142195797126, "naucs_at_1_diff1": 0.8234815744151925, "naucs_at_3_max": 0.32424305760807287, "naucs_at_3_std": 0.0023177179676344157, "naucs_at_3_diff1": 0.7226885160746074, "naucs_at_5_max": 0.3697612224125756, "naucs_at_5_std": 0.11798240403444073, "naucs_at_5_diff1": 0.6833142525048825, "naucs_at_10_max": 0.49587555962938135, "naucs_at_10_std": 0.22528738928970488, "naucs_at_10_diff1": 0.7079879601645019, "naucs_at_20_max": 0.5475720475651525, "naucs_at_20_std": 0.3970102434994993, "naucs_at_20_diff1": 0.7067977425806262, "naucs_at_50_max": 0.6739875444992179, "naucs_at_50_std": 0.5159845368869518, "naucs_at_50_diff1": 0.7293116370600532, "naucs_at_100_max": 0.7557825589788986, "naucs_at_100_std": 0.5991543861889267, "naucs_at_100_diff1": 0.787492165390262}, "shift_project": {"ndcg_at_1": 0.67, "ndcg_at_3": 0.77464, "ndcg_at_5": 0.80778, "ndcg_at_10": 0.81467, "ndcg_at_20": 0.82248, "ndcg_at_50": 0.82621, "ndcg_at_100": 0.82621, "map_at_1": 0.67, "map_at_3": 0.75167, "map_at_5": 0.77017, "map_at_10": 0.77326, "map_at_20": 0.77553, "map_at_50": 0.77603, "map_at_100": 0.77603, "recall_at_1": 0.67, "recall_at_3": 0.84, "recall_at_5": 0.92, "recall_at_10": 0.94, "recall_at_20": 0.97, "recall_at_50": 0.99, "recall_at_100": 0.99, "precision_at_1": 0.67, "precision_at_3": 0.28, "precision_at_5": 0.184, "precision_at_10": 0.094, "precision_at_20": 0.0485, "precision_at_50": 0.0198, "precision_at_100": 0.0099, "mrr_at_1": 0.71, "mrr_at_3": 0.775, "mrr_at_5": 0.7935, "mrr_at_10": 0.7961666666666666, "mrr_at_20": 0.7976639928698752, "mrr_at_50": 0.7981844144772533, "mrr_at_100": 0.7981844144772533, "naucs_at_1_max": 0.24121819505341022, "naucs_at_1_std": -0.1675272130148469, "naucs_at_1_diff1": 0.8373652045843135, "naucs_at_3_max": 0.26165930289641504, "naucs_at_3_std": -0.26902307314678475, "naucs_at_3_diff1": 0.697379725085911, "naucs_at_5_max": -0.003501400560219899, "naucs_at_5_std": -0.6327614379084904, "naucs_at_5_diff1": 0.5134220354808603, "naucs_at_10_max": 0.02956738250855913, "naucs_at_10_std": -0.623171490818547, "naucs_at_10_diff1": 0.5325241207594161, "naucs_at_20_max": -0.20572673513850018, "naucs_at_20_std": -1.1190476190476195, "naucs_at_20_diff1": 0.6150015561780299, "naucs_at_50_max": 0.12278244631185525, "naucs_at_50_std": 0.12278244631185525, "naucs_at_50_diff1": 0.12278244631185525, "naucs_at_100_max": 0.12278244631185525, "naucs_at_100_std": 0.12278244631185525, "naucs_at_100_diff1": 0.12278244631185525}}
|
|
|
1 |
+
{"../colpali/data_dir/eval_vidore/tatdqa_test": {"ndcg_at_1": 0.67254, "ndcg_at_3": 0.77154, "ndcg_at_5": 0.79508, "ndcg_at_10": 0.80896, "ndcg_at_20": 0.81304, "ndcg_at_50": 0.81748, "ndcg_at_100": 0.81945, "map_at_1": 0.67254, "map_at_3": 0.74737, "map_at_5": 0.76058, "map_at_10": 0.76651, "map_at_20": 0.76767, "map_at_50": 0.76838, "map_at_100": 0.76855, "recall_at_1": 0.67254, "recall_at_3": 0.84143, "recall_at_5": 0.89793, "recall_at_10": 0.93985, "recall_at_20": 0.95565, "recall_at_50": 0.97813, "recall_at_100": 0.99028, "precision_at_1": 0.67254, "precision_at_3": 0.28048, "precision_at_5": 0.17959, "precision_at_10": 0.09399, "precision_at_20": 0.04778, "precision_at_50": 0.01956, "precision_at_100": 0.0099, "mrr_at_1": 0.6731470230862697, "mrr_at_3": 0.7493924665856622, "mrr_at_5": 0.7618772782503037, "mrr_at_10": 0.7678631699743487, "mrr_at_20": 0.7690541237462379, "mrr_at_50": 0.7697982847348657, "mrr_at_100": 0.7699707664933622, "naucs_at_1_max": 0.20966013356626328, "naucs_at_1_std": -0.22498694181030202, "naucs_at_1_diff1": 0.8203652560809781, "naucs_at_3_max": 0.23726706779023002, "naucs_at_3_std": -0.19910153497947758, "naucs_at_3_diff1": 0.7597696577891234, "naucs_at_5_max": 0.2593769522413535, "naucs_at_5_std": -0.07129523156315126, "naucs_at_5_diff1": 0.7196065288758066, "naucs_at_10_max": 0.39432310858925906, "naucs_at_10_std": 0.18495449574107942, "naucs_at_10_diff1": 0.7253268900545096, "naucs_at_20_max": 0.3930768921714602, "naucs_at_20_std": 0.2479610897886844, "naucs_at_20_diff1": 0.6996988771005946, "naucs_at_50_max": 0.3643319555228912, "naucs_at_50_std": 0.18533772677648166, "naucs_at_50_diff1": 0.7079255723972542, "naucs_at_100_max": 0.3009083862139714, "naucs_at_100_std": 0.09790868216215114, "naucs_at_100_diff1": 0.6858147175459396}, "../colpali/data_dir/eval_vidore/shiftproject_test": {"ndcg_at_1": 0.66, "ndcg_at_3": 0.76071, "ndcg_at_5": 0.79473, "ndcg_at_10": 0.80463, "ndcg_at_20": 0.80926, "ndcg_at_50": 0.81505, "ndcg_at_100": 0.81505, "map_at_1": 0.66, "map_at_3": 0.73667, "map_at_5": 0.75617, "map_at_10": 0.76037, "map_at_20": 0.76143, "map_at_50": 0.76231, "map_at_100": 0.76231, "recall_at_1": 0.66, "recall_at_3": 0.83, "recall_at_5": 0.91, "recall_at_10": 0.94, "recall_at_20": 0.96, "recall_at_50": 0.99, "recall_at_100": 0.99, "precision_at_1": 0.66, "precision_at_3": 0.27667, "precision_at_5": 0.182, "precision_at_10": 0.094, "precision_at_20": 0.048, "precision_at_50": 0.0198, "precision_at_100": 0.0099, "mrr_at_1": 0.67, "mrr_at_3": 0.7516666666666667, "mrr_at_5": 0.7681666666666667, "mrr_at_10": 0.7707063492063492, "mrr_at_20": 0.7723209002899405, "mrr_at_50": 0.7728784938335943, "mrr_at_100": 0.7728784938335943, "naucs_at_1_max": 0.08169869560888152, "naucs_at_1_std": -0.013707723455806894, "naucs_at_1_diff1": 0.7249493843141157, "naucs_at_3_max": 0.2874557380855627, "naucs_at_3_std": -0.13574621234109166, "naucs_at_3_diff1": 0.7652231961455855, "naucs_at_5_max": 0.24380122419338, "naucs_at_5_std": -0.35024380122419174, "naucs_at_5_diff1": 0.7388214545077295, "naucs_at_10_max": 0.3075785869903511, "naucs_at_10_std": -0.32718643012760934, "naucs_at_10_diff1": 0.7786336756925011, "naucs_at_20_max": -0.005952380952378498, "naucs_at_20_std": -0.9213352007469534, "naucs_at_20_diff1": 0.7700746965452813, "naucs_at_50_max": 0.35807656395892007, "naucs_at_50_std": 0.35807656395892007, "naucs_at_50_diff1": 0.7222222222222041, "naucs_at_100_max": 0.35807656395892007, "naucs_at_100_std": 0.35807656395892007, "naucs_at_100_diff1": 0.7222222222222041}, "../colpali/data_dir/eval_vidore/syntheticDocQA_artificial_intelligence_test": {"ndcg_at_1": 0.96, "ndcg_at_3": 0.97762, "ndcg_at_5": 0.98149, "ndcg_at_10": 0.98149, "ndcg_at_20": 0.98149, "ndcg_at_50": 0.98149, "ndcg_at_100": 0.98149, "map_at_1": 0.96, "map_at_3": 0.97333, "map_at_5": 0.97533, "map_at_10": 0.97533, "map_at_20": 0.97533, "map_at_50": 0.97533, "map_at_100": 0.97533, "recall_at_1": 0.96, "recall_at_3": 0.99, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.96, "precision_at_3": 0.33, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.97, "mrr_at_3": 0.98, "mrr_at_5": 0.982, "mrr_at_10": 0.982, "mrr_at_20": 0.982, "mrr_at_50": 0.982, "mrr_at_100": 0.982, "naucs_at_1_max": 0.7006302521008423, "naucs_at_1_std": 0.12184873949580065, "naucs_at_1_diff1": 0.96732026143791, "naucs_at_3_max": 0.7222222222222157, "naucs_at_3_std": -1.7399626517274398, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "../colpali/data_dir/eval_vidore/syntheticDocQA_government_reports_test": {"ndcg_at_1": 0.92, "ndcg_at_3": 0.96917, "ndcg_at_5": 0.96917, "ndcg_at_10": 0.96917, "ndcg_at_20": 0.96917, "ndcg_at_50": 0.96917, "ndcg_at_100": 0.96917, "map_at_1": 0.92, "map_at_3": 0.95833, "map_at_5": 0.95833, "map_at_10": 0.95833, "map_at_20": 0.95833, "map_at_50": 0.95833, "map_at_100": 0.95833, "recall_at_1": 0.92, "recall_at_3": 1.0, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.92, "precision_at_3": 0.33333, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.93, "mrr_at_3": 0.965, "mrr_at_5": 0.965, "mrr_at_10": 0.965, "mrr_at_20": 0.965, "mrr_at_50": 0.965, "mrr_at_100": 0.965, "naucs_at_1_max": 0.2525676937441629, "naucs_at_1_std": -0.10498366013071944, "naucs_at_1_diff1": 0.9325980392156855, "naucs_at_3_max": 1.0, "naucs_at_3_std": 1.0, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "../colpali/data_dir/eval_vidore/arxivqa_test_subsampled": {"ndcg_at_1": 0.738, "ndcg_at_3": 0.78171, "ndcg_at_5": 0.7942, "ndcg_at_10": 0.80782, "ndcg_at_20": 0.81884, "ndcg_at_50": 0.82731, "ndcg_at_100": 0.82893, "map_at_1": 0.738, "map_at_3": 0.77, "map_at_5": 0.777, "map_at_10": 0.78266, "map_at_20": 0.78589, "map_at_50": 0.78731, "map_at_100": 0.78745, "recall_at_1": 0.738, "recall_at_3": 0.816, "recall_at_5": 0.846, "recall_at_10": 0.888, "recall_at_20": 0.93, "recall_at_50": 0.972, "recall_at_100": 0.982, "precision_at_1": 0.738, "precision_at_3": 0.272, "precision_at_5": 0.1692, "precision_at_10": 0.0888, "precision_at_20": 0.0465, "precision_at_50": 0.01944, "precision_at_100": 0.00982, "mrr_at_1": 0.736, "mrr_at_3": 0.7696666666666666, "mrr_at_5": 0.7769666666666667, "mrr_at_10": 0.7824468253968254, "mrr_at_20": 0.7856496591987304, "mrr_at_50": 0.7868935264577809, "mrr_at_100": 0.7870774396931399, "naucs_at_1_max": 0.6441244857086442, "naucs_at_1_std": 0.06486619357906503, "naucs_at_1_diff1": 0.9230124477649233, "naucs_at_3_max": 0.6578972930967495, "naucs_at_3_std": 0.12599296291499376, "naucs_at_3_diff1": 0.8838934939342918, "naucs_at_5_max": 0.6557436425330749, "naucs_at_5_std": 0.14340361177831004, "naucs_at_5_diff1": 0.8845107832297585, "naucs_at_10_max": 0.6284243100649344, "naucs_at_10_std": 0.1057139475108209, "naucs_at_10_diff1": 0.8592228084415582, "naucs_at_20_max": 0.7293850873682812, "naucs_at_20_std": 0.22198212618380547, "naucs_at_20_diff1": 0.8774176337201546, "naucs_at_50_max": 0.6484260370814985, "naucs_at_50_std": 0.5022342270241381, "naucs_at_50_diff1": 0.8701147125516864, "naucs_at_100_max": 0.7380952380952427, "naucs_at_100_std": 0.6890756302521013, "naucs_at_100_diff1": 0.9092229484386288}, "../colpali/data_dir/eval_vidore/docvqa_test_subsampled": {"ndcg_at_1": 0.50776, "ndcg_at_3": 0.57475, "ndcg_at_5": 0.60013, "ndcg_at_10": 0.62058, "ndcg_at_20": 0.63501, "ndcg_at_50": 0.6462, "ndcg_at_100": 0.65513, "map_at_1": 0.50776, "map_at_3": 0.55876, "map_at_5": 0.57273, "map_at_10": 0.58137, "map_at_20": 0.58527, "map_at_50": 0.58695, "map_at_100": 0.58772, "recall_at_1": 0.50776, "recall_at_3": 0.62084, "recall_at_5": 0.68293, "recall_at_10": 0.74501, "recall_at_20": 0.80266, "recall_at_50": 0.86031, "recall_at_100": 0.91574, "precision_at_1": 0.50776, "precision_at_3": 0.20695, "precision_at_5": 0.13659, "precision_at_10": 0.0745, "precision_at_20": 0.04013, "precision_at_50": 0.01721, "precision_at_100": 0.00916, "mrr_at_1": 0.5121951219512195, "mrr_at_3": 0.5598669623059866, "mrr_at_5": 0.5732815964523282, "mrr_at_10": 0.5825062471403935, "mrr_at_20": 0.5859834952726223, "mrr_at_50": 0.5879193696680363, "mrr_at_100": 0.5886403970009746, "naucs_at_1_max": 0.569317766849609, "naucs_at_1_std": 0.2506731863692249, "naucs_at_1_diff1": 0.8940819253399216, "naucs_at_3_max": 0.5320242408844945, "naucs_at_3_std": 0.31139898363283913, "naucs_at_3_diff1": 0.8292659998128213, "naucs_at_5_max": 0.5013862652967811, "naucs_at_5_std": 0.4624341080727763, "naucs_at_5_diff1": 0.8045414688653402, "naucs_at_10_max": 0.5030904726189009, "naucs_at_10_std": 0.533507880084528, "naucs_at_10_diff1": 0.7729429212153898, "naucs_at_20_max": 0.45929954704965514, "naucs_at_20_std": 0.6220482743867082, "naucs_at_20_diff1": 0.7445601717421665, "naucs_at_50_max": 0.3566491997151963, "naucs_at_50_std": 0.6976932061646426, "naucs_at_50_diff1": 0.764513580811436, "naucs_at_100_max": 0.2787609440415055, "naucs_at_100_std": 0.7732527040792341, "naucs_at_100_diff1": 0.797647076714487}, "../colpali/data_dir/eval_vidore/syntheticDocQA_healthcare_industry_test": {"ndcg_at_1": 0.99, "ndcg_at_3": 0.99631, "ndcg_at_5": 0.99631, "ndcg_at_10": 0.99631, "ndcg_at_20": 0.99631, "ndcg_at_50": 0.99631, "ndcg_at_100": 0.99631, "map_at_1": 0.99, "map_at_3": 0.995, "map_at_5": 0.995, "map_at_10": 0.995, "map_at_20": 0.995, "map_at_50": 0.995, "map_at_100": 0.995, "recall_at_1": 0.99, "recall_at_3": 1.0, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.99, "precision_at_3": 0.33333, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.99, "mrr_at_3": 0.995, "mrr_at_5": 0.995, "mrr_at_10": 0.995, "mrr_at_20": 0.995, "mrr_at_50": 0.995, "mrr_at_100": 0.995, "naucs_at_1_max": -0.5634920634920657, "naucs_at_1_std": -0.5634920634920657, "naucs_at_1_diff1": 1.0, "naucs_at_3_max": 1.0, "naucs_at_3_std": 1.0, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "../colpali/data_dir/eval_vidore/infovqa_test_subsampled": {"ndcg_at_1": 0.86235, "ndcg_at_3": 0.90158, "ndcg_at_5": 0.90567, "ndcg_at_10": 0.91363, "ndcg_at_20": 0.91519, "ndcg_at_50": 0.91877, "ndcg_at_100": 0.91943, "map_at_1": 0.86235, "map_at_3": 0.89204, "map_at_5": 0.89426, "map_at_10": 0.89761, "map_at_20": 0.89804, "map_at_50": 0.89861, "map_at_100": 0.89866, "recall_at_1": 0.86235, "recall_at_3": 0.92915, "recall_at_5": 0.93927, "recall_at_10": 0.96356, "recall_at_20": 0.96964, "recall_at_50": 0.98785, "recall_at_100": 0.9919, "precision_at_1": 0.86235, "precision_at_3": 0.30972, "precision_at_5": 0.18785, "precision_at_10": 0.09636, "precision_at_20": 0.04848, "precision_at_50": 0.01976, "precision_at_100": 0.00992, "mrr_at_1": 0.8603238866396761, "mrr_at_3": 0.8903508771929824, "mrr_at_5": 0.8931848852901485, "mrr_at_10": 0.8970864661654135, "mrr_at_20": 0.8973279605897335, "mrr_at_50": 0.8978873365734087, "mrr_at_100": 0.8979428941866536, "naucs_at_1_max": 0.6141087424038754, "naucs_at_1_std": -0.030722276569984355, "naucs_at_1_diff1": 0.9202550833899372, "naucs_at_3_max": 0.6449024060358626, "naucs_at_3_std": -0.1880330467463847, "naucs_at_3_diff1": 0.9225365697409679, "naucs_at_5_max": 0.6732032874315905, "naucs_at_5_std": -0.1432252604677148, "naucs_at_5_diff1": 0.9232372044252183, "naucs_at_10_max": 0.8191686971467412, "naucs_at_10_std": 0.22617716320424064, "naucs_at_10_diff1": 0.9401180393458267, "naucs_at_20_max": 0.8589054528404234, "naucs_at_20_std": 0.1941650857143643, "naucs_at_20_diff1": 0.9640708236075015, "naucs_at_50_max": 0.9319439680295378, "naucs_at_50_std": 0.6371519734027287, "naucs_at_50_diff1": 0.9782330909892136, "naucs_at_100_max": 0.8979159520443043, "naucs_at_100_std": 0.7864897480536438, "naucs_at_100_diff1": 0.9673496364838197}, "../colpali/data_dir/eval_vidore/syntheticDocQA_energy_test": {"ndcg_at_1": 0.93, "ndcg_at_3": 0.95524, "ndcg_at_5": 0.95911, "ndcg_at_10": 0.96267, "ndcg_at_20": 0.96267, "ndcg_at_50": 0.96457, "ndcg_at_100": 0.96457, "map_at_1": 0.93, "map_at_3": 0.95, "map_at_5": 0.952, "map_at_10": 0.95367, "map_at_20": 0.95367, "map_at_50": 0.95394, "map_at_100": 0.95394, "recall_at_1": 0.93, "recall_at_3": 0.97, "recall_at_5": 0.98, "recall_at_10": 0.99, "recall_at_20": 0.99, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.93, "precision_at_3": 0.32333, "precision_at_5": 0.196, "precision_at_10": 0.099, "precision_at_20": 0.0495, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.93, "mrr_at_3": 0.95, "mrr_at_5": 0.9545, "mrr_at_10": 0.9545, "mrr_at_20": 0.9545, "mrr_at_50": 0.9547941176470589, "mrr_at_100": 0.9547941176470589, "naucs_at_1_max": 0.5122715752967848, "naucs_at_1_std": -0.8083900226757392, "naucs_at_1_diff1": 0.9626517273576113, "naucs_at_3_max": 0.7587924058512326, "naucs_at_3_std": -0.9752567693744157, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 0.6381886087768404, "naucs_at_5_std": -1.7399626517273414, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 0.7222222222222276, "naucs_at_10_std": -1.7399626517273863, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 0.7222222222222276, "naucs_at_20_std": -1.7399626517273863, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "../colpali/data_dir/eval_vidore/tabfquad_test_subsampled": {"ndcg_at_1": 0.74286, "ndcg_at_3": 0.80578, "ndcg_at_5": 0.81331, "ndcg_at_10": 0.83414, "ndcg_at_20": 0.84421, "ndcg_at_50": 0.84981, "ndcg_at_100": 0.84981, "map_at_1": 0.74286, "map_at_3": 0.79048, "map_at_5": 0.79476, "map_at_10": 0.80337, "map_at_20": 0.80621, "map_at_50": 0.80708, "map_at_100": 0.80708, "recall_at_1": 0.74286, "recall_at_3": 0.85, "recall_at_5": 0.86786, "recall_at_10": 0.93214, "recall_at_20": 0.97143, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.74286, "precision_at_3": 0.28333, "precision_at_5": 0.17357, "precision_at_10": 0.09321, "precision_at_20": 0.04857, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.7392857142857143, "mrr_at_3": 0.7869047619047619, "mrr_at_5": 0.7924404761904762, "mrr_at_10": 0.8010884353741496, "mrr_at_20": 0.8036055972505552, "mrr_at_50": 0.8044824919583908, "mrr_at_100": 0.8044824919583908, "naucs_at_1_max": 0.2579714168809912, "naucs_at_1_std": 0.06030804302080844, "naucs_at_1_diff1": 0.8073342880523727, "naucs_at_3_max": 0.23897075914648253, "naucs_at_3_std": 0.10569011203570283, "naucs_at_3_diff1": 0.7397378085630618, "naucs_at_5_max": 0.23385982745588652, "naucs_at_5_std": 0.08519039799827996, "naucs_at_5_diff1": 0.6976698725467213, "naucs_at_10_max": 0.20789719396530357, "naucs_at_10_std": -0.05779153766769964, "naucs_at_10_diff1": 0.7551968155683331, "naucs_at_20_max": 0.07142857142857674, "naucs_at_20_std": -0.1817810457516319, "naucs_at_20_diff1": 0.7208216619981378, "naucs_at_50_max": 1.0, "naucs_at_50_std": 1.0, "naucs_at_50_diff1": 1.0, "naucs_at_100_max": 1.0, "naucs_at_100_std": 1.0, "naucs_at_100_diff1": 1.0}}
|