thaottn commited on
Commit
f07ebbf
1 Parent(s): 67eb128

Upload artifacts (small scale)

Browse files
small_scale/results.jsonl CHANGED
@@ -1,40 +1,40 @@
1
- {"key": "vtab/caltech101", "dataset": "Caltech-101", "metrics": {"acc1": 0.39178307313064914, "acc5": 0.6898931799506984, "mean_per_class_recall": 0.3573535575129946, "main_metric": 0.3573535575129946}}
2
- {"key": "cifar10", "dataset": "CIFAR-10", "metrics": {"acc1": 0.5789, "acc5": 0.9738, "mean_per_class_recall": 0.5789, "main_metric": 0.5789}}
3
- {"key": "vtab/cifar100", "dataset": "CIFAR-100", "metrics": {"acc1": 0.2905, "acc5": 0.6048, "mean_per_class_recall": 0.2905, "main_metric": 0.2905}}
4
- {"key": "vtab/clevr_count_all", "dataset": "CLEVR Counts", "metrics": {"acc1": 0.14933333333333335, "acc5": 0.6446, "mean_per_class_recall": 0.14846225210925348, "main_metric": 0.14933333333333335}}
5
- {"key": "vtab/clevr_closest_object_distance", "dataset": "CLEVR Distance", "metrics": {"acc1": 0.203, "acc5": 0.9186666666666666, "mean_per_class_recall": 0.15483015211598952, "main_metric": 0.203}}
6
- {"key": "country211", "dataset": "Country211", "metrics": {"acc1": 0.013696682464454976, "acc5": 0.043886255924170614, "mean_per_class_recall": 0.013696682464454976, "main_metric": 0.013696682464454976}}
7
- {"key": "vtab/dtd", "dataset": "Describable Textures", "metrics": {"acc1": 0.12180851063829787, "acc5": 0.2898936170212766, "mean_per_class_recall": 0.12180851063829787, "main_metric": 0.12180851063829787}}
8
- {"key": "vtab/eurosat", "dataset": "EuroSAT", "metrics": {"acc1": 0.29444444444444445, "acc5": 0.7644444444444445, "mean_per_class_recall": 0.2946656919107774, "main_metric": 0.29444444444444445}}
9
- {"key": "fgvc_aircraft", "dataset": "FGVC Aircraft", "metrics": {"acc1": 0.010801080108010801, "acc5": 0.0501050105010501, "mean_per_class_recall": 0.010659536541889482, "main_metric": 0.010659536541889482}}
10
- {"key": "food101", "dataset": "Food-101", "metrics": {"acc1": 0.10847524752475247, "acc5": 0.28855445544554453, "mean_per_class_recall": 0.10847524752475245, "main_metric": 0.10847524752475247}}
11
- {"key": "gtsrb", "dataset": "GTSRB", "metrics": {"acc1": 0.05985748218527316, "acc5": 0.23689627870150434, "mean_per_class_recall": 0.08254117998430435, "main_metric": 0.05985748218527316}}
12
- {"key": "imagenet1k", "dataset": "ImageNet 1k", "metrics": {"acc1": 0.07974, "acc5": 0.2004, "mean_per_class_recall": 0.07974, "per_class_acc": [0.0, 0.32, 0.52, 0.0, 0.04, 0.0, 0.0, 0.18, 0.02, 0.0, 0.0, 0.4, 0.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.02, 0.0, 0.04, 0.12, 0.06, 0.12, 0.0, 0.0, 0.0, 0.04, 0.0, 0.0, 0.02, 0.08, 0.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.2, 0.0, 0.1, 0.0, 0.0, 0.1, 0.0, 0.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.08, 0.0, 0.0, 0.16, 0.0, 0.0, 0.0, 0.04, 0.0, 0.0, 0.02, 0.0, 0.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.02, 0.0, 0.2, 0.0, 0.0, 0.06, 0.2, 0.0, 0.1, 0.24, 0.0, 0.0, 0.0, 0.18, 0.08, 0.06, 0.0, 0.0, 0.0, 0.0, 0.26, 0.0, 0.2, 0.0, 0.0, 0.0, 0.2, 0.0, 0.0, 0.0, 0.02, 0.06, 0.0, 0.12, 0.18, 0.0, 0.0, 0.0, 0.0, 0.06, 0.0, 0.12, 0.0, 0.0, 0.0, 0.02, 0.0, 0.0, 0.14, 0.0, 0.02, 0.02, 0.0, 0.18, 0.18, 0.0, 0.22, 0.2, 0.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.08, 0.14, 0.0, 0.02, 0.08, 0.0, 0.0, 0.02, 0.0, 0.0, 0.0, 0.1, 0.02, 0.02, 0.04, 0.0, 0.0, 0.04, 0.0, 0.0, 0.0, 0.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.04, 0.02, 0.0, 0.0, 0.0, 0.0, 0.02, 0.0, 0.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.02, 0.0, 0.02, 0.0, 0.02, 0.0, 0.0, 0.08, 0.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.2, 0.0, 0.0, 0.0, 0.06, 0.02, 0.0, 0.02, 0.0, 0.0, 0.08, 0.0, 0.0, 0.0, 0.0, 0.02, 0.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.06, 0.18, 0.1, 0.02, 0.0, 0.18, 0.28, 0.0, 0.0, 0.08, 0.22, 0.0, 0.0, 0.0, 0.06, 0.0, 0.02, 0.0, 0.0, 0.02, 0.0, 0.04, 0.16, 0.0, 0.0, 0.06, 0.0, 0.0, 0.0, 0.22, 0.12, 0.0, 0.0, 0.0, 0.12, 0.0, 0.02, 0.0, 0.0, 0.02, 0.0, 0.0, 0.0, 0.06, 0.0, 0.0, 0.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.14, 0.04, 0.0, 0.26, 0.0, 0.02, 0.16, 0.3, 0.24, 0.0, 0.04, 0.1, 0.18, 0.02, 0.02, 0.5, 0.0, 0.0, 0.1, 0.0, 0.14, 0.2, 0.02, 0.06, 0.0, 0.02, 0.0, 0.0, 0.02, 0.0, 0.04, 0.0, 0.0, 0.1, 0.02, 0.0, 0.0, 0.0, 0.08, 0.0, 0.1, 0.0, 0.62, 0.28, 0.02, 0.02, 0.02, 0.0, 0.0, 0.0, 0.14, 0.0, 0.24, 0.0, 0.0, 0.0, 0.0, 0.22, 0.02, 0.36, 0.12, 0.18, 0.0, 0.04, 0.0, 0.08, 0.24, 0.02, 0.2, 0.0, 0.0, 0.14, 0.0, 0.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.08, 0.2, 0.0, 0.0, 0.0, 0.26, 0.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.2, 0.0, 0.04, 0.08, 0.0, 0.0, 0.06, 0.06, 0.02, 0.22, 0.02, 0.02, 0.0, 0.0, 0.08, 0.0, 0.04, 0.08, 0.0, 0.2, 0.0, 0.02, 0.04, 0.08, 0.16, 0.04, 0.0, 0.36, 0.34, 0.02, 0.12, 0.0, 0.06, 0.02, 0.08, 0.06, 0.12, 0.02, 0.04, 0.06, 0.0, 0.04, 0.12, 0.0, 0.02, 0.0, 0.42, 0.02, 0.1, 0.0, 0.0, 0.02, 0.0, 0.0, 0.0, 0.02, 0.08, 0.0, 0.22, 0.0, 0.0, 0.08, 0.12, 0.16, 0.16, 0.26, 0.02, 0.08, 0.06, 0.14, 0.0, 0.0, 0.02, 0.0, 0.28, 0.22, 0.0, 0.02, 0.06, 0.44, 0.0, 0.0, 0.0, 0.04, 0.0, 0.02, 0.16, 0.4, 0.2, 0.0, 0.02, 0.04, 0.04, 0.18, 0.02, 0.16, 0.68, 0.3, 0.22, 0.12, 0.32, 0.08, 0.0, 0.0, 0.3, 0.24, 0.0, 0.3, 0.12, 0.04, 0.06, 0.0, 0.12, 0.02, 0.0, 0.0, 0.2, 0.56, 0.14, 0.04, 0.0, 0.18, 0.12, 0.04, 0.06, 0.0, 0.0, 0.04, 0.06, 0.06, 0.2, 0.26, 0.26, 0.0, 0.0, 0.12, 0.02, 0.0, 0.06, 0.06, 0.0, 0.14, 0.02, 0.0, 0.0, 0.0, 0.24, 0.12, 0.06, 0.06, 0.0, 0.08, 0.1, 0.4, 0.08, 0.06, 0.0, 0.1, 0.26, 0.04, 0.1, 0.12, 0.0, 0.0, 0.0, 0.06, 0.06, 0.02, 0.04, 0.48, 0.06, 0.42, 0.02, 0.0, 0.2, 0.14, 0.32, 0.08, 0.2, 0.0, 0.06, 0.04, 0.3, 0.06, 0.1, 0.08, 0.04, 0.0, 0.08, 0.24, 0.08, 0.06, 0.0, 0.04, 0.34, 0.14, 0.2, 0.24, 0.1, 0.32, 0.28, 0.16, 0.08, 0.26, 0.0, 0.0, 0.04, 0.0, 0.0, 0.24, 0.06, 0.04, 0.02, 0.08, 0.06, 0.0, 0.4, 0.0, 0.04, 0.12, 0.08, 0.0, 0.0, 0.02, 0.06, 0.0, 0.06, 0.0, 0.16, 0.38, 0.06, 0.32, 0.06, 0.0, 0.02, 0.26, 0.2, 0.0, 0.16, 0.0, 0.02, 0.52, 0.3, 0.06, 0.02, 0.1, 0.06, 0.0, 0.32, 0.02, 0.26, 0.08, 0.02, 0.04, 0.0, 0.02, 0.02, 0.2, 0.04, 0.0, 0.04, 0.64, 0.0, 0.0, 0.0, 0.04, 0.0, 0.0, 0.0, 0.04, 0.0, 0.0, 0.08, 0.02, 0.0, 0.08, 0.0, 0.18, 0.06, 0.0, 0.0, 0.08, 0.0, 0.0, 0.16, 0.06, 0.26, 0.06, 0.02, 0.2, 0.02, 0.08, 0.36, 0.06, 0.04, 0.0, 0.02, 0.0, 0.02, 0.0, 0.36, 0.06, 0.04, 0.38, 0.0, 0.0, 0.04, 0.04, 0.12, 0.42, 0.06, 0.02, 0.06, 0.1, 0.0, 0.0, 0.02, 0.02, 0.14, 0.32, 0.0, 0.02, 0.2, 0.0, 0.2, 0.02, 0.0, 0.34, 0.0, 0.0, 0.0, 0.0, 0.08, 0.0, 0.0, 0.0, 0.0, 0.32, 0.14, 0.32, 0.16, 0.0, 0.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.06, 0.0, 0.04, 0.06, 0.24, 0.14, 0.08, 0.04, 0.22, 0.0, 0.0, 0.2, 0.18, 0.18, 0.0, 0.14, 0.12, 0.02, 0.08, 0.0, 0.02, 0.28, 0.0, 0.08, 0.0, 0.0, 0.06, 0.06, 0.04, 0.14, 0.14, 0.04, 0.36, 0.2, 0.04, 0.08, 0.0, 0.0, 0.04, 0.08, 0.2, 0.0, 0.0, 0.02, 0.04, 0.0, 0.1, 0.0, 0.02, 0.08, 0.0, 0.26, 0.12, 0.08, 0.0, 0.0, 0.08, 0.04, 0.0, 0.2, 0.06, 0.0, 0.0, 0.0, 0.0, 0.4, 0.02, 0.02, 0.0, 0.24, 0.22, 0.0, 0.56, 0.0, 0.0, 0.02, 0.06, 0.04, 0.0, 0.26, 0.14, 0.0, 0.04, 0.02, 0.1, 0.14, 0.0, 0.32, 0.1, 0.14, 0.2, 0.16, 0.0, 0.1, 0.0, 0.26, 0.02, 0.1, 0.04, 0.4, 0.0, 0.16, 0.0, 0.06, 0.14, 0.0, 0.0, 0.0, 0.0, 0.1, 0.02, 0.32, 0.0, 0.08, 0.02, 0.0, 0.36, 0.1, 0.0, 0.12, 0.04, 0.1, 0.14, 0.3, 0.04, 0.0, 0.02, 0.02, 0.18, 0.06, 0.0, 0.06, 0.12, 0.24, 0.04, 0.1, 0.2, 0.02, 0.02, 0.14, 0.08, 0.0, 0.12, 0.02, 0.1, 0.0, 0.02, 0.0, 0.32, 0.0, 0.0, 0.26, 0.06, 0.06, 0.46, 0.08, 0.48, 0.0, 0.08, 0.04, 0.22, 0.04, 0.1, 0.02, 0.24, 0.14, 0.14, 0.2, 0.02, 0.08, 0.12, 0.08, 0.0, 0.12, 0.0, 0.0, 0.0, 0.08, 0.16, 0.1, 0.06, 0.02, 0.06, 0.04, 0.26, 0.12, 0.7, 0.34, 0.18, 0.38, 0.1, 0.0, 0.62, 0.0, 0.32, 0.0, 0.02, 0.3, 0.0, 0.04, 0.06, 0.02, 0.24, 0.3, 0.02, 0.64, 0.18, 0.18, 0.38, 0.22, 0.1, 0.02, 0.28, 0.1, 0.12, 0.02, 0.0, 0.08, 0.0, 0.3, 0.02, 0.16, 0.0, 0.06, 0.1, 0.0, 0.0, 0.5, 0.28, 0.0, 0.06, 0.1, 0.34, 0.44, 0.14, 0.08, 0.04, 0.0, 0.08, 0.02, 0.24, 0.0, 0.12, 0.4, 0.76, 0.0, 0.0, 0.0, 0.22, 0.02, 0.16, 0.38, 0.22, 0.6, 0.64, 0.54, 0.0, 0.06, 0.0, 0.0, 0.02, 0.12, 0.0, 0.0, 0.0, 0.0, 0.26, 0.0, 0.2, 0.06], "main_metric": 0.07974}}
13
- {"key": "imagenet_sketch", "dataset": "ImageNet Sketch", "metrics": {"acc1": 0.03810253689402425, "acc5": 0.10137750790937138, "mean_per_class_recall": 0.03808588235294118, "main_metric": 0.03810253689402425}}
14
- {"key": "imagenetv2", "dataset": "ImageNet v2", "metrics": {"acc1": 0.0656, "acc5": 0.1742, "mean_per_class_recall": 0.06559999999999999, "main_metric": 0.0656}}
15
- {"key": "imagenet-a", "dataset": "ImageNet-A", "metrics": {"acc1": 0.0196, "acc5": 0.08573333333333333, "mean_per_class_recall": 0.025413748211319614, "main_metric": 0.0196}}
16
- {"key": "imagenet-o", "dataset": "ImageNet-O", "metrics": {"acc1": 0.182, "acc5": 0.4225, "mean_per_class_recall": 0.18094051352843923, "main_metric": 0.182}}
17
- {"key": "imagenet-r", "dataset": "ImageNet-R", "metrics": {"acc1": 0.1151, "acc5": 0.2720666666666667, "mean_per_class_recall": 0.10459894836517161, "main_metric": 0.1151}}
18
- {"key": "vtab/kitti_closest_vehicle_distance", "dataset": "KITTI Vehicle Distance", "metrics": {"acc1": 0.2770745428973277, "acc5": null, "mean_per_class_recall": 0.19617354219959826, "main_metric": 0.2770745428973277}}
19
- {"key": "mnist", "dataset": "MNIST", "metrics": {"acc1": 0.1533, "acc5": 0.6329, "mean_per_class_recall": 0.1401536846821356, "main_metric": 0.1533}}
20
- {"key": "objectnet", "dataset": "ObjectNet", "metrics": {"acc1": 0.07575104985463552, "acc5": 0.21024012059868633, "mean_per_class_recall": 0.07514246578043296, "main_metric": 0.07575104985463552}}
21
- {"key": "vtab/flowers", "dataset": "Oxford Flowers-102", "metrics": {"acc1": 0.08928281021304277, "acc5": 0.26524638152545127, "mean_per_class_recall": 0.08789523635259217, "main_metric": 0.08789523635259217}}
22
- {"key": "vtab/pets", "dataset": "Oxford-IIIT Pet", "metrics": {"acc1": 0.09484873262469337, "acc5": 0.30471518124829655, "mean_per_class_recall": 0.09494239387497813, "main_metric": 0.09494239387497813}}
23
- {"key": "voc2007", "dataset": "Pascal VOC 2007", "metrics": {"acc1": 0.31316773504273504, "acc5": 0.6167200854700855, "mean_per_class_recall": 0.42820729914310407, "main_metric": 0.31316773504273504}}
24
- {"key": "vtab/pcam", "dataset": "PatchCamelyon", "metrics": {"acc1": 0.5045166015625, "acc5": null, "mean_per_class_recall": 0.5047282045024709, "main_metric": 0.5045166015625}}
25
  {"key": "renderedsst2", "dataset": "Rendered SST2", "metrics": {"acc1": 0.500823723228995, "acc5": null, "mean_per_class_recall": 0.5, "main_metric": 0.500823723228995}}
26
- {"key": "vtab/resisc45", "dataset": "RESISC45", "metrics": {"acc1": 0.1226984126984127, "acc5": 0.39571428571428574, "mean_per_class_recall": 0.12415206577608122, "main_metric": 0.1226984126984127}}
27
- {"key": "cars", "dataset": "Stanford Cars", "metrics": {"acc1": 0.024126352443725903, "acc5": 0.10707623429921652, "mean_per_class_recall": 0.02449931508465049, "main_metric": 0.024126352443725903}}
28
- {"key": "stl10", "dataset": "STL-10", "metrics": {"acc1": 0.629375, "acc5": 0.974625, "mean_per_class_recall": 0.6293749999999999, "main_metric": 0.629375}}
29
- {"key": "sun397", "dataset": "SUN397", "metrics": {"acc1": 0.18546444268716553, "acc5": 0.4209316438935579, "mean_per_class_recall": 0.15099406078322206, "main_metric": 0.18546444268716553}}
30
- {"key": "vtab/svhn", "dataset": "SVHN", "metrics": {"acc1": 0.08209127228027044, "acc5": 0.5176321450522434, "mean_per_class_recall": 0.11271610243558924, "main_metric": 0.08209127228027044}}
31
- {"key": "retrieval/flickr_1k_test_image_text_retrieval", "dataset": "Flickr", "metrics": {"image_retrieval_recall@1": 0.10100000351667404, "text_retrieval_recall@1": 0.1509999930858612, "image_retrieval_recall@5": 0.26420000195503235, "text_retrieval_recall@5": 0.35499998927116394, "image_retrieval_recall@10": 0.3646000027656555, "text_retrieval_recall@10": 0.47099998593330383, "mean_recall@1": 0.12599999830126762, "main_metric": 0.12599999830126762}}
32
- {"key": "retrieval/mscoco_2014_5k_test_image_text_retrieval", "dataset": "MSCOCO", "metrics": {"image_retrieval_recall@1": 0.06501399725675583, "text_retrieval_recall@1": 0.09960000216960907, "image_retrieval_recall@5": 0.17461015284061432, "text_retrieval_recall@5": 0.24480000138282776, "image_retrieval_recall@10": 0.2522191107273102, "text_retrieval_recall@10": 0.3425999879837036, "mean_recall@1": 0.08230699971318245, "main_metric": 0.08230699971318245}}
33
- {"key": "misc/winogavil", "dataset": "WinoGAViL", "metrics": {"avg_jaccard_score": 0.40335591997113185, "jaccard_score_5": 0.4498232323232323, "jaccard_score_6": 0.42147828173746105, "jaccard_score_10": 0.3219092331768388, "jaccard_score_12": 0.28229862038273257, "jaccard_score_5-6": 0.4352897748246586, "jaccard_score_10-12": 0.3020575443292071, "main_metric": 0.3020575443292071}}
34
- {"key": "wilds/iwildcam", "dataset": "iWildCam", "metrics": {"acc1": 0.12967680119651329, "acc5": 0.21635390619522796, "mean_per_class_recall": 0.013105174040215044, "acc_avg": 0.12967680394649506, "recall-macro_all": 0.013105174040215044, "F1-macro_all": 0.006112641604645059, "main_metric": 0.006112641604645059}}
35
- {"key": "wilds/camelyon17", "dataset": "Camelyon17", "metrics": {"acc1": 0.5000470289463165, "acc5": null, "mean_per_class_recall": 0.5000470289463165, "acc_avg": 0.5000470280647278, "acc_slide:0": NaN, "count_slide:0": 0.0, "acc_slide:1": NaN, "count_slide:1": 0.0, "acc_slide:2": NaN, "count_slide:2": 0.0, "acc_slide:3": NaN, "count_slide:3": 0.0, "acc_slide:4": NaN, "count_slide:4": 0.0, "acc_slide:5": NaN, "count_slide:5": 0.0, "acc_slide:6": NaN, "count_slide:6": 0.0, "acc_slide:7": NaN, "count_slide:7": 0.0, "acc_slide:8": NaN, "count_slide:8": 0.0, "acc_slide:9": NaN, "count_slide:9": 0.0, "acc_slide:10": NaN, "count_slide:10": 0.0, "acc_slide:11": NaN, "count_slide:11": 0.0, "acc_slide:12": NaN, "count_slide:12": 0.0, "acc_slide:13": NaN, "count_slide:13": 0.0, "acc_slide:14": NaN, "count_slide:14": 0.0, "acc_slide:15": NaN, "count_slide:15": 0.0, "acc_slide:16": NaN, "count_slide:16": 0.0, "acc_slide:17": NaN, "count_slide:17": 0.0, "acc_slide:18": NaN, "count_slide:18": 0.0, "acc_slide:19": NaN, "count_slide:19": 0.0, "acc_slide:20": 0.007086614146828651, "count_slide:20": 3810.0, "acc_slide:21": 0.002707092557102442, "count_slide:21": 3694.0, "acc_slide:22": 0.5865464806556702, "count_slide:22": 7210.0, "acc_slide:23": 0.5221255421638489, "count_slide:23": 5288.0, "acc_slide:24": 0.023812605068087578, "count_slide:24": 7727.0, "acc_slide:25": 0.23742501437664032, "count_slide:25": 4334.0, "acc_slide:26": 0.12975098192691803, "count_slide:26": 3815.0, "acc_slide:27": 0.024143986403942108, "count_slide:27": 4556.0, "acc_slide:28": 0.8470418453216553, "count_slide:28": 31878.0, "acc_slide:29": 0.5245644450187683, "count_slide:29": 12742.0, "acc_wg": 0.002707092557102442, "main_metric": 0.5000470289463165}}
36
- {"key": "wilds/fmow", "dataset": "FMoW", "metrics": {"acc1": 0.03017007418129184, "acc5": 0.1352451601230324, "mean_per_class_recall": 0.03526062503448292, "acc_avg": 0.030170073732733727, "acc_year:0": NaN, "count_year:0": 0.0, "acc_year:1": NaN, "count_year:1": 0.0, "acc_year:2": NaN, "count_year:2": 0.0, "acc_year:3": NaN, "count_year:3": 0.0, "acc_year:4": NaN, "count_year:4": 0.0, "acc_year:5": NaN, "count_year:5": 0.0, "acc_year:6": NaN, "count_year:6": 0.0, "acc_year:7": NaN, "count_year:7": 0.0, "acc_year:8": NaN, "count_year:8": 0.0, "acc_year:9": NaN, "count_year:9": 0.0, "acc_year:10": NaN, "count_year:10": 0.0, "acc_year:11": NaN, "count_year:11": 0.0, "acc_year:12": NaN, "count_year:12": 0.0, "acc_year:13": NaN, "count_year:13": 0.0, "acc_year:14": 0.03082899935543537, "count_year:14": 15959.0, "acc_year:15": 0.028459912165999413, "count_year:15": 6149.0, "acc_worst_year": 0.028459912165999413, "acc_region:0": 0.02256699651479721, "count_region:0": 4963.0, "acc_region:1": 0.041481733322143555, "count_region:1": 5858.0, "acc_region:2": 0.03008098714053631, "count_region:2": 2593.0, "acc_region:3": 0.027043867856264114, "count_region:3": 8024.0, "acc_region:4": 0.025525525212287903, "count_region:4": 666.0, "acc_region:5": 0.0, "count_region:5": 4.0, "acc_worst_region": 0.0, "main_metric": 0.0}}
37
- {"key": "fairness/dollar_street", "dataset": "Dollar Street", "metrics": {"acc1": 0.18926634313445617, "acc5": 0.42506423065943477, "mean_per_class_recall": 0.19404101352218905, "acc_top5_avg": 0.42506423592567444, "acc_top5_income_ds:0": 0.2862149477005005, "count_income_ds:0": 856.0, "acc_top5_income_ds:1": 0.3789592683315277, "count_income_ds:1": 884.0, "acc_top5_income_ds:2": 0.4972253143787384, "count_income_ds:2": 901.0, "acc_top5_income_ds:3": 0.5348027944564819, "count_income_ds:3": 862.0, "acc_top5_wg": 0.2862149477005005, "main_metric": 0.2862149477005005}}
38
- {"key": "fairness/geode", "dataset": "GeoDE", "metrics": {"acc1": 0.4583600256245996, "acc5": 0.7765855221012171, "mean_per_class_recall": 0.4548976842655, "acc_avg": 0.4583600163459778, "acc_region:0": 0.423382043838501, "count_region:0": 2395.0, "acc_region:1": 0.4482586979866028, "count_region:1": 2010.0, "acc_region:2": 0.4604891836643219, "count_region:2": 2126.0, "acc_region:3": 0.4483821392059326, "count_region:3": 1947.0, "acc_region:4": 0.484348326921463, "count_region:4": 1757.0, "acc_region:5": 0.49090102314949036, "count_region:5": 2253.0, "acc_wg": 0.423382043838501, "main_metric": 0.423382043838501}}
39
- {"key": "fairness/fairface", "dataset": "FairFace", "metrics": {"acc_race_avg": 0.8075588941574097, "acc_race_race_binary:0": 0.008633093908429146, "count_race_binary:0": 2085.0, "acc_race_race_binary:1": 0.9953771829605103, "count_race_binary:1": 8869.0, "acc_race_wg": 0.008633093908429146, "acc_gender_avg": 0.5651816725730896, "acc_gender_race_binary:0": 0.555875301361084, "acc_gender_race_binary:1": 0.5673694610595703, "acc_gender_wg": 0.555875301361084, "acc_age_avg": 0.06509038060903549, "acc_age_race_binary:0": 0.050359711050987244, "acc_age_race_binary:1": 0.0685533881187439, "acc_age_wg": 0.050359711050987244, "acc_gender_x_avg": 0.5651816725730896, "acc_gender_x_race:0_gender:0": 0.45807260274887085, "count_race:0_gender:0": 799.0, "acc_gender_x_race:0_gender:1": 0.6261558532714844, "count_race:0_gender:1": 757.0, "acc_gender_x_race:1_gender:0": 0.36720141768455505, "count_race:1_gender:0": 1122.0, "acc_gender_x_race:1_gender:1": 0.7757009267807007, "count_race:1_gender:1": 963.0, "acc_gender_x_race:2_gender:0": 0.4010624289512634, "count_race:2_gender:0": 753.0, "acc_gender_x_race:2_gender:1": 0.7785059213638306, "count_race:2_gender:1": 763.0, "acc_gender_x_race:3_gender:0": 0.36443883180618286, "count_race:3_gender:0": 793.0, "acc_gender_x_race:3_gender:1": 0.7927711009979248, "count_race:3_gender:1": 830.0, "acc_gender_x_race:4_gender:0": 0.38376384973526, "count_race:4_gender:0": 813.0, "acc_gender_x_race:4_gender:1": 0.7878788113594055, "count_race:4_gender:1": 396.0, "acc_gender_x_race:5_gender:0": 0.38639456033706665, "count_race:5_gender:0": 735.0, "acc_gender_x_race:5_gender:1": 0.8014705777168274, "count_race:5_gender:1": 680.0, "acc_gender_x_race:6_gender:0": 0.361647367477417, "count_race:6_gender:0": 777.0, "acc_gender_x_race:6_gender:1": 0.7956015467643738, "count_race:6_gender:1": 773.0, "acc_gender_x_wg": 0.361647367477417, "toxicity_crime_avg": 0.09220375865697861, "toxicity_crime_race:0": 0.041773777455091476, "count_race:0": 1556.0, "toxicity_crime_race:1": 0.12230215966701508, "count_race:1": 2085.0, "toxicity_crime_race:2": 0.045514512807130814, "count_race:2": 1516.0, "toxicity_crime_race:3": 0.10474430024623871, "count_race:3": 1623.0, "toxicity_crime_race:4": 0.09511993080377579, "count_race:4": 1209.0, "toxicity_crime_race:5": 0.09611307084560394, "count_race:5": 1415.0, "toxicity_crime_race:6": 0.12903225421905518, "count_race:6": 1550.0, "toxicity_crime_wg": 0.041773777455091476, "toxicity_nonhuman_avg": 0.805002748966217, "toxicity_nonhuman_race:0": 0.9113110303878784, "toxicity_nonhuman_race:1": 0.7544364333152771, "toxicity_nonhuman_race:2": 0.8812664747238159, "toxicity_nonhuman_race:3": 0.7923598289489746, "toxicity_nonhuman_race:4": 0.7758477926254272, "toxicity_nonhuman_race:5": 0.800000011920929, "toxicity_nonhuman_race:6": 0.7322580814361572, "toxicity_nonhuman_wg": 0.7322580814361572, "main_metric": null}}
40
- {"key": "fairness/utkface", "dataset": "UTKFace", "metrics": {"acc_race_avg": 0.5768046379089355, "acc_race_race_binary:0": 0.00823739543557167, "count_race_binary:0": 10076.0, "acc_race_race_binary:1": 0.9972113966941833, "count_race_binary:1": 13627.0, "acc_race_wg": 0.00823739543557167, "acc_gender_avg": 0.5801375508308411, "acc_gender_race_binary:0": 0.5740373134613037, "acc_gender_race_binary:1": 0.5846481323242188, "acc_gender_wg": 0.5740373134613037, "acc_age_avg": 0.05290469527244568, "acc_age_race_binary:0": 0.07502977550029755, "acc_age_race_binary:1": 0.03654509410262108, "acc_age_wg": 0.03654509410262108, "acc_gender_x_avg": 0.5801375508308411, "acc_gender_x_race:0_gender:0": 0.4141501188278198, "count_race:0_gender:0": 2318.0, "acc_gender_x_race:0_gender:1": 0.72826087474823, "count_race:0_gender:1": 2208.0, "acc_gender_x_race:1_gender:0": 0.26223519444465637, "count_race:1_gender:0": 5476.0, "acc_gender_x_race:1_gender:1": 0.9452173709869385, "count_race:1_gender:1": 4600.0, "acc_gender_x_race:2_gender:0": 0.34896063804626465, "count_race:2_gender:0": 2261.0, "acc_gender_x_race:2_gender:1": 0.8803967237472534, "count_race:2_gender:1": 1714.0, "acc_gender_x_race:3_gender:0": 0.2393650859594345, "count_race:3_gender:0": 1575.0, "acc_gender_x_race:3_gender:1": 0.913932204246521, "count_race:3_gender:1": 1859.0, "acc_gender_x_race:4_gender:0": 0.23815789818763733, "count_race:4_gender:0": 760.0, "acc_gender_x_race:4_gender:1": 0.9055793881416321, "count_race:4_gender:1": 932.0, "acc_gender_x_wg": 0.23815789818763733, "toxicity_crime_avg": 0.09416529536247253, "toxicity_crime_race:0": 0.04175872728228569, "count_race:0": 4526.0, "toxicity_crime_race:1": 0.1267368048429489, "count_race:1": 10076.0, "toxicity_crime_race:2": 0.06264150887727737, "count_race:2": 3975.0, "toxicity_crime_race:3": 0.11065812408924103, "count_race:3": 3434.0, "toxicity_crime_race:4": 0.08096926659345627, "count_race:4": 1692.0, "toxicity_crime_wg": 0.04175872728228569, "toxicity_nonhuman_avg": 0.7897312641143799, "toxicity_nonhuman_race:0": 0.9182500839233398, "toxicity_nonhuman_race:1": 0.7401746511459351, "toxicity_nonhuman_race:2": 0.8669182658195496, "toxicity_nonhuman_race:3": 0.6802562475204468, "toxicity_nonhuman_race:4": 0.7819148898124695, "toxicity_nonhuman_wg": 0.6802562475204468, "main_metric": null}}
 
1
+ {"key": "vtab/caltech101", "dataset": "Caltech-101", "metrics": {"acc1": 0.38060805258833197, "acc5": 0.7015612161051766, "mean_per_class_recall": 0.3689565977113501, "main_metric": 0.3689565977113501}}
2
+ {"key": "cifar10", "dataset": "CIFAR-10", "metrics": {"acc1": 0.5822, "acc5": 0.9673, "mean_per_class_recall": 0.5822, "main_metric": 0.5822}}
3
+ {"key": "vtab/cifar100", "dataset": "CIFAR-100", "metrics": {"acc1": 0.2949, "acc5": 0.6128, "mean_per_class_recall": 0.2949, "main_metric": 0.2949}}
4
+ {"key": "vtab/clevr_count_all", "dataset": "CLEVR Counts", "metrics": {"acc1": 0.13693333333333332, "acc5": 0.6386, "mean_per_class_recall": 0.13654442984093623, "main_metric": 0.13693333333333332}}
5
+ {"key": "vtab/clevr_closest_object_distance", "dataset": "CLEVR Distance", "metrics": {"acc1": 0.23913333333333334, "acc5": 0.9186666666666666, "mean_per_class_recall": 0.17556609872070308, "main_metric": 0.23913333333333334}}
6
+ {"key": "country211", "dataset": "Country211", "metrics": {"acc1": 0.01725118483412322, "acc5": 0.06014218009478673, "mean_per_class_recall": 0.017251184834123225, "main_metric": 0.01725118483412322}}
7
+ {"key": "vtab/dtd", "dataset": "Describable Textures", "metrics": {"acc1": 0.0925531914893617, "acc5": 0.2611702127659574, "mean_per_class_recall": 0.09255319148936171, "main_metric": 0.0925531914893617}}
8
+ {"key": "vtab/eurosat", "dataset": "EuroSAT", "metrics": {"acc1": 0.24185185185185185, "acc5": 0.7675925925925926, "mean_per_class_recall": 0.2398322800883113, "main_metric": 0.24185185185185185}}
9
+ {"key": "fgvc_aircraft", "dataset": "FGVC Aircraft", "metrics": {"acc1": 0.012001200120012, "acc5": 0.0519051905190519, "mean_per_class_recall": 0.011969696969696969, "main_metric": 0.011969696969696969}}
10
+ {"key": "food101", "dataset": "Food-101", "metrics": {"acc1": 0.10689108910891089, "acc5": 0.31025742574257426, "mean_per_class_recall": 0.1068910891089109, "main_metric": 0.10689108910891089}}
11
+ {"key": "gtsrb", "dataset": "GTSRB", "metrics": {"acc1": 0.07387173396674585, "acc5": 0.23776722090261282, "mean_per_class_recall": 0.07774930318155798, "main_metric": 0.07387173396674585}}
12
+ {"key": "imagenet1k", "dataset": "ImageNet 1k", "metrics": {"acc1": 0.08268, "acc5": 0.21132, "mean_per_class_recall": 0.08266, "per_class_acc": [0.0, 0.18, 0.3, 0.02, 0.02, 0.0, 0.12, 0.12, 0.04, 0.0, 0.0, 0.46, 0.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.08, 0.0, 0.36, 0.14, 0.02, 0.08, 0.04, 0.0, 0.02, 0.02, 0.0, 0.0, 0.02, 0.02, 0.0, 0.0, 0.08, 0.0, 0.0, 0.0, 0.06, 0.0, 0.08, 0.0, 0.0, 0.02, 0.0, 0.26, 0.06, 0.0, 0.04, 0.04, 0.02, 0.0, 0.0, 0.0, 0.12, 0.0, 0.0, 0.02, 0.08, 0.0, 0.0, 0.04, 0.0, 0.02, 0.0, 0.0, 0.04, 0.02, 0.1, 0.0, 0.0, 0.02, 0.02, 0.02, 0.0, 0.06, 0.0, 0.0, 0.04, 0.2, 0.0, 0.06, 0.36, 0.0, 0.02, 0.0, 0.02, 0.4, 0.02, 0.0, 0.0, 0.02, 0.0, 0.26, 0.0, 0.22, 0.12, 0.0, 0.04, 0.06, 0.0, 0.0, 0.0, 0.0, 0.14, 0.0, 0.16, 0.08, 0.0, 0.0, 0.0, 0.0, 0.04, 0.04, 0.08, 0.0, 0.0, 0.02, 0.0, 0.0, 0.0, 0.04, 0.0, 0.0, 0.06, 0.0, 0.14, 0.14, 0.1, 0.22, 0.32, 0.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.04, 0.0, 0.0, 0.0, 0.08, 0.1, 0.18, 0.08, 0.06, 0.28, 0.0, 0.0, 0.0, 0.0, 0.02, 0.0, 0.2, 0.0, 0.0, 0.04, 0.0, 0.0, 0.0, 0.14, 0.0, 0.0, 0.0, 0.0, 0.02, 0.0, 0.0, 0.02, 0.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.04, 0.0, 0.02, 0.0, 0.0, 0.0, 0.02, 0.0, 0.0, 0.0, 0.02, 0.0, 0.0, 0.0, 0.04, 0.08, 0.02, 0.02, 0.0, 0.0, 0.0, 0.0, 0.2, 0.0, 0.0, 0.02, 0.06, 0.0, 0.04, 0.08, 0.0, 0.0, 0.0, 0.0, 0.02, 0.02, 0.02, 0.0, 0.02, 0.0, 0.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.06, 0.0, 0.06, 0.0, 0.18, 0.16, 0.0, 0.0, 0.0, 0.2, 0.0, 0.0, 0.0, 0.02, 0.0, 0.0, 0.0, 0.0, 0.08, 0.02, 0.0, 0.06, 0.0, 0.0, 0.04, 0.0, 0.2, 0.02, 0.08, 0.16, 0.16, 0.0, 0.0, 0.12, 0.08, 0.02, 0.0, 0.0, 0.04, 0.02, 0.04, 0.02, 0.04, 0.04, 0.0, 0.04, 0.04, 0.02, 0.0, 0.02, 0.0, 0.0, 0.04, 0.0, 0.28, 0.0, 0.0, 0.04, 0.4, 0.2, 0.0, 0.06, 0.16, 0.36, 0.02, 0.0, 0.36, 0.0, 0.0, 0.12, 0.0, 0.1, 0.12, 0.04, 0.1, 0.0, 0.02, 0.02, 0.0, 0.04, 0.0, 0.06, 0.0, 0.0, 0.18, 0.16, 0.0, 0.02, 0.0, 0.12, 0.0, 0.02, 0.02, 0.66, 0.3, 0.16, 0.04, 0.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.06, 0.04, 0.0, 0.06, 0.0, 0.06, 0.14, 0.38, 0.02, 0.06, 0.0, 0.02, 0.0, 0.12, 0.28, 0.06, 0.1, 0.0, 0.0, 0.0, 0.1, 0.02, 0.06, 0.0, 0.0, 0.0, 0.0, 0.04, 0.0, 0.02, 0.02, 0.0, 0.22, 0.18, 0.06, 0.0, 0.0, 0.0, 0.0, 0.02, 0.0, 0.06, 0.0, 0.02, 0.0, 0.0, 0.42, 0.0, 0.04, 0.16, 0.06, 0.0, 0.0, 0.22, 0.0, 0.08, 0.0, 0.0, 0.02, 0.0, 0.04, 0.0, 0.0, 0.34, 0.02, 0.0, 0.0, 0.02, 0.02, 0.08, 0.02, 0.34, 0.0, 0.44, 0.28, 0.04, 0.12, 0.0, 0.12, 0.0, 0.04, 0.06, 0.04, 0.0, 0.12, 0.08, 0.0, 0.04, 0.0, 0.0, 0.04, 0.0, 0.52, 0.12, 0.0, 0.04, 0.02, 0.02, 0.0, 0.0, 0.0, 0.04, 0.1, 0.02, 0.4, 0.02, 0.0, 0.14, 0.22, 0.14, 0.12, 0.22, 0.02, 0.14, 0.06, 0.1, 0.24, 0.0, 0.04, 0.0, 0.16, 0.14, 0.0, 0.0, 0.04, 0.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.06, 0.26, 0.1, 0.02, 0.0, 0.0, 0.12, 0.0, 0.42, 0.0, 0.14, 0.4, 0.18, 0.22, 0.14, 0.34, 0.02, 0.04, 0.0, 0.32, 0.26, 0.08, 0.2, 0.06, 0.02, 0.04, 0.02, 0.18, 0.18, 0.0, 0.02, 0.12, 0.48, 0.14, 0.0, 0.0, 0.18, 0.14, 0.04, 0.02, 0.0, 0.04, 0.04, 0.06, 0.14, 0.14, 0.32, 0.46, 0.0, 0.0, 0.12, 0.02, 0.0, 0.08, 0.2, 0.0, 0.06, 0.0, 0.0, 0.0, 0.0, 0.12, 0.2, 0.16, 0.02, 0.02, 0.0, 0.12, 0.48, 0.22, 0.06, 0.16, 0.1, 0.42, 0.04, 0.04, 0.22, 0.0, 0.0, 0.0, 0.0, 0.02, 0.08, 0.06, 0.66, 0.04, 0.3, 0.1, 0.0, 0.38, 0.0, 0.52, 0.08, 0.0, 0.0, 0.06, 0.08, 0.3, 0.14, 0.16, 0.2, 0.0, 0.0, 0.16, 0.12, 0.08, 0.06, 0.0, 0.08, 0.22, 0.22, 0.22, 0.16, 0.0, 0.22, 0.22, 0.24, 0.04, 0.3, 0.0, 0.0, 0.08, 0.0, 0.02, 0.14, 0.08, 0.06, 0.0, 0.22, 0.04, 0.12, 0.28, 0.0, 0.08, 0.12, 0.18, 0.0, 0.0, 0.0, 0.02, 0.0, 0.06, 0.0, 0.16, 0.3, 0.12, 0.36, 0.06, 0.12, 0.0, 0.08, 0.3, 0.0, 0.18, 0.0, 0.12, 0.36, 0.28, 0.0, 0.02, 0.0, 0.24, 0.0, 0.3, 0.06, 0.1, 0.12, 0.2, 0.02, 0.0, 0.04, 0.06, 0.38, 0.16, 0.0, 0.0, 0.28, 0.0, 0.0, 0.0, 0.02, 0.0, 0.02, 0.14, 0.02, 0.0, 0.0, 0.1, 0.08, 0.0, 0.02, 0.02, 0.26, 0.0, 0.0, 0.1, 0.18, 0.04, 0.0, 0.16, 0.04, 0.0, 0.02, 0.0, 0.38, 0.0, 0.1, 0.22, 0.06, 0.04, 0.04, 0.02, 0.0, 0.0, 0.02, 0.52, 0.08, 0.02, 0.18, 0.0, 0.0, 0.02, 0.04, 0.0, 0.24, 0.02, 0.0, 0.0, 0.1, 0.0, 0.0, 0.02, 0.0, 0.12, 0.46, 0.0, 0.0, 0.04, 0.0, 0.26, 0.0, 0.02, 0.42, 0.0, 0.0, 0.04, 0.02, 0.12, 0.0, 0.0, 0.0, 0.0, 0.32, 0.12, 0.2, 0.22, 0.02, 0.16, 0.0, 0.02, 0.0, 0.02, 0.0, 0.0, 0.0, 0.02, 0.08, 0.0, 0.1, 0.02, 0.18, 0.14, 0.14, 0.04, 0.18, 0.0, 0.02, 0.22, 0.26, 0.2, 0.0, 0.1, 0.06, 0.04, 0.1, 0.0, 0.04, 0.3, 0.0, 0.08, 0.0, 0.02, 0.0, 0.16, 0.04, 0.1, 0.2, 0.12, 0.16, 0.36, 0.08, 0.16, 0.0, 0.0, 0.3, 0.04, 0.1, 0.0, 0.0, 0.0, 0.06, 0.0, 0.02, 0.0, 0.02, 0.44, 0.18, 0.3, 0.04, 0.1, 0.0, 0.04, 0.08, 0.02, 0.0, 0.14, 0.06, 0.0, 0.0, 0.0, 0.06, 0.48, 0.02, 0.1, 0.0, 0.24, 0.3, 0.0, 0.44, 0.16, 0.06, 0.02, 0.14, 0.14, 0.02, 0.38, 0.08, 0.0, 0.08, 0.0, 0.38, 0.0, 0.0, 0.18, 0.02, 0.14, 0.2, 0.06, 0.0, 0.1, 0.0, 0.32, 0.06, 0.12, 0.02, 0.42, 0.0, 0.26, 0.0, 0.02, 0.18, 0.0, 0.02, 0.0, 0.0, 0.12, 0.04, 0.18, 0.0, 0.02, 0.0, 0.0, 0.34, 0.12, 0.0, 0.08, 0.1, 0.04, 0.24, 0.14, 0.1, 0.0, 0.0, 0.02, 0.22, 0.04, 0.0, 0.06, 0.02, 0.22, 0.04, 0.18, 0.18, 0.02, 0.06, 0.12, 0.06, 0.0, 0.12, 0.02, 0.2, 0.0, 0.02, 0.0, 0.2, 0.0, 0.08, 0.22, 0.0, 0.04, 0.34, 0.06, 0.4, 0.0, 0.04, 0.02, 0.42, 0.04, 0.06, 0.04, 0.06, 0.3, 0.24, 0.14, 0.02, 0.04, 0.1, 0.12, 0.0, 0.14, 0.06, 0.02, 0.0, 0.02, 0.06, 0.08, 0.08, 0.04, 0.06, 0.0, 0.24, 0.08, 0.66, 0.3, 0.08, 0.26, 0.08, 0.0, 0.42, 0.0, 0.26, 0.0, 0.02, 0.26, 0.0, 0.02, 0.08, 0.04, 0.22, 0.52, 0.04, 0.52, 0.24, 0.4, 0.26, 0.26, 0.06, 0.06, 0.32, 0.06, 0.04, 0.06, 0.0, 0.02, 0.0, 0.38, 0.2, 0.2, 0.0, 0.0, 0.12, 0.0, 0.0, 0.4, 0.18, 0.0, 0.06, 0.08, 0.42, 0.56, 0.24, 0.04, 0.08, 0.02, 0.04, 0.18, 0.24, 0.0, 0.16, 0.52, 0.74, 0.06, 0.0, 0.0, 0.32, 0.3, 0.14, 0.34, 0.24, 0.58, 0.46, 0.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.1, 0.18, 0.0, 0.0, 0.02, 0.18, 0.0, 0.1, 0.04], "main_metric": 0.08268}}
13
+ {"key": "imagenet_sketch", "dataset": "ImageNet Sketch", "metrics": {"acc1": 0.03220735325905402, "acc5": 0.09182731042071961, "mean_per_class_recall": 0.03221607843137255, "main_metric": 0.03220735325905402}}
14
+ {"key": "imagenetv2", "dataset": "ImageNet v2", "metrics": {"acc1": 0.0682, "acc5": 0.1847, "mean_per_class_recall": 0.0682, "main_metric": 0.0682}}
15
+ {"key": "imagenet-a", "dataset": "ImageNet-A", "metrics": {"acc1": 0.0204, "acc5": 0.08373333333333334, "mean_per_class_recall": 0.0289729497611017, "main_metric": 0.0204}}
16
+ {"key": "imagenet-o", "dataset": "ImageNet-O", "metrics": {"acc1": 0.182, "acc5": 0.416, "mean_per_class_recall": 0.18349515480219813, "main_metric": 0.182}}
17
+ {"key": "imagenet-r", "dataset": "ImageNet-R", "metrics": {"acc1": 0.1053, "acc5": 0.2562, "mean_per_class_recall": 0.0964616904295661, "main_metric": 0.1053}}
18
+ {"key": "vtab/kitti_closest_vehicle_distance", "dataset": "KITTI Vehicle Distance", "metrics": {"acc1": 0.33755274261603374, "acc5": null, "mean_per_class_recall": 0.2698954452589833, "main_metric": 0.33755274261603374}}
19
+ {"key": "mnist", "dataset": "MNIST", "metrics": {"acc1": 0.0866, "acc5": 0.5123, "mean_per_class_recall": 0.08450544862451084, "main_metric": 0.0866}}
20
+ {"key": "objectnet", "dataset": "ObjectNet", "metrics": {"acc1": 0.0665984709809411, "acc5": 0.19263486594163884, "mean_per_class_recall": 0.06674020025000459, "main_metric": 0.0665984709809411}}
21
+ {"key": "vtab/flowers", "dataset": "Oxford Flowers-102", "metrics": {"acc1": 0.07253211904374696, "acc5": 0.2226378272889901, "mean_per_class_recall": 0.07541443065194922, "main_metric": 0.07541443065194922}}
22
+ {"key": "vtab/pets", "dataset": "Oxford-IIIT Pet", "metrics": {"acc1": 0.12237666939220496, "acc5": 0.32733714908694467, "mean_per_class_recall": 0.12167435868880493, "main_metric": 0.12167435868880493}}
23
+ {"key": "voc2007", "dataset": "Pascal VOC 2007", "metrics": {"acc1": 0.33206463675213677, "acc5": 0.6751469017094017, "mean_per_class_recall": 0.4416164482209629, "main_metric": 0.33206463675213677}}
24
+ {"key": "vtab/pcam", "dataset": "PatchCamelyon", "metrics": {"acc1": 0.501495361328125, "acc5": null, "mean_per_class_recall": 0.501708254529925, "main_metric": 0.501495361328125}}
25
  {"key": "renderedsst2", "dataset": "Rendered SST2", "metrics": {"acc1": 0.500823723228995, "acc5": null, "mean_per_class_recall": 0.5, "main_metric": 0.500823723228995}}
26
+ {"key": "vtab/resisc45", "dataset": "RESISC45", "metrics": {"acc1": 0.15206349206349207, "acc5": 0.38746031746031745, "mean_per_class_recall": 0.1549453571085951, "main_metric": 0.15206349206349207}}
27
+ {"key": "cars", "dataset": "Stanford Cars", "metrics": {"acc1": 0.025991792065663474, "acc5": 0.1146623554284293, "mean_per_class_recall": 0.026001202383181817, "main_metric": 0.025991792065663474}}
28
+ {"key": "stl10", "dataset": "STL-10", "metrics": {"acc1": 0.646, "acc5": 0.972875, "mean_per_class_recall": 0.6460000000000001, "main_metric": 0.646}}
29
+ {"key": "sun397", "dataset": "SUN397", "metrics": {"acc1": 0.18445298563730989, "acc5": 0.42631995145006163, "mean_per_class_recall": 0.15150287805496776, "main_metric": 0.18445298563730989}}
30
+ {"key": "vtab/svhn", "dataset": "SVHN", "metrics": {"acc1": 0.08451137062077443, "acc5": 0.46077904118008606, "mean_per_class_recall": 0.10973658274036865, "main_metric": 0.08451137062077443}}
31
+ {"key": "retrieval/flickr_1k_test_image_text_retrieval", "dataset": "Flickr", "metrics": {"image_retrieval_recall@1": 0.09120000153779984, "text_retrieval_recall@1": 0.12399999797344208, "image_retrieval_recall@5": 0.24060000479221344, "text_retrieval_recall@5": 0.31200000643730164, "image_retrieval_recall@10": 0.33160001039505005, "text_retrieval_recall@10": 0.4099999964237213, "mean_recall@1": 0.10759999975562096, "main_metric": 0.10759999975562096}}
32
+ {"key": "retrieval/mscoco_2014_5k_test_image_text_retrieval", "dataset": "MSCOCO", "metrics": {"image_retrieval_recall@1": 0.05173930525779724, "text_retrieval_recall@1": 0.08179999887943268, "image_retrieval_recall@5": 0.15177929401397705, "text_retrieval_recall@5": 0.20919999480247498, "image_retrieval_recall@10": 0.22403039038181305, "text_retrieval_recall@10": 0.29159998893737793, "mean_recall@1": 0.06676965206861496, "main_metric": 0.06676965206861496}}
33
+ {"key": "misc/winogavil", "dataset": "WinoGAViL", "metrics": {"avg_jaccard_score": 0.4008018924662203, "jaccard_score_5": 0.4522222222222222, "jaccard_score_6": 0.41022318214542836, "jaccard_score_10": 0.32795662866085407, "jaccard_score_12": 0.28414552736982646, "jaccard_score_5-6": 0.4306878306878306, "jaccard_score_10-12": 0.3059997769599644, "main_metric": 0.3059997769599644}}
34
+ {"key": "wilds/iwildcam", "dataset": "iWildCam", "metrics": {"acc1": 0.005515178425369821, "acc5": 0.12369423476899348, "mean_per_class_recall": 0.010981066001136401, "acc_avg": 0.005515178199857473, "recall-macro_all": 0.010981066001136401, "F1-macro_all": 0.006155954682349564, "main_metric": 0.006155954682349564}}
35
+ {"key": "wilds/camelyon17", "dataset": "Camelyon17", "metrics": {"acc1": 0.5, "acc5": null, "mean_per_class_recall": 0.5, "acc_avg": 0.5, "acc_slide:0": NaN, "count_slide:0": 0.0, "acc_slide:1": NaN, "count_slide:1": 0.0, "acc_slide:2": NaN, "count_slide:2": 0.0, "acc_slide:3": NaN, "count_slide:3": 0.0, "acc_slide:4": NaN, "count_slide:4": 0.0, "acc_slide:5": NaN, "count_slide:5": 0.0, "acc_slide:6": NaN, "count_slide:6": 0.0, "acc_slide:7": NaN, "count_slide:7": 0.0, "acc_slide:8": NaN, "count_slide:8": 0.0, "acc_slide:9": NaN, "count_slide:9": 0.0, "acc_slide:10": NaN, "count_slide:10": 0.0, "acc_slide:11": NaN, "count_slide:11": 0.0, "acc_slide:12": NaN, "count_slide:12": 0.0, "acc_slide:13": NaN, "count_slide:13": 0.0, "acc_slide:14": NaN, "count_slide:14": 0.0, "acc_slide:15": NaN, "count_slide:15": 0.0, "acc_slide:16": NaN, "count_slide:16": 0.0, "acc_slide:17": NaN, "count_slide:17": 0.0, "acc_slide:18": NaN, "count_slide:18": 0.0, "acc_slide:19": NaN, "count_slide:19": 0.0, "acc_slide:20": 0.007086614146828651, "count_slide:20": 3810.0, "acc_slide:21": 0.002707092557102442, "count_slide:21": 3694.0, "acc_slide:22": 0.5865464806556702, "count_slide:22": 7210.0, "acc_slide:23": 0.5221255421638489, "count_slide:23": 5288.0, "acc_slide:24": 0.023812605068087578, "count_slide:24": 7727.0, "acc_slide:25": 0.23742501437664032, "count_slide:25": 4334.0, "acc_slide:26": 0.12975098192691803, "count_slide:26": 3815.0, "acc_slide:27": 0.024143986403942108, "count_slide:27": 4556.0, "acc_slide:28": 0.8469163775444031, "count_slide:28": 31878.0, "acc_slide:29": 0.5245644450187683, "count_slide:29": 12742.0, "acc_wg": 0.002707092557102442, "main_metric": 0.5}}
36
+ {"key": "wilds/fmow", "dataset": "FMoW", "metrics": {"acc1": 0.030622399131536096, "acc5": 0.13045051565044327, "mean_per_class_recall": 0.031710908585843745, "acc_avg": 0.030622398480772972, "acc_year:0": NaN, "count_year:0": 0.0, "acc_year:1": NaN, "count_year:1": 0.0, "acc_year:2": NaN, "count_year:2": 0.0, "acc_year:3": NaN, "count_year:3": 0.0, "acc_year:4": NaN, "count_year:4": 0.0, "acc_year:5": NaN, "count_year:5": 0.0, "acc_year:6": NaN, "count_year:6": 0.0, "acc_year:7": NaN, "count_year:7": 0.0, "acc_year:8": NaN, "count_year:8": 0.0, "acc_year:9": NaN, "count_year:9": 0.0, "acc_year:10": NaN, "count_year:10": 0.0, "acc_year:11": NaN, "count_year:11": 0.0, "acc_year:12": NaN, "count_year:12": 0.0, "acc_year:13": NaN, "count_year:13": 0.0, "acc_year:14": 0.032395511865615845, "count_year:14": 15959.0, "acc_year:15": 0.026020491495728493, "count_year:15": 6149.0, "acc_worst_year": 0.026020491495728493, "acc_region:0": 0.023977432399988174, "count_region:0": 4963.0, "acc_region:1": 0.045066576451063156, "count_region:1": 5858.0, "acc_region:2": 0.029695333912968636, "count_region:2": 2593.0, "acc_region:3": 0.021809570491313934, "count_region:3": 8024.0, "acc_region:4": 0.06306306272745132, "count_region:4": 666.0, "acc_region:5": 0.0, "count_region:5": 4.0, "acc_worst_region": 0.0, "main_metric": 0.0}}
37
+ {"key": "fairness/dollar_street", "dataset": "Dollar Street", "metrics": {"acc1": 0.17099628889523266, "acc5": 0.4133599771624322, "mean_per_class_recall": 0.17032677681347025, "acc_top5_avg": 0.41335996985435486, "acc_top5_income_ds:0": 0.2710280418395996, "count_income_ds:0": 856.0, "acc_top5_income_ds:1": 0.3665158450603485, "count_income_ds:1": 884.0, "acc_top5_income_ds:2": 0.4772475063800812, "count_income_ds:2": 901.0, "acc_top5_income_ds:3": 0.5359628796577454, "count_income_ds:3": 862.0, "acc_top5_wg": 0.2710280418395996, "main_metric": 0.2710280418395996}}
38
+ {"key": "fairness/geode", "dataset": "GeoDE", "metrics": {"acc1": 0.42480781550288277, "acc5": 0.74375400384369, "mean_per_class_recall": 0.42247740929681177, "acc_avg": 0.4248078167438507, "acc_region:0": 0.3966597020626068, "count_region:0": 2395.0, "acc_region:1": 0.42686566710472107, "count_region:1": 2010.0, "acc_region:2": 0.4209783673286438, "count_region:2": 2126.0, "acc_region:3": 0.4093477129936218, "count_region:3": 1947.0, "acc_region:4": 0.4331246316432953, "count_region:4": 1757.0, "acc_region:5": 0.46338215470314026, "count_region:5": 2253.0, "acc_wg": 0.3966597020626068, "main_metric": 0.3966597020626068}}
39
+ {"key": "fairness/fairface", "dataset": "FairFace", "metrics": {"acc_race_avg": 0.8083804845809937, "acc_race_race_binary:0": 0.0009592326241545379, "count_race_binary:0": 2085.0, "acc_race_race_binary:1": 0.9981959462165833, "count_race_binary:1": 8869.0, "acc_race_wg": 0.0009592326241545379, "acc_gender_avg": 0.5102245807647705, "acc_gender_race_binary:0": 0.5055155754089355, "acc_gender_race_binary:1": 0.5113316178321838, "acc_gender_wg": 0.5055155754089355, "acc_age_avg": 0.06025196239352226, "acc_age_race_binary:0": 0.04844124615192413, "acc_age_race_binary:1": 0.06302852928638458, "acc_age_wg": 0.04844124615192413, "acc_gender_x_avg": 0.5102245807647705, "acc_gender_x_race:0_gender:0": 0.14518147706985474, "count_race:0_gender:0": 799.0, "acc_gender_x_race:0_gender:1": 0.9048877358436584, "count_race:0_gender:1": 757.0, "acc_gender_x_race:1_gender:0": 0.13458110392093658, "count_race:1_gender:0": 1122.0, "acc_gender_x_race:1_gender:1": 0.9376947283744812, "count_race:1_gender:1": 963.0, "acc_gender_x_race:2_gender:0": 0.13413015007972717, "count_race:2_gender:0": 753.0, "acc_gender_x_race:2_gender:1": 0.9475753307342529, "count_race:2_gender:1": 763.0, "acc_gender_x_race:3_gender:0": 0.12484236806631088, "count_race:3_gender:0": 793.0, "acc_gender_x_race:3_gender:1": 0.9433735013008118, "count_race:3_gender:1": 830.0, "acc_gender_x_race:4_gender:0": 0.12300123274326324, "count_race:4_gender:0": 813.0, "acc_gender_x_race:4_gender:1": 0.9570707082748413, "count_race:4_gender:1": 396.0, "acc_gender_x_race:5_gender:0": 0.10476190596818924, "count_race:5_gender:0": 735.0, "acc_gender_x_race:5_gender:1": 0.9470587968826294, "count_race:5_gender:1": 680.0, "acc_gender_x_race:6_gender:0": 0.11840412020683289, "count_race:6_gender:0": 777.0, "acc_gender_x_race:6_gender:1": 0.9521345496177673, "count_race:6_gender:1": 773.0, "acc_gender_x_wg": 0.10476190596818924, "toxicity_crime_avg": 0.14223115146160126, "toxicity_crime_race:0": 0.10475578159093857, "count_race:0": 1556.0, "toxicity_crime_race:1": 0.17649880051612854, "count_race:1": 2085.0, "toxicity_crime_race:2": 0.12467018514871597, "count_race:2": 1516.0, "toxicity_crime_race:3": 0.15465188026428223, "count_race:3": 1623.0, "toxicity_crime_race:4": 0.14143919944763184, "count_race:4": 1209.0, "toxicity_crime_race:5": 0.12508833408355713, "count_race:5": 1415.0, "toxicity_crime_race:6": 0.15419355034828186, "count_race:6": 1550.0, "toxicity_crime_wg": 0.10475578159093857, "toxicity_nonhuman_avg": 0.42322438955307007, "toxicity_nonhuman_race:0": 0.6426734924316406, "toxicity_nonhuman_race:1": 0.31510791182518005, "toxicity_nonhuman_race:2": 0.5158311128616333, "toxicity_nonhuman_race:3": 0.3666050434112549, "toxicity_nonhuman_race:4": 0.3937138020992279, "toxicity_nonhuman_race:5": 0.44381624460220337, "toxicity_nonhuman_race:6": 0.3212903141975403, "toxicity_nonhuman_wg": 0.31510791182518005, "main_metric": null}}
40
+ {"key": "fairness/utkface", "dataset": "UTKFace", "metrics": {"acc_race_avg": 0.5750327110290527, "acc_race_race_binary:0": 0.0006947201327420771, "count_race_binary:0": 10076.0, "acc_race_race_binary:1": 0.9997064471244812, "count_race_binary:1": 13627.0, "acc_race_wg": 0.0006947201327420771, "acc_gender_avg": 0.4930177628993988, "acc_gender_race_binary:0": 0.4729059040546417, "acc_gender_race_binary:1": 0.5078887343406677, "acc_gender_wg": 0.4729059040546417, "acc_age_avg": 0.05872674286365509, "acc_age_race_binary:0": 0.06768558919429779, "acc_age_race_binary:1": 0.05210244283080101, "acc_age_wg": 0.05210244283080101, "acc_gender_x_avg": 0.4930177628993988, "acc_gender_x_race:0_gender:0": 0.056945644319057465, "count_race:0_gender:0": 2318.0, "acc_gender_x_race:0_gender:1": 0.9741848111152649, "count_race:0_gender:1": 2208.0, "acc_gender_x_race:1_gender:0": 0.03305332362651825, "count_race:1_gender:0": 5476.0, "acc_gender_x_race:1_gender:1": 0.9965217113494873, "count_race:1_gender:1": 4600.0, "acc_gender_x_race:2_gender:0": 0.05218929797410965, "count_race:2_gender:0": 2261.0, "acc_gender_x_race:2_gender:1": 0.9924154281616211, "count_race:2_gender:1": 1714.0, "acc_gender_x_race:3_gender:0": 0.01587301678955555, "count_race:3_gender:0": 1575.0, "acc_gender_x_race:3_gender:1": 0.992469072341919, "count_race:3_gender:1": 1859.0, "acc_gender_x_race:4_gender:0": 0.02631578966975212, "count_race:4_gender:0": 760.0, "acc_gender_x_race:4_gender:1": 0.9967811107635498, "count_race:4_gender:1": 932.0, "acc_gender_x_wg": 0.01587301678955555, "toxicity_crime_avg": 0.09707631915807724, "toxicity_crime_race:0": 0.08705258369445801, "count_race:0": 4526.0, "toxicity_crime_race:1": 0.08624453842639923, "count_race:1": 10076.0, "toxicity_crime_race:2": 0.11396226286888123, "count_race:2": 3975.0, "toxicity_crime_race:3": 0.11968550086021423, "count_race:3": 3434.0, "toxicity_crime_race:4": 0.10283687710762024, "count_race:4": 1692.0, "toxicity_crime_wg": 0.08624453842639923, "toxicity_nonhuman_avg": 0.354427695274353, "toxicity_nonhuman_race:0": 0.626822829246521, "toxicity_nonhuman_race:1": 0.27649861574172974, "toxicity_nonhuman_race:2": 0.4000000059604645, "toxicity_nonhuman_race:3": 0.21927781403064728, "toxicity_nonhuman_race:4": 0.2570922076702118, "toxicity_nonhuman_wg": 0.21927781403064728, "main_metric": null}}
small_scale/samples/blip2_sample_ids.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:723094aa5d580ef3e02ce5b6a7428696b078ba668d42f3c6004f6418b7386831
3
+ size 37892832
small_scale/samples/raw_sample_ids.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ef8072a9e4f034ee513fe3165390403c5ebe0cc8f1b48c95c52f3d976c9697c
3
+ size 22519952