nopperl commited on
Commit
f96d53b
β€’
1 Parent(s): 457746c

update model

Browse files
small_scale/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20480e6eec94100e9dcab9767a911f50536aaefe49926d7c8a5270435d5d4720
3
  size 1815639289
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70da6370f42f58d775fdde4a70bcafe682135c7f42027a9adcd609667fbc076b
3
  size 1815639289
small_scale/results.jsonl CHANGED
@@ -1,40 +1,40 @@
1
- {"key": "vtab/caltech101", "dataset": "Caltech-101", "metrics": {"acc1": 0.19096138044371405, "acc5": 0.4686935086277732, "mean_per_class_recall": 0.14876522162009528, "main_metric": 0.14876522162009528}}
2
- {"key": "cifar10", "dataset": "CIFAR-10", "metrics": {"acc1": 0.3402, "acc5": 0.8918, "mean_per_class_recall": 0.3402, "main_metric": 0.3402}}
3
- {"key": "vtab/cifar100", "dataset": "CIFAR-100", "metrics": {"acc1": 0.1117, "acc5": 0.3358, "mean_per_class_recall": 0.11169999999999998, "main_metric": 0.1117}}
4
- {"key": "vtab/clevr_count_all", "dataset": "CLEVR Counts", "metrics": {"acc1": 0.14113333333333333, "acc5": 0.6643333333333333, "mean_per_class_recall": 0.13760959725188934, "main_metric": 0.14113333333333333}}
5
- {"key": "vtab/clevr_closest_object_distance", "dataset": "CLEVR Distance", "metrics": {"acc1": 0.096, "acc5": 0.9186666666666666, "mean_per_class_recall": 0.16223115409418895, "main_metric": 0.096}}
6
- {"key": "country211", "dataset": "Country211", "metrics": {"acc1": 0.01009478672985782, "acc5": 0.04601895734597156, "mean_per_class_recall": 0.01009478672985782, "main_metric": 0.01009478672985782}}
7
- {"key": "vtab/dtd", "dataset": "Describable Textures", "metrics": {"acc1": 0.04468085106382979, "acc5": 0.15851063829787235, "mean_per_class_recall": 0.04468085106382978, "main_metric": 0.04468085106382979}}
8
- {"key": "vtab/eurosat", "dataset": "EuroSAT", "metrics": {"acc1": 0.14759259259259258, "acc5": 0.5925925925925926, "mean_per_class_recall": 0.13742687420737648, "main_metric": 0.14759259259259258}}
9
- {"key": "fgvc_aircraft", "dataset": "FGVC Aircraft", "metrics": {"acc1": 0.0102010201020102, "acc5": 0.05490549054905491, "mean_per_class_recall": 0.010196078431372548, "main_metric": 0.010196078431372548}}
10
- {"key": "food101", "dataset": "Food-101", "metrics": {"acc1": 0.0438019801980198, "acc5": 0.16201980198019802, "mean_per_class_recall": 0.043801980198019785, "main_metric": 0.0438019801980198}}
11
- {"key": "gtsrb", "dataset": "GTSRB", "metrics": {"acc1": 0.056057007125890734, "acc5": 0.22438638163103722, "mean_per_class_recall": 0.07002965958881024, "main_metric": 0.056057007125890734}}
12
- {"key": "imagenet1k", "dataset": "ImageNet 1k", "metrics": {"acc1": 0.02432, "acc5": 0.08426, "mean_per_class_recall": 0.024300000000000006, "main_metric": 0.02432}}
13
- {"key": "imagenet_sketch", "dataset": "ImageNet Sketch", "metrics": {"acc1": 0.009294739531136395, "acc5": 0.029849279805065927, "mean_per_class_recall": 0.009315686274509804, "main_metric": 0.009294739531136395}}
14
- {"key": "imagenetv2", "dataset": "ImageNet v2", "metrics": {"acc1": 0.024, "acc5": 0.0788, "mean_per_class_recall": 0.024, "main_metric": 0.024}}
15
- {"key": "imagenet-a", "dataset": "ImageNet-A", "metrics": {"acc1": 0.011733333333333333, "acc5": 0.0596, "mean_per_class_recall": 0.016848563250867133, "main_metric": 0.011733333333333333}}
16
- {"key": "imagenet-o", "dataset": "ImageNet-O", "metrics": {"acc1": 0.0915, "acc5": 0.2475, "mean_per_class_recall": 0.0846943110209364, "main_metric": 0.0915}}
17
- {"key": "imagenet-r", "dataset": "ImageNet-R", "metrics": {"acc1": 0.03796666666666667, "acc5": 0.1311, "mean_per_class_recall": 0.03626142230215076, "main_metric": 0.03796666666666667}}
18
- {"key": "vtab/kitti_closest_vehicle_distance", "dataset": "KITTI Vehicle Distance", "metrics": {"acc1": 0.350210970464135, "acc5": null, "mean_per_class_recall": 0.2383231378869298, "main_metric": 0.350210970464135}}
19
- {"key": "mnist", "dataset": "MNIST", "metrics": {"acc1": 0.0578, "acc5": 0.5134, "mean_per_class_recall": 0.05114947437110765, "main_metric": 0.0578}}
20
- {"key": "objectnet", "dataset": "ObjectNet", "metrics": {"acc1": 0.03198018735867342, "acc5": 0.12043717023796705, "mean_per_class_recall": 0.03220009763854892, "main_metric": 0.03198018735867342}}
21
- {"key": "vtab/flowers", "dataset": "Oxford Flowers-102", "metrics": {"acc1": 0.021304277118230606, "acc5": 0.08554236461213205, "mean_per_class_recall": 0.028807478481708775, "main_metric": 0.028807478481708775}}
22
- {"key": "vtab/pets", "dataset": "Oxford-IIIT Pet", "metrics": {"acc1": 0.050695012264922325, "acc5": 0.20005451076587627, "mean_per_class_recall": 0.050423028358856, "main_metric": 0.050423028358856}}
23
- {"key": "voc2007", "dataset": "Pascal VOC 2007", "metrics": {"acc1": 0.2715678418803419, "acc5": 0.6294738247863247, "mean_per_class_recall": 0.28490328170451634, "main_metric": 0.2715678418803419}}
24
- {"key": "vtab/pcam", "dataset": "PatchCamelyon", "metrics": {"acc1": 0.56549072265625, "acc5": null, "mean_per_class_recall": 0.5656405341490588, "main_metric": 0.56549072265625}}
25
- {"key": "renderedsst2", "dataset": "Rendered SST2", "metrics": {"acc1": 0.500823723228995, "acc5": null, "mean_per_class_recall": 0.5, "main_metric": 0.500823723228995}}
26
- {"key": "vtab/resisc45", "dataset": "RESISC45", "metrics": {"acc1": 0.056984126984126984, "acc5": 0.23507936507936508, "mean_per_class_recall": 0.05876417000502206, "main_metric": 0.056984126984126984}}
27
- {"key": "cars", "dataset": "Stanford Cars", "metrics": {"acc1": 0.01703768188036314, "acc5": 0.06703146374829001, "mean_per_class_recall": 0.017114175811972214, "main_metric": 0.01703768188036314}}
28
- {"key": "stl10", "dataset": "STL-10", "metrics": {"acc1": 0.426, "acc5": 0.91325, "mean_per_class_recall": 0.426, "main_metric": 0.426}}
29
- {"key": "sun397", "dataset": "SUN397", "metrics": {"acc1": 0.06714235798223514, "acc5": 0.19053092300053331, "mean_per_class_recall": 0.046076850108507414, "main_metric": 0.06714235798223514}}
30
- {"key": "vtab/svhn", "dataset": "SVHN", "metrics": {"acc1": 0.09903196066379841, "acc5": 0.503380454824831, "mean_per_class_recall": 0.10144132435053754, "main_metric": 0.09903196066379841}}
31
- {"key": "retrieval/flickr_1k_test_image_text_retrieval", "dataset": "Flickr", "metrics": {"image_retrieval_recall@1": 0.016200000420212746, "text_retrieval_recall@1": 0.01899999938905239, "image_retrieval_recall@5": 0.06040000170469284, "text_retrieval_recall@5": 0.08699999749660492, "image_retrieval_recall@10": 0.1005999967455864, "text_retrieval_recall@10": 0.14300000667572021, "mean_recall@1": 0.01759999990463257, "main_metric": 0.01759999990463257}}
32
- {"key": "retrieval/mscoco_2014_5k_test_image_text_retrieval", "dataset": "MSCOCO", "metrics": {"image_retrieval_recall@1": 0.00875649694353342, "text_retrieval_recall@1": 0.01679999940097332, "image_retrieval_recall@5": 0.03282687067985535, "text_retrieval_recall@5": 0.053599998354911804, "image_retrieval_recall@10": 0.055457815527915955, "text_retrieval_recall@10": 0.07999999821186066, "mean_recall@1": 0.01277824817225337, "main_metric": 0.01277824817225337}}
33
- {"key": "misc/winogavil", "dataset": "WinoGAViL", "metrics": {"avg_jaccard_score": 0.39028106330941015, "jaccard_score_5": 0.4422474747474747, "jaccard_score_6": 0.3950803935685145, "jaccard_score_10": 0.3219874804381847, "jaccard_score_12": 0.2824098798397864, "jaccard_score_5-6": 0.4180632459702227, "jaccard_score_10-12": 0.30215233634437383, "main_metric": 0.30215233634437383}}
34
- {"key": "wilds/iwildcam", "dataset": "iWildCam", "metrics": {"acc1": 0.0014956416068799515, "acc5": 0.023813418709541727, "mean_per_class_recall": 0.005449368147679506, "acc_avg": 0.0014956416562199593, "recall-macro_all": 0.005449368147679506, "F1-macro_all": 0.00037990574770134484, "main_metric": 0.00037990574770134484}}
35
- {"key": "wilds/camelyon17", "dataset": "Camelyon17", "metrics": {"acc1": 0.6451666000423261, "acc5": null, "mean_per_class_recall": 0.6451666000423261, "acc_avg": 0.6451665759086609, "acc_slide:0": NaN, "count_slide:0": 0.0, "acc_slide:1": NaN, "count_slide:1": 0.0, "acc_slide:2": NaN, "count_slide:2": 0.0, "acc_slide:3": NaN, "count_slide:3": 0.0, "acc_slide:4": NaN, "count_slide:4": 0.0, "acc_slide:5": NaN, "count_slide:5": 0.0, "acc_slide:6": NaN, "count_slide:6": 0.0, "acc_slide:7": NaN, "count_slide:7": 0.0, "acc_slide:8": NaN, "count_slide:8": 0.0, "acc_slide:9": NaN, "count_slide:9": 0.0, "acc_slide:10": NaN, "count_slide:10": 0.0, "acc_slide:11": NaN, "count_slide:11": 0.0, "acc_slide:12": NaN, "count_slide:12": 0.0, "acc_slide:13": NaN, "count_slide:13": 0.0, "acc_slide:14": NaN, "count_slide:14": 0.0, "acc_slide:15": NaN, "count_slide:15": 0.0, "acc_slide:16": NaN, "count_slide:16": 0.0, "acc_slide:17": NaN, "count_slide:17": 0.0, "acc_slide:18": NaN, "count_slide:18": 0.0, "acc_slide:19": NaN, "count_slide:19": 0.0, "acc_slide:20": 0.5446194410324097, "count_slide:20": 3810.0, "acc_slide:21": 0.32782891392707825, "count_slide:21": 3694.0, "acc_slide:22": 0.8144243955612183, "count_slide:22": 7210.0, "acc_slide:23": 0.6047655344009399, "count_slide:23": 5288.0, "acc_slide:24": 0.1980069875717163, "count_slide:24": 7727.0, "acc_slide:25": 0.520766019821167, "count_slide:25": 4334.0, "acc_slide:26": 0.45792922377586365, "count_slide:26": 3815.0, "acc_slide:27": 0.3156277537345886, "count_slide:27": 4556.0, "acc_slide:28": 0.8569232821464539, "count_slide:28": 31878.0, "acc_slide:29": 0.64581698179245, "count_slide:29": 12742.0, "acc_wg": 0.1980069875717163, "main_metric": 0.6451666000423261}}
36
- {"key": "wilds/fmow", "dataset": "FMoW", "metrics": {"acc1": 0.017731138049574813, "acc5": 0.09521440202641578, "mean_per_class_recall": 0.02122502101529086, "acc_avg": 0.017731137573719025, "acc_year:0": NaN, "count_year:0": 0.0, "acc_year:1": NaN, "count_year:1": 0.0, "acc_year:2": NaN, "count_year:2": 0.0, "acc_year:3": NaN, "count_year:3": 0.0, "acc_year:4": NaN, "count_year:4": 0.0, "acc_year:5": NaN, "count_year:5": 0.0, "acc_year:6": NaN, "count_year:6": 0.0, "acc_year:7": NaN, "count_year:7": 0.0, "acc_year:8": NaN, "count_year:8": 0.0, "acc_year:9": NaN, "count_year:9": 0.0, "acc_year:10": NaN, "count_year:10": 0.0, "acc_year:11": NaN, "count_year:11": 0.0, "acc_year:12": NaN, "count_year:12": 0.0, "acc_year:13": NaN, "count_year:13": 0.0, "acc_year:14": 0.01835954561829567, "count_year:14": 15959.0, "acc_year:15": 0.01610017940402031, "count_year:15": 6149.0, "acc_worst_year": 0.01610017940402031, "acc_region:0": 0.019746121019124985, "count_region:0": 4963.0, "acc_region:1": 0.014168658293783665, "count_region:1": 5858.0, "acc_region:2": 0.013497878797352314, "count_region:2": 2593.0, "acc_region:3": 0.0178215354681015, "count_region:3": 8024.0, "acc_region:4": 0.04954954981803894, "count_region:4": 666.0, "acc_region:5": 0.0, "count_region:5": 4.0, "acc_worst_region": 0.0, "main_metric": 0.0}}
37
- {"key": "fairness/dollar_street", "dataset": "Dollar Street", "metrics": {"acc1": 0.09991435912075364, "acc5": 0.30659434770196975, "mean_per_class_recall": 0.09344864211765992, "acc_top5_avg": 0.3065943419933319, "acc_top5_income_ds:0": 0.1997663527727127, "count_income_ds:0": 856.0, "acc_top5_income_ds:1": 0.2884615361690521, "count_income_ds:1": 884.0, "acc_top5_income_ds:2": 0.35072141885757446, "count_income_ds:2": 901.0, "acc_top5_income_ds:3": 0.38515082001686096, "count_income_ds:3": 862.0, "acc_top5_wg": 0.1997663527727127, "main_metric": 0.1997663527727127}}
38
- {"key": "fairness/geode", "dataset": "GeoDE", "metrics": {"acc1": 0.24415438821268418, "acc5": 0.5742312620115311, "mean_per_class_recall": 0.24023612665034877, "acc_avg": 0.24415439367294312, "acc_region:0": 0.22379958629608154, "count_region:0": 2395.0, "acc_region:1": 0.24875621497631073, "count_region:1": 2010.0, "acc_region:2": 0.24553151428699493, "count_region:2": 2126.0, "acc_region:3": 0.22033898532390594, "count_region:3": 1947.0, "acc_region:4": 0.2692088782787323, "count_region:4": 1757.0, "acc_region:5": 0.26142919063568115, "count_region:5": 2253.0, "acc_wg": 0.22033898532390594, "main_metric": 0.22033898532390594}}
39
- {"key": "fairness/fairface", "dataset": "FairFace", "metrics": {"acc_race_avg": 0.6474347114562988, "acc_race_race_binary:0": 0.4033573269844055, "count_race_binary:0": 2085.0, "acc_race_race_binary:1": 0.7048144936561584, "count_race_binary:1": 8869.0, "acc_race_wg": 0.4033573269844055, "acc_gender_avg": 0.5025561451911926, "acc_gender_race_binary:0": 0.4762589931488037, "acc_gender_race_binary:1": 0.5087382793426514, "acc_gender_wg": 0.4762589931488037, "acc_age_avg": 0.09740734100341797, "acc_age_race_binary:0": 0.09352517873048782, "acc_age_race_binary:1": 0.09831999242305756, "acc_age_wg": 0.09352517873048782, "acc_gender_x_avg": 0.5025561451911926, "acc_gender_x_race:0_gender:0": 0.24030037224292755, "count_race:0_gender:0": 799.0, "acc_gender_x_race:0_gender:1": 0.8665785789489746, "count_race:0_gender:1": 757.0, "acc_gender_x_race:1_gender:0": 0.06417112052440643, "count_race:1_gender:0": 1122.0, "acc_gender_x_race:1_gender:1": 0.9563862681388855, "count_race:1_gender:1": 963.0, "acc_gender_x_race:2_gender:0": 0.14741036295890808, "count_race:2_gender:0": 753.0, "acc_gender_x_race:2_gender:1": 0.9292267560958862, "count_race:2_gender:1": 763.0, "acc_gender_x_race:3_gender:0": 0.09205548465251923, "count_race:3_gender:0": 793.0, "acc_gender_x_race:3_gender:1": 0.9650602340698242, "count_race:3_gender:1": 830.0, "acc_gender_x_race:4_gender:0": 0.1156211569905281, "count_race:4_gender:0": 813.0, "acc_gender_x_race:4_gender:1": 0.9292929172515869, "count_race:4_gender:1": 396.0, "acc_gender_x_race:5_gender:0": 0.09115646034479141, "count_race:5_gender:0": 735.0, "acc_gender_x_race:5_gender:1": 0.9308823347091675, "count_race:5_gender:1": 680.0, "acc_gender_x_race:6_gender:0": 0.09009008854627609, "count_race:6_gender:0": 777.0, "acc_gender_x_race:6_gender:1": 0.9547218680381775, "count_race:6_gender:1": 773.0, "acc_gender_x_wg": 0.06417112052440643, "toxicity_crime_avg": 0.04144604876637459, "toxicity_crime_race:0": 0.03213367611169815, "count_race:0": 1556.0, "toxicity_crime_race:1": 0.042206235229969025, "count_race:1": 2085.0, "toxicity_crime_race:2": 0.03166227042675018, "count_race:2": 1516.0, "toxicity_crime_race:3": 0.051139865070581436, "count_race:3": 1623.0, "toxicity_crime_race:4": 0.040529362857341766, "count_race:4": 1209.0, "toxicity_crime_race:5": 0.0494699664413929, "count_race:5": 1415.0, "toxicity_crime_race:6": 0.04258064553141594, "count_race:6": 1550.0, "toxicity_crime_wg": 0.03166227042675018, "toxicity_nonhuman_avg": 0.33768486976623535, "toxicity_nonhuman_race:0": 0.5212082266807556, "toxicity_nonhuman_race:1": 0.23884892463684082, "toxicity_nonhuman_race:2": 0.4056728184223175, "toxicity_nonhuman_race:3": 0.27541589736938477, "toxicity_nonhuman_race:4": 0.32423490285873413, "toxicity_nonhuman_race:5": 0.35830387473106384, "toxicity_nonhuman_race:6": 0.27677419781684875, "toxicity_nonhuman_wg": 0.23884892463684082, "main_metric": null}}
40
- {"key": "fairness/utkface", "dataset": "UTKFace", "metrics": {"acc_race_avg": 0.5265578031539917, "acc_race_race_binary:0": 0.7908892631530762, "count_race_binary:0": 10076.0, "acc_race_race_binary:1": 0.33110734820365906, "count_race_binary:1": 13627.0, "acc_race_wg": 0.33110734820365906, "acc_gender_avg": 0.5004007816314697, "acc_gender_race_binary:0": 0.46843984723091125, "acc_gender_race_binary:1": 0.5240331888198853, "acc_gender_wg": 0.46843984723091125, "acc_age_avg": 0.13006792962551117, "acc_age_race_binary:0": 0.08832870423793793, "acc_age_race_binary:1": 0.16093049943447113, "acc_age_wg": 0.08832870423793793, "acc_gender_x_avg": 0.5004007816314697, "acc_gender_x_race:0_gender:0": 0.1609145849943161, "count_race:0_gender:0": 2318.0, "acc_gender_x_race:0_gender:1": 0.9547101259231567, "count_race:0_gender:1": 2208.0, "acc_gender_x_race:1_gender:0": 0.034879475831985474, "count_race:1_gender:0": 5476.0, "acc_gender_x_race:1_gender:1": 0.9845651984214783, "count_race:1_gender:1": 4600.0, "acc_gender_x_race:2_gender:0": 0.06324635446071625, "count_race:2_gender:0": 2261.0, "acc_gender_x_race:2_gender:1": 0.9801633358001709, "count_race:2_gender:1": 1714.0, "acc_gender_x_race:3_gender:0": 0.03936507925391197, "count_race:3_gender:0": 1575.0, "acc_gender_x_race:3_gender:1": 0.9811726808547974, "count_race:3_gender:1": 1859.0, "acc_gender_x_race:4_gender:0": 0.04078947380185127, "count_race:4_gender:0": 760.0, "acc_gender_x_race:4_gender:1": 0.9871244430541992, "count_race:4_gender:1": 932.0, "acc_gender_x_wg": 0.034879475831985474, "toxicity_crime_avg": 0.009365903213620186, "toxicity_crime_race:0": 0.015687141567468643, "count_race:0": 4526.0, "toxicity_crime_race:1": 0.0078404126688838, "count_race:1": 10076.0, "toxicity_crime_race:2": 0.00930817611515522, "count_race:2": 3975.0, "toxicity_crime_race:3": 0.0052417004480957985, "count_race:3": 3434.0, "toxicity_crime_race:4": 0.01004728116095066, "count_race:4": 1692.0, "toxicity_crime_wg": 0.0052417004480957985, "toxicity_nonhuman_avg": 0.26460784673690796, "toxicity_nonhuman_race:0": 0.46067166328430176, "toxicity_nonhuman_race:1": 0.18072648346424103, "toxicity_nonhuman_race:2": 0.33836477994918823, "toxicity_nonhuman_race:3": 0.19598136842250824, "toxicity_nonhuman_race:4": 0.20567375421524048, "toxicity_nonhuman_wg": 0.18072648346424103, "main_metric": null}}
 
1
+ {"key": "vtab/caltech101", "dataset": "Caltech-101", "metrics": {"acc1": 0.08907148726376335, "acc5": 0.29268693508627774, "mean_per_class_recall": 0.11463334164319218, "main_metric": 0.11463334164319218}}
2
+ {"key": "cifar10", "dataset": "CIFAR-10", "metrics": {"acc1": 0.3084, "acc5": 0.8495, "mean_per_class_recall": 0.3084, "main_metric": 0.3084}}
3
+ {"key": "vtab/cifar100", "dataset": "CIFAR-100", "metrics": {"acc1": 0.0865, "acc5": 0.2652, "mean_per_class_recall": 0.08649999999999998, "main_metric": 0.0865}}
4
+ {"key": "vtab/clevr_count_all", "dataset": "CLEVR Counts", "metrics": {"acc1": 0.14653333333333332, "acc5": 0.6512666666666667, "mean_per_class_recall": 0.14421888891848736, "main_metric": 0.14653333333333332}}
5
+ {"key": "vtab/clevr_closest_object_distance", "dataset": "CLEVR Distance", "metrics": {"acc1": 0.2216, "acc5": 0.9186666666666666, "mean_per_class_recall": 0.17639399800927735, "main_metric": 0.2216}}
6
+ {"key": "country211", "dataset": "Country211", "metrics": {"acc1": 0.009146919431279621, "acc5": 0.0395260663507109, "mean_per_class_recall": 0.009146919431279621, "main_metric": 0.009146919431279621}}
7
+ {"key": "vtab/dtd", "dataset": "Describable Textures", "metrics": {"acc1": 0.034574468085106384, "acc5": 0.15691489361702127, "mean_per_class_recall": 0.034574468085106384, "main_metric": 0.034574468085106384}}
8
+ {"key": "vtab/eurosat", "dataset": "EuroSAT", "metrics": {"acc1": 0.14796296296296296, "acc5": 0.545, "mean_per_class_recall": 0.13936798445803253, "main_metric": 0.14796296296296296}}
9
+ {"key": "fgvc_aircraft", "dataset": "FGVC Aircraft", "metrics": {"acc1": 0.013801380138013802, "acc5": 0.0558055805580558, "mean_per_class_recall": 0.013627450980392157, "main_metric": 0.013627450980392157}}
10
+ {"key": "food101", "dataset": "Food-101", "metrics": {"acc1": 0.037504950495049504, "acc5": 0.13873267326732674, "mean_per_class_recall": 0.03750495049504951, "main_metric": 0.037504950495049504}}
11
+ {"key": "gtsrb", "dataset": "GTSRB", "metrics": {"acc1": 0.08012668250197942, "acc5": 0.2042755344418052, "mean_per_class_recall": 0.05879165590616551, "main_metric": 0.08012668250197942}}
12
+ {"key": "imagenet1k", "dataset": "ImageNet 1k", "metrics": {"acc1": 0.01682, "acc5": 0.06126, "mean_per_class_recall": 0.01682, "main_metric": 0.01682}}
13
+ {"key": "imagenet_sketch", "dataset": "ImageNet Sketch", "metrics": {"acc1": 0.006582955059050089, "acc5": 0.022932264340034193, "mean_per_class_recall": 0.0065882352941176465, "main_metric": 0.006582955059050089}}
14
+ {"key": "imagenetv2", "dataset": "ImageNet v2", "metrics": {"acc1": 0.0168, "acc5": 0.059, "mean_per_class_recall": 0.016800000000000002, "main_metric": 0.0168}}
15
+ {"key": "imagenet-a", "dataset": "ImageNet-A", "metrics": {"acc1": 0.011866666666666666, "acc5": 0.0548, "mean_per_class_recall": 0.016301863195214567, "main_metric": 0.011866666666666666}}
16
+ {"key": "imagenet-o", "dataset": "ImageNet-O", "metrics": {"acc1": 0.0695, "acc5": 0.196, "mean_per_class_recall": 0.05995914392624918, "main_metric": 0.0695}}
17
+ {"key": "imagenet-r", "dataset": "ImageNet-R", "metrics": {"acc1": 0.028, "acc5": 0.10296666666666666, "mean_per_class_recall": 0.027061858418896457, "main_metric": 0.028}}
18
+ {"key": "vtab/kitti_closest_vehicle_distance", "dataset": "KITTI Vehicle Distance", "metrics": {"acc1": 0.3459915611814346, "acc5": null, "mean_per_class_recall": 0.2470015623122221, "main_metric": 0.3459915611814346}}
19
+ {"key": "mnist", "dataset": "MNIST", "metrics": {"acc1": 0.0975, "acc5": 0.5423, "mean_per_class_recall": 0.0960082261746344, "main_metric": 0.0975}}
20
+ {"key": "objectnet", "dataset": "ObjectNet", "metrics": {"acc1": 0.024119737267147626, "acc5": 0.099601593625498, "mean_per_class_recall": 0.023947953085873885, "main_metric": 0.024119737267147626}}
21
+ {"key": "vtab/flowers", "dataset": "Oxford Flowers-102", "metrics": {"acc1": 0.016588063099691006, "acc5": 0.06700276467718329, "mean_per_class_recall": 0.0265842381438852, "main_metric": 0.0265842381438852}}
22
+ {"key": "vtab/pets", "dataset": "Oxford-IIIT Pet", "metrics": {"acc1": 0.04388116653038975, "acc5": 0.1837012810029981, "mean_per_class_recall": 0.04457820989286629, "main_metric": 0.04457820989286629}}
23
+ {"key": "voc2007", "dataset": "Pascal VOC 2007", "metrics": {"acc1": 0.18229166666666666, "acc5": 0.5980902777777778, "mean_per_class_recall": 0.1824151308224437, "main_metric": 0.18229166666666666}}
24
+ {"key": "vtab/pcam", "dataset": "PatchCamelyon", "metrics": {"acc1": 0.600372314453125, "acc5": null, "mean_per_class_recall": 0.6004799787831268, "main_metric": 0.600372314453125}}
25
+ {"key": "renderedsst2", "dataset": "Rendered SST2", "metrics": {"acc1": 0.46293245469522243, "acc5": null, "mean_per_class_recall": 0.46280433964449075, "main_metric": 0.46293245469522243}}
26
+ {"key": "vtab/resisc45", "dataset": "RESISC45", "metrics": {"acc1": 0.05253968253968254, "acc5": 0.18571428571428572, "mean_per_class_recall": 0.053880972331135715, "main_metric": 0.05253968253968254}}
27
+ {"key": "cars", "dataset": "Stanford Cars", "metrics": {"acc1": 0.011814450938937944, "acc5": 0.053475935828877004, "mean_per_class_recall": 0.011736419757423719, "main_metric": 0.011814450938937944}}
28
+ {"key": "stl10", "dataset": "STL-10", "metrics": {"acc1": 0.391125, "acc5": 0.906375, "mean_per_class_recall": 0.391125, "main_metric": 0.391125}}
29
+ {"key": "sun397", "dataset": "SUN397", "metrics": {"acc1": 0.048917740956654465, "acc5": 0.1517921179910624, "mean_per_class_recall": 0.031206639266060338, "main_metric": 0.048917740956654465}}
30
+ {"key": "vtab/svhn", "dataset": "SVHN", "metrics": {"acc1": 0.11266902274124155, "acc5": 0.4837507682851875, "mean_per_class_recall": 0.10249275162814339, "main_metric": 0.11266902274124155}}
31
+ {"key": "retrieval/flickr_1k_test_image_text_retrieval", "dataset": "Flickr", "metrics": {"image_retrieval_recall@1": 0.012199999764561653, "text_retrieval_recall@1": 0.014000000432133675, "image_retrieval_recall@5": 0.04500000178813934, "text_retrieval_recall@5": 0.05999999865889549, "image_retrieval_recall@10": 0.07320000231266022, "text_retrieval_recall@10": 0.0989999994635582, "mean_recall@1": 0.013100000098347664, "main_metric": 0.013100000098347664}}
32
+ {"key": "retrieval/mscoco_2014_5k_test_image_text_retrieval", "dataset": "MSCOCO", "metrics": {"image_retrieval_recall@1": 0.006477409042418003, "text_retrieval_recall@1": 0.013199999928474426, "image_retrieval_recall@5": 0.022790882736444473, "text_retrieval_recall@5": 0.036400001496076584, "image_retrieval_recall@10": 0.040903639048337936, "text_retrieval_recall@10": 0.05900000035762787, "mean_recall@1": 0.009838704485446215, "main_metric": 0.009838704485446215}}
33
+ {"key": "misc/winogavil", "dataset": "WinoGAViL", "metrics": {"avg_jaccard_score": 0.3655132780027532, "jaccard_score_5": 0.4148737373737374, "jaccard_score_6": 0.37626589872810173, "jaccard_score_10": 0.29029733959311427, "jaccard_score_12": 0.25324877614597235, "jaccard_score_5-6": 0.39507813461301833, "jaccard_score_10-12": 0.2717296754767481, "main_metric": 0.2717296754767481}}
34
+ {"key": "wilds/iwildcam", "dataset": "iWildCam", "metrics": {"acc1": 0.0009114066041924704, "acc5": 0.010072211446332172, "mean_per_class_recall": 0.0028767519503264142, "acc_avg": 0.000911406590603292, "recall-macro_all": 0.0028767519503264142, "F1-macro_all": 0.0003926264709218053, "main_metric": 0.0003926264709218053}}
35
+ {"key": "wilds/camelyon17", "dataset": "Camelyon17", "metrics": {"acc1": 0.7119829755214334, "acc5": null, "mean_per_class_recall": 0.7119829755214335, "acc_avg": 0.7119829654693604, "acc_slide:0": NaN, "count_slide:0": 0.0, "acc_slide:1": NaN, "count_slide:1": 0.0, "acc_slide:2": NaN, "count_slide:2": 0.0, "acc_slide:3": NaN, "count_slide:3": 0.0, "acc_slide:4": NaN, "count_slide:4": 0.0, "acc_slide:5": NaN, "count_slide:5": 0.0, "acc_slide:6": NaN, "count_slide:6": 0.0, "acc_slide:7": NaN, "count_slide:7": 0.0, "acc_slide:8": NaN, "count_slide:8": 0.0, "acc_slide:9": NaN, "count_slide:9": 0.0, "acc_slide:10": NaN, "count_slide:10": 0.0, "acc_slide:11": NaN, "count_slide:11": 0.0, "acc_slide:12": NaN, "count_slide:12": 0.0, "acc_slide:13": NaN, "count_slide:13": 0.0, "acc_slide:14": NaN, "count_slide:14": 0.0, "acc_slide:15": NaN, "count_slide:15": 0.0, "acc_slide:16": NaN, "count_slide:16": 0.0, "acc_slide:17": NaN, "count_slide:17": 0.0, "acc_slide:18": NaN, "count_slide:18": 0.0, "acc_slide:19": NaN, "count_slide:19": 0.0, "acc_slide:20": 0.6506561636924744, "count_slide:20": 3810.0, "acc_slide:21": 0.44450458884239197, "count_slide:21": 3694.0, "acc_slide:22": 0.8319001197814941, "count_slide:22": 7210.0, "acc_slide:23": 0.6815431118011475, "count_slide:23": 5288.0, "acc_slide:24": 0.4913938045501709, "count_slide:24": 7727.0, "acc_slide:25": 0.5378403067588806, "count_slide:25": 4334.0, "acc_slide:26": 0.5507208108901978, "count_slide:26": 3815.0, "acc_slide:27": 0.4931957721710205, "count_slide:27": 4556.0, "acc_slide:28": 0.8580525517463684, "count_slide:28": 31878.0, "acc_slide:29": 0.7067179679870605, "count_slide:29": 12742.0, "acc_wg": 0.44450458884239197, "main_metric": 0.7119829755214334}}
36
+ {"key": "wilds/fmow", "dataset": "FMoW", "metrics": {"acc1": 0.020671250226162476, "acc5": 0.08983173511850914, "mean_per_class_recall": 0.020711872098722436, "acc_avg": 0.02067125029861927, "acc_year:0": NaN, "count_year:0": 0.0, "acc_year:1": NaN, "count_year:1": 0.0, "acc_year:2": NaN, "count_year:2": 0.0, "acc_year:3": NaN, "count_year:3": 0.0, "acc_year:4": NaN, "count_year:4": 0.0, "acc_year:5": NaN, "count_year:5": 0.0, "acc_year:6": NaN, "count_year:6": 0.0, "acc_year:7": NaN, "count_year:7": 0.0, "acc_year:8": NaN, "count_year:8": 0.0, "acc_year:9": NaN, "count_year:9": 0.0, "acc_year:10": NaN, "count_year:10": 0.0, "acc_year:11": NaN, "count_year:11": 0.0, "acc_year:12": NaN, "count_year:12": 0.0, "acc_year:13": NaN, "count_year:13": 0.0, "acc_year:14": 0.019675418734550476, "count_year:14": 15959.0, "acc_year:15": 0.023255813866853714, "count_year:15": 6149.0, "acc_worst_year": 0.019675418734550476, "acc_region:0": 0.0334475114941597, "count_region:0": 4963.0, "acc_region:1": 0.01997268758714199, "count_region:1": 5858.0, "acc_region:2": 0.016197454184293747, "count_region:2": 2593.0, "acc_region:3": 0.014456629753112793, "count_region:3": 8024.0, "acc_region:4": 0.024024024605751038, "count_region:4": 666.0, "acc_region:5": 0.0, "count_region:5": 4.0, "acc_worst_region": 0.0, "main_metric": 0.0}}
37
+ {"key": "fairness/dollar_street", "dataset": "Dollar Street", "metrics": {"acc1": 0.06936911218955182, "acc5": 0.25920639451898375, "mean_per_class_recall": 0.07343197652187794, "acc_top5_avg": 0.2592063844203949, "acc_top5_income_ds:0": 0.2067756950855255, "count_income_ds:0": 856.0, "acc_top5_income_ds:1": 0.22850678861141205, "count_income_ds:1": 884.0, "acc_top5_income_ds:2": 0.2830188572406769, "count_income_ds:2": 901.0, "acc_top5_income_ds:3": 0.31786543130874634, "count_income_ds:3": 862.0, "acc_top5_wg": 0.2067756950855255, "main_metric": 0.2067756950855255}}
38
+ {"key": "fairness/geode", "dataset": "GeoDE", "metrics": {"acc1": 0.18842088404868673, "acc5": 0.493193465727098, "mean_per_class_recall": 0.18469855163341742, "acc_avg": 0.1884208768606186, "acc_region:0": 0.18079331517219543, "count_region:0": 2395.0, "acc_region:1": 0.1880597025156021, "count_region:1": 2010.0, "acc_region:2": 0.17968015372753143, "count_region:2": 2126.0, "acc_region:3": 0.1807909607887268, "count_region:3": 1947.0, "acc_region:4": 0.20432555675506592, "count_region:4": 1757.0, "acc_region:5": 0.19928982853889465, "count_region:5": 2253.0, "acc_wg": 0.17968015372753143, "main_metric": 0.17968015372753143}}
39
+ {"key": "fairness/fairface", "dataset": "FairFace", "metrics": {"acc_race_avg": 0.6680664420127869, "acc_race_race_binary:0": 0.3505995273590088, "count_race_binary:0": 2085.0, "acc_race_race_binary:1": 0.7426992654800415, "count_race_binary:1": 8869.0, "acc_race_wg": 0.3505995273590088, "acc_gender_avg": 0.5340514779090881, "acc_gender_race_binary:0": 0.5112709999084473, "acc_gender_race_binary:1": 0.5394068956375122, "acc_gender_wg": 0.5112709999084473, "acc_age_avg": 0.12561620771884918, "acc_age_race_binary:0": 0.11894484609365463, "acc_age_race_binary:1": 0.12718456983566284, "acc_age_wg": 0.11894484609365463, "acc_gender_x_avg": 0.5340514779090881, "acc_gender_x_race:0_gender:0": 0.41677096486091614, "count_race:0_gender:0": 799.0, "acc_gender_x_race:0_gender:1": 0.7040951251983643, "count_race:0_gender:1": 757.0, "acc_gender_x_race:1_gender:0": 0.23618538677692413, "count_race:1_gender:0": 1122.0, "acc_gender_x_race:1_gender:1": 0.8317757248878479, "count_race:1_gender:1": 963.0, "acc_gender_x_race:2_gender:0": 0.3638778328895569, "count_race:2_gender:0": 753.0, "acc_gender_x_race:2_gender:1": 0.7758846879005432, "count_race:2_gender:1": 763.0, "acc_gender_x_race:3_gender:0": 0.24968473613262177, "count_race:3_gender:0": 793.0, "acc_gender_x_race:3_gender:1": 0.8518072366714478, "count_race:3_gender:1": 830.0, "acc_gender_x_race:4_gender:0": 0.2964329719543457, "count_race:4_gender:0": 813.0, "acc_gender_x_race:4_gender:1": 0.7803030014038086, "count_race:4_gender:1": 396.0, "acc_gender_x_race:5_gender:0": 0.2857142984867096, "count_race:5_gender:0": 735.0, "acc_gender_x_race:5_gender:1": 0.7985293865203857, "count_race:5_gender:1": 680.0, "acc_gender_x_race:6_gender:0": 0.24453024566173553, "count_race:6_gender:0": 777.0, "acc_gender_x_race:6_gender:1": 0.8460543155670166, "count_race:6_gender:1": 773.0, "acc_gender_x_wg": 0.23618538677692413, "toxicity_crime_avg": 0.04345444589853287, "toxicity_crime_race:0": 0.025064267218112946, "count_race:0": 1556.0, "toxicity_crime_race:1": 0.05659472569823265, "count_race:1": 2085.0, "toxicity_crime_race:2": 0.028364116325974464, "count_race:2": 1516.0, "toxicity_crime_race:3": 0.040049292147159576, "count_race:3": 1623.0, "toxicity_crime_race:4": 0.0603804811835289, "count_race:4": 1209.0, "toxicity_crime_race:5": 0.0494699664413929, "count_race:5": 1415.0, "toxicity_crime_race:6": 0.043870966881513596, "count_race:6": 1550.0, "toxicity_crime_wg": 0.025064267218112946, "toxicity_nonhuman_avg": 0.28701844811439514, "toxicity_nonhuman_race:0": 0.39652955532073975, "toxicity_nonhuman_race:1": 0.2139088660478592, "toxicity_nonhuman_race:2": 0.3588390648365021, "toxicity_nonhuman_race:3": 0.23351818323135376, "toxicity_nonhuman_race:4": 0.2423490434885025, "toxicity_nonhuman_race:5": 0.32438161969184875, "toxicity_nonhuman_race:6": 0.2619354724884033, "toxicity_nonhuman_wg": 0.2139088660478592, "main_metric": null}}
40
+ {"key": "fairness/utkface", "dataset": "UTKFace", "metrics": {"acc_race_avg": 0.5487490892410278, "acc_race_race_binary:0": 0.5891226530075073, "count_race_binary:0": 10076.0, "acc_race_race_binary:1": 0.5188962817192078, "count_race_binary:1": 13627.0, "acc_race_wg": 0.5188962817192078, "acc_gender_avg": 0.5260093808174133, "acc_gender_race_binary:0": 0.4954347014427185, "acc_gender_race_binary:1": 0.5486167073249817, "acc_gender_wg": 0.4954347014427185, "acc_age_avg": 0.16571742296218872, "acc_age_race_binary:0": 0.16603811085224152, "acc_age_race_binary:1": 0.16548030078411102, "acc_age_wg": 0.16548030078411102, "acc_gender_x_avg": 0.5260093808174133, "acc_gender_x_race:0_gender:0": 0.3878343403339386, "count_race:0_gender:0": 2318.0, "acc_gender_x_race:0_gender:1": 0.7359601259231567, "count_race:0_gender:1": 2208.0, "acc_gender_x_race:1_gender:0": 0.17841489613056183, "count_race:1_gender:0": 5476.0, "acc_gender_x_race:1_gender:1": 0.872826099395752, "count_race:1_gender:1": 4600.0, "acc_gender_x_race:2_gender:0": 0.297213613986969, "count_race:2_gender:0": 2261.0, "acc_gender_x_race:2_gender:1": 0.8203033804893494, "count_race:2_gender:1": 1714.0, "acc_gender_x_race:3_gender:0": 0.1631745994091034, "count_race:3_gender:0": 1575.0, "acc_gender_x_race:3_gender:1": 0.873587965965271, "count_race:3_gender:1": 1859.0, "acc_gender_x_race:4_gender:0": 0.23026315867900848, "count_race:4_gender:0": 760.0, "acc_gender_x_race:4_gender:1": 0.8776823878288269, "count_race:4_gender:1": 932.0, "acc_gender_x_wg": 0.1631745994091034, "toxicity_crime_avg": 0.03434164449572563, "toxicity_crime_race:0": 0.03336279094219208, "count_race:0": 4526.0, "toxicity_crime_race:1": 0.03582771122455597, "count_race:1": 10076.0, "toxicity_crime_race:2": 0.03597484156489372, "count_race:2": 3975.0, "toxicity_crime_race:3": 0.027664531022310257, "count_race:3": 3434.0, "toxicity_crime_race:4": 0.03782505914568901, "count_race:4": 1692.0, "toxicity_crime_wg": 0.027664531022310257, "toxicity_nonhuman_avg": 0.19225414097309113, "toxicity_nonhuman_race:0": 0.3406981825828552, "toxicity_nonhuman_race:1": 0.13656212389469147, "toxicity_nonhuman_race:2": 0.24553458392620087, "toxicity_nonhuman_race:3": 0.12929528951644897, "toxicity_nonhuman_race:4": 0.12943261861801147, "toxicity_nonhuman_wg": 0.12929528951644897, "main_metric": null}}
small_scale/samples/{arxiv.jsonl β†’ arxiv/1be0454f004e49d5e5ea44116044abb2.parquet} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9dc69bb32ce9ee9c30ff8c0bb9017d363e3fad85335b3248f2e0a1c046b2ca2a
3
- size 379847746
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25b6ff3a0728fc6c206f487a00c49579f612657a70723b88e017cb5615214b5b
3
+ size 213324191
small_scale/samples/{no_filter.npy β†’ arxiv/decontaminated.npy} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:facd8ecea95f2b48c8e75908f6d96fc6b741ff789b87a9a0f9a284dea417fa8c
3
- size 204800128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f647feade4f1e234c7dce1ef34220988cb5646e81596d7e49a2c8f0e0ee29b22
3
+ size 17878160
small_scale/samples/{pmc.jsonl β†’ pmc/ae4720b4a144e9e536c3776ebb756a31.parquet} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cbdc1738aea30d6b2c9cfdf538b9cf805dac68db5a9b60aaa305483840a72414
3
- size 416971085
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dbc253686e7e2871681b5d43d5ef462f01f1c7bc0fd06deb2a420c56928ca3f
3
+ size 209834912
small_scale/samples/pmc/decontaminated.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cbffb5cd769ffa3e0c18fb6e8d0109447076b8d66ec2657fae5e3f5e2a20dd1
3
+ size 12269808